about | summary | refs | log | tree | commit | diff | stats | homepage
path: root/src
diff options
context:
space:
mode:
author HsiangNianian <i@jyunko.cn> 2026-01-05 14:33:10 +0800
committer HsiangNianian <i@jyunko.cn> 2026-01-05 14:33:10 +0800
commit df94eb6c125279a9c32bc85de8633371d50afbed (patch)
tree fa7e99e5078bbcb62e7b9dcc181f4fbc282129c4 /src
parent 25380fb4de77966a0f3d00681be25857c27b0869 (diff)
download base-model-df94eb6c125279a9c32bc85de8633371d50afbed.tar.gz
base-model-df94eb6c125279a9c32bc85de8633371d50afbed.zip
feat: update max_length parameter for TRPGParser and onnx_infer to improve text parsing capabilities
Diffstat (limited to 'src')
-rw-r--r-- src/base_model_trpgner/inference/__init__.py 6
1 files changed, 3 insertions, 3 deletions
diff --git a/src/base_model_trpgner/inference/__init__.py b/src/base_model_trpgner/inference/__init__.py
index 3d1d720..41f3504 100644
--- a/src/base_model_trpgner/inference/__init__.py
+++ b/src/base_model_trpgner/inference/__init__.py
@@ -214,13 +214,13 @@ class TRPGParser:
9: "B-timestamp", 10: "I-timestamp",
}
- def parse(self, text: str) -> Dict[str, Any]:
+ def parse(self, text: str, max_length: int = 512) -> Dict[str, Any]:
"""
解析单条 TRPG 日志
Args:
text: 待解析的日志文本
-
+ max_length: 最大序列长度,大小512以内
Returns:
包含 metadata 和 content 的字典
- metadata: speaker, timestamp
@@ -239,7 +239,7 @@ class TRPGParser:
return_offsets_mapping=True,
padding="max_length",
truncation=True,
- max_length=128,
+ max_length=max_length or 512,
)
# 推理