Thanks for visiting codestin.com
Credit goes to github.com

Skip to content

Commit a0cdff3

Browse files
authored
[chatglm] set default max_seq_length to 2048 (PaddlePaddle#5970)
* set max_seq_length to 2048
* Add THUDM/chatglm-6b-v1.1
* Add chatglm v1.1 config
1 parent 3642ec5 commit a0cdff3

4 files changed

Lines changed: 13 additions & 6 deletions

File tree

paddlenlp/taskflow/taskflow.py

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -473,8 +473,12 @@
473473
"task_class": ChatGLMTask,
474474
"task_flag": "text_generation-tiny-random-chatglm",
475475
},
476+
"THUDM/chatglm-6b-v1.1": {
477+
"task_class": ChatGLMTask,
478+
"task_flag": "text_generation-THUDM/chatglm-6b-v1.1",
479+
},
476480
},
477-
"default": {"model": "THUDM/chatglm-6b"},
481+
"default": {"model": "THUDM/chatglm-6b-v1.1"},
478482
},
479483
"zero_shot_text_classification": {
480484
"models": {
@@ -727,6 +731,7 @@
727731
"__internal_testing__/tiny-random-uie-m",
728732
"__internal_testing__/tiny-random-uie-x",
729733
"THUDM/chatglm-6b",
734+
"THUDM/chatglm-6b-v1.1",
730735
]
731736

732737

paddlenlp/taskflow/text2text_generation.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -35,9 +35,9 @@ def __init__(self, task, model, **kwargs):
3535
self._static_mode = False
3636
self._dtype = kwargs.get("dtype", "float16")
3737
self.kwargs["generation_task"] = task
38-
self._tgt_length = kwargs.get("tgt_length", 128)
38+
self._tgt_length = kwargs.get("tgt_length", 2048)
3939
# Token max length
40-
self._max_seq_length = kwargs.get("max_seq_length", 128)
40+
self._max_seq_length = kwargs.get("max_seq_length", 2048)
4141
self._top_k = kwargs.get("top_k", 1)
4242
self._top_p = kwargs.get("top_p", 1.0)
4343
self._temperature = kwargs.get("temperature", 1.0)

paddlenlp/transformers/chatglm/configuration.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,8 @@
2424

2525
CHATGLM_PRETRAINED_RESOURCE_FILES_MAP = {
2626
"model_state": {
27-
"THUDM/chatglm-6b": "https://paddlenlp.bj.bcebos.com/models/community/THUDM/chatglm-6b/model_state.pdparams"
27+
"THUDM/chatglm-6b": "https://paddlenlp.bj.bcebos.com/models/community/THUDM/chatglm-6b/model_state.pdparams",
28+
"THUDM/chatglm-6b-v1.1": "https://paddlenlp.bj.bcebos.com/models/community/THUDM/chatglm-6b-v1.1/model_state.pdparams",
2829
}
2930
}
3031

paddlenlp/transformers/chatglm/tokenizer.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -165,11 +165,12 @@ class ChatGLMTokenizer(PretrainedTokenizer):
165165
"""
166166

167167
resource_files_names = {"vocab_file": "ice_text.model"}
168-
max_model_input_sizes = {"THUDM/chatglm-6b": 2048}
168+
max_model_input_sizes = {"THUDM/chatglm-6b": 2048, "THUDM/chatglm-6b-v1.1": 2048}
169169
model_input_names = ["input_ids", "attention_mask", "position_ids"]
170170
pretrained_resource_files_map = {
171171
"model_file": {
172-
"THUDM/chatglm-6b": "https://paddlenlp.bj.bcebos.com/models/community/THUDM/chatglm-6b/ice_text.model"
172+
"THUDM/chatglm-6b": "https://paddlenlp.bj.bcebos.com/models/community/THUDM/chatglm-6b/ice_text.model",
173+
"THUDM/chatglm-6b-v1.1": "https://paddlenlp.bj.bcebos.com/models/community/THUDM/chatglm-6b-v1.1/ice_text.model",
173174
}
174175
}
175176

0 commit comments

Comments
(0)