[Sync] Bump version 0.2.3 (#957)

This commit is contained in:
Fengzhe Zhou 2024-03-12 11:51:56 +08:00 committed by GitHub
parent 64fde73b15
commit ab6cdb2be8
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 11 additions and 9 deletions

View File

@@ -1 +1 @@
__version__ = '0.2.2'
__version__ = '0.2.3'

View File

@@ -175,6 +175,7 @@ class ChatInferencer(BaseInferencer):
temperature: Optional[float] = 0.0,
do_sample: Optional[bool] = False,
infer_mode: str = 'last',
max_out_len: int = 512,
**kwargs) -> None:
super().__init__(
model=model,
@@ -193,6 +194,7 @@ class ChatInferencer(BaseInferencer):
save_every = 1
self.save_every = save_every
self.dialogue_mode = False
self.max_out_len = max_out_len
def _set_meta_template(self, model):
origin = model.template_parser
@@ -334,8 +336,8 @@ class ChatInferencer(BaseInferencer):
]
history = chat[:assistant_indices[-1]]
output = self.model.generate_from_template([history],
max_out_len=512)[0]
output = self.model.generate_from_template(
[history], max_out_len=self.max_out_len)[0]
output_handler.save_results(
origin_prompt=history,
prediction=output,
@@ -356,11 +358,11 @@ class ChatInferencer(BaseInferencer):
[history],
do_sample=self.do_sample,
temperature=self.temperature,
max_out_len=512)[0]
max_out_len=self.max_out_len)[0]
else:
output = self.model.generate_from_template([history],
do_sample=False,
max_out_len=512)[0]
output = self.model.generate_from_template(
[history], do_sample=False,
max_out_len=self.max_out_len)[0]
chat[i]['content'] = output
if not self.dialogue_mode:
output_handler.save_multiround_results(
@@ -397,8 +399,8 @@ class ChatInferencer(BaseInferencer):
for i in assistant_indices:
history = chat[:i]
output = self.model.generate_from_template([history],
max_out_len=512)[0]
output = self.model.generate_from_template(
[history], max_out_len=self.max_out_len)[0]
output_handler.save_multiround_results(
origin_prompt=history[-1]['content'],
prediction=output,