Update eos token id

This commit is contained in:
Daya Guo 2024-02-02 10:42:46 +08:00 committed by GitHub
parent 9d2c23c96d
commit 5ca49c93b1
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -135,8 +135,8 @@ messages=[
{ 'role': 'user', 'content': "write a quick sort algorithm in python."} { 'role': 'user', 'content': "write a quick sort algorithm in python."}
] ]
inputs = tokenizer.apply_chat_template(messages, add_generation_prompt=True, return_tensors="pt").to(model.device) inputs = tokenizer.apply_chat_template(messages, add_generation_prompt=True, return_tensors="pt").to(model.device)
# 32021 is the id of <|EOT|> token # tokenizer.eos_token_id is the id of <|EOT|> token
outputs = model.generate(inputs, max_new_tokens=512, do_sample=False, top_k=50, top_p=0.95, num_return_sequences=1, eos_token_id=32021) outputs = model.generate(inputs, max_new_tokens=512, do_sample=False, top_k=50, top_p=0.95, num_return_sequences=1, eos_token_id=tokenizer.eos_token_id)
print(tokenizer.decode(outputs[0][len(inputs[0]):], skip_special_tokens=True)) print(tokenizer.decode(outputs[0][len(inputs[0]):], skip_special_tokens=True))
``` ```
This code will output the following result: This code will output the following result: