Skip to content

Commit 62b0c79

Browse files
Add eom_id to Llama3 Tokenizer (#1586)
1 parent be8f1e7 commit 62b0c79

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

torchtune/models/llama3/_tokenizer.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -98,8 +98,8 @@ def __init__(
         # Media tokens
         self.image_id = self.special_tokens["<|image|>"]
 
-        # During generation, stop when either eos_id or eot_id is encountered
-        self.stop_tokens = [self.eos_id, self.eot_id]
+        # During generation, stop when either eos_id, eot_id, or eom_id is encountered
+        self.stop_tokens = [self.eos_id, self.eot_id, self.eom_id]
 
         self.tt_model = TikTokenBaseTokenizer(
             path=path,

0 commit comments

Comments
 (0)