Skip to content

Commit 5f60250

Browse files
committed
Fix missing <|eom_id|> token in Llama 3 vocabulary.
1 parent 7c493df commit 5f60250

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

Llama3.java

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2045,7 +2045,7 @@ public ChatFormat(Tokenizer tokenizer) {
20452045
this.endHeader = specialTokens.get("<|end_header_id|>");
20462046
this.endOfTurn = specialTokens.get("<|eot_id|>");
20472047
this.endOfText = specialTokens.get("<|end_of_text|>");
2048-
this.endOfMessage = specialTokens.get("<|eom_id|>");
2048+
this.endOfMessage = specialTokens.getOrDefault("<|eom_id|>", -1); // only in 3.1
20492049
}
20502050

20512051
public Tokenizer getTokenizer() {

0 commit comments

Comments
 (0)