@@ -410,8 +410,8 @@ def __init__(
410410 if self .verbose :
411411 print (f"Model metadata: { self .metadata } " , file = sys .stderr )
412412
413- eos_token_id = int ( self .metadata . get ( "tokenizer.ggml.eos_token_id" , self . token_eos ()) )
414- bos_token_id = int ( self .metadata . get ( "tokenizer.ggml.bos_token_id" , self . token_bos ()) )
413+ eos_token_id = self .token_eos ()
414+ bos_token_id = self .token_bos ()
415415
416416 eos_token = self ._model .token_get_text (eos_token_id )
417417 bos_token = self ._model .token_get_text (bos_token_id )
@@ -961,9 +961,9 @@ def _create_completion(
961961
962962 completion_id : str = f"cmpl-{ str (uuid .uuid4 ())} "
963963 created : int = int (time .time ())
964- prefix_token_id : int = int ( self .metadata . get ( "tokenizer.ggml.prefix_token_id" , self . _model .token_prefix ()) )
965- middle_token_id : int = int ( self .metadata . get ( "tokenizer.ggml.middle_token_id" , self . _model .token_middle ()) )
966- suffix_token_id : int = int ( self .metadata . get ( "tokenizer.ggml.suffix_token_id" , self . _model .token_suffix ()) )
964+ prefix_token_id : int = self ._model .token_prefix ()
965+ middle_token_id : int = self ._model .token_middle ()
966+ suffix_token_id : int = self ._model .token_suffix ()
967967 # If prompt is empty, initialize completion with BOS token to avoid
968968 # detokenization including a space at the beginning of the completion
969969 completion_tokens : List [int ] = [] if len (prompt ) > 0 else [self .token_bos ()]
0 commit comments