gokaygokay committed on
Commit
603fd34
1 Parent(s): a66f4c7

Update tokenization_InternLM_XComposer.py

Browse files
Files changed (1) hide show
  1. tokenization_InternLM_XComposer.py +2 -1
tokenization_InternLM_XComposer.py CHANGED
@@ -64,7 +64,7 @@ class InternLMXComposerTokenizer(PreTrainedTokenizer):
64
  ):
65
  self.sp_model_kwargs = {} if sp_model_kwargs is None else sp_model_kwargs
66
  self.sp_model = spm.SentencePieceProcessor(**self.sp_model_kwargs)
67
- self.sp_model.Load(vocab_file)
68
  super().__init__(
69
  bos_token=bos_token,
70
  eos_token=eos_token,
@@ -73,6 +73,7 @@ class InternLMXComposerTokenizer(PreTrainedTokenizer):
73
  clean_up_tokenization_spaces=clean_up_tokenization_spaces,
74
  **kwargs,
75
  )
 
76
  self.vocab_file = vocab_file
77
  self.add_bos_token = add_bos_token
78
  self.add_eos_token = add_eos_token
 
64
  ):
65
  self.sp_model_kwargs = {} if sp_model_kwargs is None else sp_model_kwargs
66
  self.sp_model = spm.SentencePieceProcessor(**self.sp_model_kwargs)
67
+
68
  super().__init__(
69
  bos_token=bos_token,
70
  eos_token=eos_token,
 
73
  clean_up_tokenization_spaces=clean_up_tokenization_spaces,
74
  **kwargs,
75
  )
76
+ self.sp_model.Load(vocab_file)
77
  self.vocab_file = vocab_file
78
  self.add_bos_token = add_bos_token
79
  self.add_eos_token = add_eos_token