stanrom committed on
Commit
c3b6e57
·
verified ·
1 Parent(s): ffc8e21

Update tokenization_InternLM_XComposer.py

Browse files
Files changed (1) hide show
  1. tokenization_InternLM_XComposer.py +2 -1
tokenization_InternLM_XComposer.py CHANGED
@@ -70,12 +70,13 @@ class InternLMXComposerTokenizer(PreTrainedTokenizer):
70
  pad_token=pad_token,
71
  clean_up_tokenization_spaces=clean_up_tokenization_spaces,
72
  **kwargs,
 
73
  )
74
  self.vocab_file = vocab_file
75
  self.add_bos_token = add_bos_token
76
  self.add_eos_token = add_eos_token
77
  self.decode_with_prefix_space = decode_with_prefix_space
78
- self.sp_model = spm.SentencePieceProcessor(**self.sp_model_kwargs)
79
  self.sp_model.Load(vocab_file)
80
  self._no_prefix_space_tokens = None
81
 
 
70
  pad_token=pad_token,
71
  clean_up_tokenization_spaces=clean_up_tokenization_spaces,
72
  **kwargs,
73
+ self.sp_model = spm.SentencePieceProcessor(**self.sp_model_kwargs),
74
  )
75
  self.vocab_file = vocab_file
76
  self.add_bos_token = add_bos_token
77
  self.add_eos_token = add_eos_token
78
  self.decode_with_prefix_space = decode_with_prefix_space
79
+
80
  self.sp_model.Load(vocab_file)
81
  self._no_prefix_space_tokens = None
82