arxyzan committed on
Commit
681493a
1 Parent(s): 889f931

Update preprocessor/tokenizer_config.yaml

Browse files
Files changed (1) hide show
  1. preprocessor/tokenizer_config.yaml +4 -2
preprocessor/tokenizer_config.yaml CHANGED
@@ -1,7 +1,9 @@
1
  name: bpe_tokenizer
2
  config_type: preprocessor
3
- truncation_strategy: no_truncation
4
- padding_strategy: no_padding
 
 
5
  pad_token_id: 0
6
  pad_token: <pad>
7
  continuing_subword_prefix: ''
 
1
  name: bpe_tokenizer
2
  config_type: preprocessor
3
+ truncation_strategy: longest_first
4
+ truncation_direction: right
5
+ padding_strategy: longest
6
+ padding_direction: right
7
  pad_token_id: 0
8
  pad_token: <pad>
9
  continuing_subword_prefix: ''