File tree Expand file tree Collapse file tree 1 file changed +6
-3
lines changed Expand file tree Collapse file tree 1 file changed +6
-3
lines changed Original file line number Diff line number Diff line change @@ -112,9 +112,12 @@ def _get_tokenizer(self, max_length: int = 512) -> Tokenizer:
112
112
Returns:
113
113
Tokenizer: Configured tokenizer for text processing.
114
114
"""
115
- config = json .load (open (str (self .model_dir / "config.json" )))
116
- tokenizer_config = json .load (open (str (self .model_dir / "tokenizer_config.json" )))
117
- tokens_map = json .load (open (str (self .model_dir / "special_tokens_map.json" )))
115
+ with open (str (self .model_dir / "config.json" )) as config_file :
116
+ config = json .load (config_file )
117
+ with open (str (self .model_dir / "tokenizer_config.json" )) as tokenizer_config_file :
118
+ tokenizer_config = json .load (tokenizer_config_file )
119
+ with open (str (self .model_dir / "special_tokens_map.json" )) as tokens_map_file :
120
+ tokens_map = json .load (tokens_map_file )
118
121
tokenizer = Tokenizer .from_file (str (self .model_dir / "tokenizer.json" ))
119
122
120
123
tokenizer .enable_truncation (max_length = min (tokenizer_config ["model_max_length" ], max_length ))
You can’t perform that action at this time.
0 commit comments