1 file changed: +2 -1 lines changed
fusedrug/data/tokenizer/ops: 1 file changed, +2 -1 lines changed
Columns: original file line number | diff line number | diff line change
@@ -193,6 +193,7 @@ def __call__(
193
193
on_unknown : Optional [str ] = "warn" ,
194
194
verbose : Optional [int ] = 1 ,
195
195
validate_ends_with_eos : Optional [bool ] = None ,
196
+ additional_caller_info_text : Optional [str ] = "" ,
196
197
) -> NDict :
197
198
"""_summary_
198
199
@@ -297,7 +298,7 @@ def __call__(
297
298
len (encoded .overflowing ) > 0
298
299
): # note, encoded.overflowing may have multiple items, and each item can contain multiple items
299
300
print (
300
- f"Warning: FastModularTokenizer (pid={ os .getpid ()} ) had to truncate sequence: [{ overflow_info } ] \
301
+ f"Warning: FastModularTokenizer (pid={ os .getpid ()} , { additional_caller_info_text } ) had to truncate sequence: [{ overflow_info } ] \
301
302
for tokenizer: { self ._tokenizer_path } for sample_id { get_sample_id (sample_dict )} "
302
303
)
303
304
You can’t perform that action at this time.
0 commit comments