File tree Expand file tree Collapse file tree 2 files changed +16
-1
lines changed Expand file tree Collapse file tree 2 files changed +16
-1
lines changed Original file line number Diff line number Diff line change @@ -187,7 +187,7 @@ def process_result_tokens(
187
187
slot_valid = slot_data .valid
188
188
slot_lengths = slot_data .lengths
189
189
samples , speculations = slot_tokens .shape
190
- stop_tokens = [ tokenizer .eos_id , tokenizer . pad_id ]
190
+ stop_tokens = tokenizer .stop_tokens
191
191
# Stop anything which has reached its max length.
192
192
complete = complete | (slot_lengths > slot_max_length )
193
193
if debug :
@@ -349,6 +349,11 @@ def bos_id(self) -> int:
349
349
"""ID of the BOS token."""
350
350
return self .vocab .bos_id
351
351
352
+ @property
353
+ def stop_tokens (self ) -> set [int ]:
354
+ """ID of the stop token."""
355
+ return {self .eos_id , self .pad_id }
356
+
352
357
353
358
class TikToken (tokenizer_api .Tokenizer ):
354
359
"""Tokenizer to convert strings to token ids and vice-versa."""
@@ -394,6 +399,11 @@ def decode(self, token_ids: list[int]) -> str:
394
399
str: String generated from the token ids.
395
400
"""
396
401
return self .tokenizer .decode (token_ids )
402
+
403
+ @property
404
+ def stop_tokens (self ) -> set [int ]:
405
+ """ID of the stop token."""
406
+ return self .tokenizer .stop_tokens
397
407
398
408
@property
399
409
def pad_id (self ) -> int :
Original file line number Diff line number Diff line change @@ -65,3 +65,8 @@ def eos_id(self) -> int:
65
65
@abc .abstractmethod
66
66
def bos_id (self ) -> int :
67
67
"""ID of BOS token."""
68
+
69
+ @property
70
+ def stop_tokens (self ) -> set [int ]:
71
+ """ID of the stop token."""
72
+ return {self .eos_id , self .pad_id }
You can’t perform that action at this time.
0 commit comments