Batcher added
This commit is contained in:
@@ -31,7 +31,7 @@ class TokeNanoCore:
|
||||
def vocabulary_size(self):
|
||||
BPE_VOC_SIZE = self.__bpe_encoder.vocabulary_size
|
||||
SPECIAL_VOC_SIZE = self.__special_encoder.vocabulary_size
|
||||
return BPE_VOC_SIZE + SPECIAL_VOC_SIZE
|
||||
return BPE_VOC_SIZE + SPECIAL_VOC_SIZE + 1
|
||||
|
||||
def encode(self, corpus: str) -> list[int]:
|
||||
output: list[int] = []
|
||||
|
||||
Reference in New Issue
Block a user