We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent fbe7dfa, commit e76627b (Copy full SHA for e76627b)
convert.py
@@ -334,7 +334,10 @@ def load(model_plus: ModelPlus) -> Params:
334
class BpeVocab:
335
def __init__(self, fname_tokenizer: Path, fname_added_tokens: Path | None) -> None:
336
self.bpe_tokenizer = json.loads(open(str(fname_tokenizer), encoding="utf-8").read())
337
- self.vocab = self.bpe_tokenizer["model"]["vocab"]
+ try:
338
+ self.vocab = self.bpe_tokenizer["model"]["vocab"]
339
+ except:
340
+ self.vocab = self.bpe_tokenizer
341
added_tokens: dict[str, int]
342
if fname_added_tokens is not None:
343
# FIXME: Verify that added tokens here _cannot_ overlap with the main vocab.
0 commit comments