dicta-il
/

dictabert-joint

Feature Extraction

text-embeddings-inference

Model card · Files and versions

Shaltiel committed on Oct 15, 2024

Commit

8c81f2a

·

verified ·

1 Parent(s): e68d30b

Update BertForMorphTagging.py

Files changed (1) hide show

BertForMorphTagging.py +2 -0

BertForMorphTagging.py CHANGED Viewed

@@ -177,6 +177,8 @@ def parse_logits(input_ids: List[List[int]], sentences: List[str], tokenizer: Be
     #       { pos: str, feats: dict, prefixes: List[str], suffix: str | bool, suffix_feats: dict | None}
     special_toks = tokenizer.all_special_tokens
     special_toks.remove(tokenizer.unk_token)
     ret = []
     for sent_idx,sentence in enumerate(sentences):
         input_id_strs = tokenizer.convert_ids_to_tokens(input_ids[sent_idx])

     #       { pos: str, feats: dict, prefixes: List[str], suffix: str | bool, suffix_feats: dict | None}
     special_toks = tokenizer.all_special_tokens
     special_toks.remove(tokenizer.unk_token)
+    special_toks.remove(tokenizer.mask_token)
     ret = []
     for sent_idx,sentence in enumerate(sentences):
         input_id_strs = tokenizer.convert_ids_to_tokens(input_ids[sent_idx])