Skip to content

Commit cde42c8

Browse files
authored
ty test
1 parent 892e3c3 commit cde42c8

2 files changed

Lines changed: 16 additions & 8 deletions

File tree

convert_hf_to_gguf.py

Lines changed: 9 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -45,9 +45,9 @@
4545
_MISTRAL_COMMON_DATASET_STD = (0.26862954, 0.26130258, 0.27577711)
4646

4747
_mistral_common_installed = False
48-
TokenizerVersion = None
49-
Tekkenizer = None
50-
SentencePieceTokenizer = None
48+
TokenizerVersion: Any = None
49+
Tekkenizer: Any = None
50+
SentencePieceTokenizer: Any = None
5151
_mistral_import_error_msg = (
5252
"Mistral format requires `mistral-common` to be installed. Please run "
5353
"`pip install mistral-common[image,audio]` to install it."
@@ -220,7 +220,7 @@ def index_tensors(self, remote_hf_model_id: str | None = None) -> dict[str, Call
220220
if weight_map is None or not isinstance(weight_map, dict):
221221
raise ValueError(f"Can't load 'weight_map' from {index_name!r}")
222222
tensor_names_from_index.update(weight_map.keys())
223-
part_dict: dict[str, None] = dict.fromkeys(weight_map.values(), None)
223+
part_dict: dict[str, None] = dict.fromkeys(weight_map.values(), None) # ty: ignore[invalid-assignment]
224224
part_names = sorted(part_dict.keys())
225225
else:
226226
weight_map = {}
@@ -5878,7 +5878,7 @@ def set_vocab(self):
58785878
logger.error(f'Error: Missing {tokenizer_path}')
58795879
sys.exit(1)
58805880

5881-
sentencepiece_model = model.ModelProto() # pyright: ignore[reportAttributeAccessIssue]
5881+
sentencepiece_model = model.ModelProto() # pyright: ignore[reportAttributeAccessIssue] # ty: ignore[unresolved-attribute]
58825882
sentencepiece_model.ParseFromString(open(tokenizer_path, "rb").read())
58835883
add_prefix = sentencepiece_model.normalizer_spec.add_dummy_prefix
58845884

@@ -6199,7 +6199,7 @@ def _xlmroberta_set_vocab(self) -> None:
61996199

62006200
vocab_size = max(self.hparams.get("vocab_size", 0), tokenizer.vocab_size)
62016201
else:
6202-
sentencepiece_model = model.ModelProto() # pyright: ignore[reportAttributeAccessIssue]
6202+
sentencepiece_model = model.ModelProto() # pyright: ignore[reportAttributeAccessIssue] # ty: ignore[unresolved-attribute]
62036203
sentencepiece_model.ParseFromString(open(tokenizer_path, "rb").read())
62046204
assert sentencepiece_model.trainer_spec.model_type == 1 # UNIGRAM
62056205

@@ -8876,7 +8876,7 @@ def set_vocab(self):
88768876
if not tokenizer_path.is_file():
88778877
raise FileNotFoundError(f"File not found: {tokenizer_path}")
88788878

8879-
sentencepiece_model = model.ModelProto() # pyright: ignore[reportAttributeAccessIssue]
8879+
sentencepiece_model = model.ModelProto() # pyright: ignore[reportAttributeAccessIssue] # ty: ignore[unresolved-attribute]
88808880
sentencepiece_model.ParseFromString(open(tokenizer_path, "rb").read())
88818881

88828882
# some models like Pile-T5 family use BPE tokenizer instead of Unigram
@@ -9013,7 +9013,7 @@ def set_vocab(self):
90139013
if not tokenizer_path.is_file():
90149014
raise FileNotFoundError(f"File not found: {tokenizer_path}")
90159015

9016-
sentencepiece_model = model.ModelProto() # pyright: ignore[reportAttributeAccessIssue]
9016+
sentencepiece_model = model.ModelProto() # pyright: ignore[reportAttributeAccessIssue] # ty: ignore[unresolved-attribute]
90179017
sentencepiece_model.ParseFromString(open(tokenizer_path, "rb").read())
90189018

90199019
# some models like Pile-T5 family use BPE tokenizer instead of Unigram
@@ -12275,6 +12275,7 @@ def __torch_function__(cls, func, types, args=(), kwargs=None):
1227512275
kwargs = {}
1227612276

1227712277
if func is torch.Tensor.numpy:
12278+
assert len(args)
1227812279
return args[0].numpy()
1227912280

1228012281
return cls._wrap_fn(func)(*args, **kwargs)

ty.toml

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,7 @@
1+
[environment]
2+
extra-paths = ["./gguf-py", "./examples/model-conversion/scripts", "./tools/server/tests"]
3+
python-version = "3.10"
4+
5+
[rules]
6+
deprecated = "warn"
7+
unresolved-import = "ignore"

0 commit comments

Comments
 (0)