We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 04d84fe · commit be62d32 (Copy full SHA for be62d32)
scripts/inference.py
@@ -394,9 +394,9 @@ def select_int8_module(
394
395
if args.int8_smoothquant:
396
# TODO: consider saving this info into config during quantization
397
- if any("granite" in p for p in [args.model_path, args.architecture]):
+ if any("granite" in p.lower() for p in [args.model_path, args.architecture]):
398
smoothquant_layers = ["key", "value", "w1", "wg"]
399
- elif any("roberta" in p for p in [args.model_path, args.architecture]):
+ elif any("roberta" in p.lower() for p in [args.model_path, args.architecture]):
400
smoothquant_layers = ["query", "key", "value", "w1"]
401
else:
402
raise NotImplementedError(
0 commit comments