
Commit 28a94e6

[wip] flux eval
Summary:
Test Plan:
Reviewers:
Subscribers:
Tasks:
Tags:

ghstack-source-id: 70a7b71
ghstack-comment-id: 3667066648
Pull-Request: #3502
1 parent 23a58c0 commit 28a94e6

File tree: 5 files changed, +590 −30 lines

.gitignore

Lines changed: 1 addition & 0 deletions
@@ -381,3 +381,4 @@ torchao/experimental/deps
 
 # local claude code files
 CLAUDE.local.md
+.claude

benchmarks/quantization/create_quantized_model.py

Lines changed: 1 addition & 30 deletions
@@ -9,36 +9,7 @@
 
 import torch
 from transformers import AutoModelForCausalLM, AutoTokenizer, TorchAoConfig
-
-from torchao.quantization import (
-    Float8DynamicActivationFloat8WeightConfig,
-    Float8DynamicActivationInt4WeightConfig,
-    Int4WeightOnlyConfig,
-    Int8DynamicActivationInt8WeightConfig,
-    Int8WeightOnlyConfig,
-    PerRow,
-)
-
-
-def string_to_config(s):
-    if s == "None":
-        return None
-    elif s == "float8_rowwise":
-        return Float8DynamicActivationFloat8WeightConfig(granularity=PerRow())
-    elif s == "int4_groupwise_weight_float8_rowwise_activation":
-        return Float8DynamicActivationInt4WeightConfig()
-    elif s == "int4_groupwise_hqq_weight_only":
-        return Int4WeightOnlyConfig(
-            group_size=32,
-            int4_packing_format="tile_packed_to_4d",
-            int4_choose_qparams_algorithm="hqq",
-        )
-    elif s == "int8_rowwise_weight_only":
-        return Int8WeightOnlyConfig()
-    elif s == "int8_rowwise":
-        return Int8DynamicActivationInt8WeightConfig()
-    else:
-        raise AssertionError(f"unsupported {s}")
+from utils import string_to_config
 
 
 def quantize_model_and_save(model_id, quant_config, output_dir):
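For orientation, here is a minimal sketch of how the relocated helper might be consumed by this script. It assumes string_to_config keeps the interface shown in the deleted code, and that quantize_model_and_save (whose body is not part of this hunk) wraps the resulting torchao config in transformers' TorchAoConfig and saves the quantized checkpoint; the model id, output path, and keyword arguments below are illustrative assumptions, not taken from the diff.

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer, TorchAoConfig

from utils import string_to_config  # helper this commit moves into utils


def quantize_model_and_save(model_id, quant_config, output_dir):
    # Hypothetical body: the diff only shows the signature.
    # Recent transformers versions accept a torchao AOBaseConfig object as quant_type.
    quantization_config = TorchAoConfig(quant_type=quant_config) if quant_config else None
    model = AutoModelForCausalLM.from_pretrained(
        model_id,
        torch_dtype=torch.bfloat16,
        device_map="cuda",
        quantization_config=quantization_config,
    )
    tokenizer = AutoTokenizer.from_pretrained(model_id)
    # torchao tensor subclasses are not safetensors-friendly, so save with
    # safe_serialization=False.
    model.save_pretrained(output_dir, safe_serialization=False)
    tokenizer.save_pretrained(output_dir)
    return model, tokenizer


if __name__ == "__main__":
    # "float8_rowwise" maps to Float8DynamicActivationFloat8WeightConfig(granularity=PerRow())
    quant_config = string_to_config("float8_rowwise")
    quantize_model_and_save("meta-llama/Llama-3.1-8B", quant_config, "llama-3.1-8b-float8-rowwise")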
