5
0
vahe1994 1 жил өмнө
parent
commit
a95f52be81

+ 2 - 1
src/petals/server/from_pretrained.py

@@ -57,7 +57,8 @@ def load_pretrained_block(
         block = get_model_block(config, layer_idx=block_index)
 
     block_prefix = f"{config.block_prefix}.{block_index}."
-
+    print(config)
+    print(is_gptq_quant(config))
     if is_gptq_quant(config):
         print("Now loading GPTQ")
         hf_quantizer = AutoHfQuantizer.from_config(config.quantization_config, pre_quantized=True)