
save non-transformer params separately

justheuristic · 3 years ago
commit 324ea2dc96
1 changed file with 4 additions and 0 deletions

+ 4 - 0
cli/quantize_for_cpu.py

@@ -47,3 +47,7 @@ if __name__ == "__main__":
             layer_fp32, {torch.nn.Linear: qconfig}, dtype=torch.qint8, inplace=True
         )
         torch.save(layer_quantized.state_dict(), os.path.join(args.output_path, f"block_{i}_qint8.pth"))
+
+    model.transformer.h = torch.nn.ModuleList()
+    torch.save(model.state_dict(), os.path.join(args.output_path, f"client.pth"))
+
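The change above saves each quantized transformer block on its own, then empties `model.transformer.h` so that only the non-transformer parameters (embeddings, norms, head) land in `client.pth`. A minimal runnable sketch of the same pattern follows; `ToyModel`, its embedding, and the output paths are illustrative assumptions, not the original script's definitions:

```python
import os
import tempfile

import torch

class ToyModel(torch.nn.Module):
    """Toy GPT-like layout: .transformer.h holds the blocks, .transformer.wte the embedding."""
    def __init__(self):
        super().__init__()
        self.transformer = torch.nn.Module()
        self.transformer.wte = torch.nn.Embedding(100, 16)  # stays with the client
        self.transformer.h = torch.nn.ModuleList(
            [torch.nn.Linear(16, 16) for _ in range(2)]  # blocks saved quantized
        )

model = ToyModel()
out_dir = tempfile.mkdtemp()

# Dynamically quantize each block's Linear layers to qint8 and save it separately.
for i, block in enumerate(model.transformer.h):
    quantized = torch.quantization.quantize_dynamic(
        block, {torch.nn.Linear}, dtype=torch.qint8
    )
    torch.save(quantized.state_dict(), os.path.join(out_dir, f"block_{i}_qint8.pth"))

# Drop the blocks, then save everything else (here just the embedding) for the client.
model.transformer.h = torch.nn.ModuleList()
torch.save(model.state_dict(), os.path.join(out_dir, "client.pth"))

client_state = torch.load(os.path.join(out_dir, "client.pth"))
print(sorted(client_state.keys()))  # no "transformer.h.*" keys remain
```

Emptying `transformer.h` before the final `torch.save` is what keeps the per-block checkpoints and the client checkpoint disjoint: the client file never duplicates block weights that are already stored in quantized form.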