|
layer_fp32, {torch.nn.Linear: qconfig}, dtype=torch.qint8, inplace=True
|
|
layer_fp32, {torch.nn.Linear: qconfig}, dtype=torch.qint8, inplace=True
|
|
torch.save(layer_quantized.state_dict(), os.path.join(args.output_path, f"block_{i}_qint8.pth"))
|
|
torch.save(layer_quantized.state_dict(), os.path.join(args.output_path, f"block_{i}_qint8.pth"))
|