@@ -98,6 +98,7 @@ def load_pretrained_block(
set_module_tensor_to_device(block, param_name, "cpu", value=param, dtype=param.dtype)
logger.info(f"Loaded {model_name} block {block_index}")
+ print(block.self_attn.q_proj.weight)
return block