"""Print a one-line summary for every entry of a saved checkpoint.

The file at ``blob_path`` is loaded with ``torch.load`` and is expected to be
a mapping whose values expose the keys ``q_dtype``, ``original_shape`` and
``q_weight`` (the latter must have a ``.shape`` attribute). One aligned row is
printed per entry, followed by ``done.``.
"""
import torch

blob_path = "./llama-2-chat-7b_r0.8_g128.pth"

# NOTE(review): torch.load unpickles the file, which can execute arbitrary
# code; only point this script at checkpoints from a trusted source.
# map_location="cpu" lets the inspection run on machines without the device
# the tensors were saved from -- only metadata and shapes are read below.
blob = torch.load(blob_path, map_location="cpu")

for layer, attr in blob.items():
    # `!s` converts q_dtype to text before padding: objects that do not
    # implement __format__ with a spec (presumably torch.dtype here -- confirm
    # against the producer of the file) raise TypeError on a bare `:5`.
    print(
        f"{layer:30} | q_dtype: {attr['q_dtype']!s:5} | "
        f"orig. shape: {str(attr['original_shape']):15} | "
        f"quantized_shape: {str(attr['q_weight'].shape):15}"
    )

print("done.")