Abhinav Kulkarni
committed on
Commit
•
dc71fb8
1
Parent(s):
b2ff941
Updated README
Browse files
README.md
CHANGED
@@ -68,6 +68,7 @@ with init_empty_weights():
|
|
68 |
torch_dtype=torch.float16, trust_remote_code=True)
|
69 |
|
70 |
real_quantize_model_weight(model, w_bit=w_bit, q_config=q_config, init_only=True)
|
|
|
71 |
|
72 |
model = load_checkpoint_and_dispatch(model, load_quant, device_map="balanced")
|
73 |
|
|
|
68 |
torch_dtype=torch.float16, trust_remote_code=True)
|
69 |
|
70 |
real_quantize_model_weight(model, w_bit=w_bit, q_config=q_config, init_only=True)
|
71 |
+
model.tie_weights()
|
72 |
|
73 |
model = load_checkpoint_and_dispatch(model, load_quant, device_map="balanced")
|
74 |
|