Update mz_gguf_loader.py
This commit is contained in:
parent
db23e2ecc0
commit
ce903c0384
@@ -27,6 +27,7 @@ def quantize_load_state_dict(model, state_dict, device="cpu", cublas_ops=False):
|
|||||||
setattr(model, "cublas_half_matmul", True)
|
setattr(model, "cublas_half_matmul", True)
|
||||||
print("Using cublas_ops")
|
print("Using cublas_ops")
|
||||||
except:
|
except:
|
||||||
|
print("Failed to load cublas_ops")
|
||||||
raise ImportError("Install cublas_ops (https://github.com/aredden/torch-cublas-hgemm) to use cublas_ops")
|
raise ImportError("Install cublas_ops (https://github.com/aredden/torch-cublas-hgemm) to use cublas_ops")
|
||||||
else:
|
else:
|
||||||
linear_ops = F.linear
|
linear_ops = F.linear
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user