Fix layer_name reference: append param_name when hf_quantizer is None

This commit is contained in:
Yu Li
2024-08-03 09:21:42 -05:00
parent 52893f1f34
commit b1e6311cc2
2 changed files with 2 additions and 2 deletions

View File

@@ -298,7 +298,7 @@ class AirLLMBaseModel(GenerationMixin):
layers = []
for param_name, param in state_dict.items():
if self.hf_quantizer is None:
-layers.append(layer_name)
+layers.append(param_name)
else:
if '.weight' in param_name:
layer_name = param_name[:param_name.index(".weight") + len(".weight")]

View File

@@ -5,7 +5,7 @@ with open("README.md", "r") as fh:
setuptools.setup(
name="airllm",
-version="2.9",
+version="2.9.1",
author="Gavin Li",
author_email="gavinli@animaai.cloud",
description="AirLLM allows single 4GB GPU card to run 70B large language models without quantization, distillation or pruning. 8GB vmem to run 405B Llama3.1.",