Skip to content

Commit 7fc0123

Browse files
zolltyzhanghao.smooth
authored and committed
add support for Chinese-LLaMA-Alpaca (lm-sys#2700)
1 parent 9f600e7 commit 7fc0123

File tree

2 files changed

+32
-0
lines changed

2 files changed

+32
-0
lines changed

fastchat/model/model_adapter.py

Lines changed: 26 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1726,6 +1726,31 @@ def get_default_conv_template(self, model_path: str) -> Conversation:
17261726
return get_conv_template("llama2-chinese")
17271727

17281728

1729+
class Lamma2ChineseAlpacaAdapter(BaseModelAdapter):
    """Model adapter for the ymcui/Chinese-LLaMA-Alpaca SFT checkpoints.

    A model path is claimed by this adapter when it contains
    "chinese-alpaca" (compared case-insensitively).
    """

    def match(self, model_path: str):
        """Tell whether ``model_path`` names a Chinese-Alpaca checkpoint."""
        normalized_path = model_path.lower()
        return "chinese-alpaca" in normalized_path

    def load_model(self, model_path: str, from_pretrained_kwargs: dict):
        """Load the model and tokenizer found at ``model_path``.

        Args:
            model_path: Identifier or path handed to both ``from_pretrained``
                calls.
            from_pretrained_kwargs: Extra keyword arguments forwarded
                unchanged to the model loader; its optional "revision" entry
                is also used for the tokenizer.

        Returns:
            A ``(model, tokenizer)`` tuple.
        """
        # The tokenizer only receives the revision, falling back to "main"
        # when the caller did not specify one.
        tokenizer_options = {
            "trust_remote_code": True,
            "revision": from_pretrained_kwargs.get("revision", "main"),
        }
        tokenizer = AutoTokenizer.from_pretrained(model_path, **tokenizer_options)

        # The model loader gets the caller's kwargs as-is on top of the two
        # fixed flags.
        model = AutoModelForCausalLM.from_pretrained(
            model_path,
            trust_remote_code=True,
            low_cpu_mem_usage=True,
            **from_pretrained_kwargs,
        )
        return model, tokenizer

    def get_default_conv_template(self, model_path: str) -> Conversation:
        """Return the "llama2-chinese" conversation template."""
        template = get_conv_template("llama2-chinese")
        return template
1752+
1753+
17291754
class VigogneAdapter(BaseModelAdapter):
17301755
"""The model adapter for vigogne (e.g., bofenghuang/vigogne-2-7b-chat)"""
17311756

@@ -1941,6 +1966,7 @@ def get_default_conv_template(self, model_path: str) -> Conversation:
19411966
register_model_adapter(BGEAdapter)
19421967
register_model_adapter(E5Adapter)
19431968
register_model_adapter(Lamma2ChineseAdapter)
1969+
register_model_adapter(Lamma2ChineseAlpacaAdapter)
19441970
register_model_adapter(VigogneAdapter)
19451971
register_model_adapter(OpenLLaMaOpenInstructAdapter)
19461972
register_model_adapter(ReaLMAdapter)

fastchat/model/model_registry.py

Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -330,6 +330,12 @@ def get_model_info(name: str) -> ModelInfo:
330330
"https://huggingface.co/FlagAlpha/Llama2-Chinese-13b-Chat",
331331
"Llama2-Chinese is a multi-language large-scale language model (LLM), developed by FlagAlpha.",
332332
)
333+
# Registry entry for the Chinese-Alpaca-2 7B and 13B models: the list of model
# names, a short label, a Hugging Face link, and a one-line description.
register_model_info(
    ["Chinese-Alpaca-2-7B", "Chinese-Alpaca-2-13B"],
    "Chinese-Alpaca",
    "https://huggingface.co/hfl/chinese-alpaca-2-13b",
    "New extended Chinese vocabulary beyond Llama-2, open-sourcing the Chinese LLaMA-2 and Alpaca-2 LLMs.",
)
333339
register_model_info(
334340
["Vigogne-2-7B-Instruct", "Vigogne-2-13B-Instruct"],
335341
"Vigogne-Instruct",

0 commit comments

Comments
 (0)