Skip to content

Commit

Permalink
add support for Chinese-LLaMA-Alpaca (lm-sys#2700)
Browse files Browse the repository at this point in the history
  • Loading branch information
zollty authored and zhanghao.smooth committed Jan 26, 2024
1 parent 9f600e7 commit 7fc0123
Show file tree
Hide file tree
Showing 2 changed files with 32 additions and 0 deletions.
26 changes: 26 additions & 0 deletions fastchat/model/model_adapter.py
Original file line number Diff line number Diff line change
Expand Up @@ -1726,6 +1726,31 @@ def get_default_conv_template(self, model_path: str) -> Conversation:
return get_conv_template("llama2-chinese")


class Lamma2ChineseAlpacaAdapter(BaseModelAdapter):
    """Adapter for the ymcui/Chinese-LLaMA-Alpaca SFT checkpoints."""

    def match(self, model_path: str):
        """Return True when the lower-cased path contains "chinese-alpaca"."""
        lowered_path = model_path.lower()
        return "chinese-alpaca" in lowered_path

    def load_model(self, model_path: str, from_pretrained_kwargs: dict):
        """Load the causal LM and its tokenizer from ``model_path``.

        Args:
            model_path: Path or identifier handed to both ``from_pretrained``
                calls.
            from_pretrained_kwargs: Extra keyword arguments forwarded verbatim
                to the model loader; only its ``"revision"`` entry (default
                ``"main"``) is forwarded to the tokenizer loader.

        Returns:
            A ``(model, tokenizer)`` tuple.
        """
        # The tokenizer is loaded first and only needs the revision pin.
        tok = AutoTokenizer.from_pretrained(
            model_path,
            trust_remote_code=True,
            revision=from_pretrained_kwargs.get("revision", "main"),
        )
        # The model receives every caller-supplied option on top of the two
        # fixed flags below.
        lm = AutoModelForCausalLM.from_pretrained(
            model_path,
            trust_remote_code=True,
            low_cpu_mem_usage=True,
            **from_pretrained_kwargs,
        )
        return lm, tok

    def get_default_conv_template(self, model_path: str) -> Conversation:
        """Return the "llama2-chinese" conversation template."""
        template = get_conv_template("llama2-chinese")
        return template


class VigogneAdapter(BaseModelAdapter):
"""The model adapter for vigogne (e.g., bofenghuang/vigogne-2-7b-chat)"""

Expand Down Expand Up @@ -1941,6 +1966,7 @@ def get_default_conv_template(self, model_path: str) -> Conversation:
# Register each adapter class via register_model_adapter, one call per class.
# NOTE(review): presumably registration order decides which adapter's match()
# is consulted first — confirm against register_model_adapter before reordering.
register_model_adapter(BGEAdapter)
register_model_adapter(E5Adapter)
register_model_adapter(Lamma2ChineseAdapter)
register_model_adapter(Lamma2ChineseAlpacaAdapter)
register_model_adapter(VigogneAdapter)
register_model_adapter(OpenLLaMaOpenInstructAdapter)
register_model_adapter(ReaLMAdapter)
Expand Down
6 changes: 6 additions & 0 deletions fastchat/model/model_registry.py
Original file line number Diff line number Diff line change
Expand Up @@ -330,6 +330,12 @@ def get_model_info(name: str) -> ModelInfo:
"https://huggingface.co/FlagAlpha/Llama2-Chinese-13b-Chat",
"Llama2-Chinese is a multi-language large-scale language model (LLM), developed by FlagAlpha.",
)
# Registry entry for the Chinese-Alpaca-2 models (7B and 13B share one entry).
# NOTE(review): the link points at the 13B repository for both sizes — confirm
# this is intended.
register_model_info(
["Chinese-Alpaca-2-7B", "Chinese-Alpaca-2-13B"],
"Chinese-Alpaca",
"https://huggingface.co/hfl/chinese-alpaca-2-13b",
"New extended Chinese vocabulary beyond Llama-2, open-sourcing the Chinese LLaMA-2 and Alpaca-2 LLMs.",
)
register_model_info(
["Vigogne-2-7B-Instruct", "Vigogne-2-13B-Instruct"],
"Vigogne-Instruct",
Expand Down

0 comments on commit 7fc0123

Please sign in to comment.