diff --git a/4-lora_sft.py b/4-lora_sft.py index f6328f1..6e75b5d 100644 --- a/4-lora_sft.py +++ b/4-lora_sft.py @@ -102,8 +102,8 @@ def find_all_linear_names(model): def init_model(): - model_name_or_path = "./minimind-v1-small" - tokenizer_name_or_path = "./minimind-v1-small" + model_name_or_path = "jingyaogong/minimind-v1-small" + tokenizer_name_or_path = "jingyaogong/minimind-v1-small" tokenizer = AutoTokenizer.from_pretrained(tokenizer_name_or_path, trust_remote_code=True, use_fast=False) model = AutoModelForCausalLM.from_pretrained(model_name_or_path, trust_remote_code=True).to(args.device)