Skip to content

Commit

Permalink
Merge pull request #123 from FederatedAI/feature-2.2.0-update_doc
Browse files Browse the repository at this point in the history
Feature 2.2.0 update doc
  • Loading branch information
mgqa34 authored Aug 1, 2024
2 parents 5fad8d8 + 8ac3bbb commit ce0e2e9
Showing 1 changed file with 5 additions and 5 deletions.
10 changes: 5 additions & 5 deletions doc/tutorial/fdkt/fdkt.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -39,7 +39,7 @@
"cell_type": "markdown",
"metadata": {},
"source": [
"The following code will sample 5000 datalines of 'Health' subdomain, and train data will generated under the folder './balance_processed_data/Health/train.json'"
"The following code will sample 5000 data lines from the 'Health' subdomain, and the training data will be written to './processed_data/Health/train.json'"
]
},
{
Expand Down Expand Up @@ -391,7 +391,7 @@
"llm_pretrained_path = \"Qwen1.5-7B-Chat\"\n",
"embedding_model_path = \"all-mpnet-base-v2\"\n",
"slm_pretrained_path = \"gpt2-xl\"\n",
"slm_data_path = \"./process/Health/train.json\"\n",
"slm_data_path = \"./processed_data/Health/train.json\"\n",
"\n",
"\n",
"def get_optimizer(model, optimizer=\"adam\", lr=1e-4):\n",
Expand Down Expand Up @@ -472,7 +472,7 @@
"\n",
" embedding_lm = SentenceTransformerModel(model_name_or_path=embedding_model_path).load()\n",
" training_args = FDKTTrainingArguments(\n",
" sample_num_per_cluster=5,\n",
" sample_num_per_cluster=4,\n",
" filter_prompt_max_length=2**14,\n",
" filter_generation_config=dict(\n",
" max_tokens=4096,\n",
Expand Down Expand Up @@ -559,7 +559,7 @@
"llm_pretrained_path = \"Qwen1.5-7B-Chat\"\n",
"embedding_model_path = \"all-mpnet-base-v2/\"\n",
"slm_pretrained_path = \"gpt2-xl\"\n",
"slm_data_path = \"./process/Health/train.json\" # should be absolute path\n",
"slm_data_path = \"./processed_data/Health/train.json\" # should be absolute path\n",
"\n",
"\n",
"def get_llm_conf():\n",
Expand All @@ -581,7 +581,7 @@
" )\n",
"\n",
" training_args = FDKTTrainingArguments(\n",
" sample_num_per_cluster=5,\n",
" sample_num_per_cluster=4,\n",
" filter_prompt_max_length=2 ** 14,\n",
" filter_generation_config=dict(\n",
" max_tokens=4096,\n",
Expand Down

0 comments on commit ce0e2e9

Please sign in to comment.