Fix shell examples: single-quote --dataset values containing '#' (#2764)

modelscope · Dec 25, 2024 · 6488cba
1 parent dbeec0f
commit 6488cba
Show file tree

Hide file tree

Showing 55 changed files with 73 additions and 73 deletions.
diff --git a/README.md b/README.md
@@ -114,9 +114,9 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#500 \
-              AI-ModelScope/alpaca-gpt4-data-en#500 \
-              swift/self-cognition#500 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#500' \
+              'AI-ModelScope/alpaca-gpt4-data-en#500' \
+              'swift/self-cognition#500' \
     --torch_dtype bfloat16 \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \

diff --git a/README_CN.md b/README_CN.md
@@ -107,9 +107,9 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#500 \
-              AI-ModelScope/alpaca-gpt4-data-en#500 \
-              swift/self-cognition#500 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#500' \
+              'AI-ModelScope/alpaca-gpt4-data-en#500' \
+              'swift/self-cognition#500' \
     --torch_dtype bfloat16 \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \

diff --git a/docs/source/GetStarted/快速开始.md b/docs/source/GetStarted/快速开始.md
@@ -31,9 +31,9 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#500 \
-              AI-ModelScope/alpaca-gpt4-data-en#500 \
-              swift/self-cognition#500 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#500' \
+              'AI-ModelScope/alpaca-gpt4-data-en#500' \
+              'swift/self-cognition#500' \
     --torch_dtype bfloat16 \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \

diff --git a/docs/source/Instruction/导出.md b/docs/source/Instruction/导出.md
@@ -77,7 +77,7 @@ CUDA_VISIBLE_DEVICES=0 swift infer \
 CUDA_VISIBLE_DEVICES=0 swift sft \
     --model Qwen/Qwen2-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#5000 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#5000' \
     --quant_method bnb \
     --quant_bits 4 \
     --torch_dtype bfloat16
@@ -86,15 +86,15 @@ CUDA_VISIBLE_DEVICES=0 swift sft \
 CUDA_VISIBLE_DEVICES=0 swift sft \
     --model Qwen/Qwen2-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#5000 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#5000' \
     --quant_method hqq \
     --quant_bits 4
 
 # eetq
 CUDA_VISIBLE_DEVICES=0 swift sft \
     --model Qwen/Qwen2-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#5000 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#5000' \
     --quant_method eetq \
     --torch_dtype float16
 ```

diff --git a/docs/source_en/GetStarted/Quick-start.md b/docs/source_en/GetStarted/Quick-start.md
@@ -31,9 +31,9 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#500 \
-              AI-ModelScope/alpaca-gpt4-data-en#500 \
-              swift/self-cognition#500 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#500' \
+              'AI-ModelScope/alpaca-gpt4-data-en#500' \
+              'swift/self-cognition#500' \
     --torch_dtype bfloat16 \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \

diff --git a/docs/source_en/Instruction/Export.md b/docs/source_en/Instruction/Export.md
@@ -78,7 +78,7 @@ CUDA_VISIBLE_DEVICES=0 swift infer \
 CUDA_VISIBLE_DEVICES=0 swift sft \
     --model Qwen/Qwen2-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#5000 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#5000' \
     --quant_method bnb \
     --quant_bits 4 \
     --torch_dtype bfloat16
@@ -87,15 +87,15 @@ CUDA_VISIBLE_DEVICES=0 swift sft \
 CUDA_VISIBLE_DEVICES=0 swift sft \
     --model Qwen/Qwen2-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#5000 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#5000' \
     --quant_method hqq \
     --quant_bits 4
 
 # eetq
 CUDA_VISIBLE_DEVICES=0 swift sft \
     --model Qwen/Qwen2-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#5000 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#5000' \
     --quant_method eetq \
     --torch_dtype float16
 ```

diff --git a/examples/export/quantize/awq.sh b/examples/export/quantize/awq.sh
@@ -1,8 +1,8 @@
 CUDA_VISIBLE_DEVICES=0 \
 swift export \
     --model Qwen/Qwen2.5-1.5B-Instruct \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#500 \
-              AI-ModelScope/alpaca-gpt4-data-en#500 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#500' \
+              'AI-ModelScope/alpaca-gpt4-data-en#500' \
     --quant_n_samples 128 \
     --quant_batch_size 1 \
     --max_length 2048 \

diff --git a/examples/export/quantize/gptq.sh b/examples/export/quantize/gptq.sh
@@ -3,8 +3,8 @@ OMP_NUM_THREADS=14 \
 CUDA_VISIBLE_DEVICES=0 \
 swift export \
     --model Qwen/Qwen2.5-1.5B-Instruct \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#500 \
-              AI-ModelScope/alpaca-gpt4-data-en#500 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#500' \
+              'AI-ModelScope/alpaca-gpt4-data-en#500' \
     --quant_n_samples 128 \
     --quant_batch_size 1 \
     --max_length 2048 \

diff --git a/examples/notebook/qwen2.5-self-cognition/sft.sh b/examples/notebook/qwen2.5-self-cognition/sft.sh
@@ -4,9 +4,9 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-3B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#500 \
-              AI-ModelScope/alpaca-gpt4-data-en#500 \
-              swift/self-cognition#500 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#500' \
+              'AI-ModelScope/alpaca-gpt4-data-en#500' \
+              'swift/self-cognition#500' \
     --torch_dtype bfloat16 \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \

diff --git a/examples/train/all_to_all/train.sh b/examples/train/all_to_all/train.sh
@@ -7,7 +7,7 @@ image_area=518400 \
 swift sft \
     --model BAAI/Emu3-Gen \
     --train_type lora \
-    --dataset swift/TextCaps#40 \
+    --dataset 'swift/TextCaps#40' \
     --loss_scale react \
     --tools_prompt react_zh \
     --torch_dtype bfloat16 \

diff --git a/examples/train/demo.sh b/examples/train/demo.sh
@@ -3,9 +3,9 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/alpaca-gpt4-data-zh#500 \
-              AI-ModelScope/alpaca-gpt4-data-en#500 \
-              swift/self-cognition#500 \
+    --dataset 'AI-ModelScope/alpaca-gpt4-data-zh#500' \
+              'AI-ModelScope/alpaca-gpt4-data-en#500' \
+              'swift/self-cognition#500' \
     --torch_dtype bfloat16 \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \

diff --git a/examples/train/full/train.sh b/examples/train/full/train.sh
@@ -3,7 +3,7 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type full \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \
     --learning_rate 1e-5 \

diff --git a/examples/train/lazy_tokenize/train.sh b/examples/train/lazy_tokenize/train.sh
@@ -3,7 +3,7 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \
     --learning_rate 1e-4 \

diff --git a/examples/train/multi-gpu/ddp/train.sh b/examples/train/multi-gpu/ddp/train.sh
@@ -7,7 +7,7 @@ swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
     --torch_dtype bfloat16 \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \
     --lora_rank 8 \

diff --git a/examples/train/multi-gpu/ddp_device_map/train.sh b/examples/train/multi-gpu/ddp_device_map/train.sh
@@ -6,7 +6,7 @@ NPROC_PER_NODE=$nproc_per_node \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --torch_dtype bfloat16 \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \

diff --git a/examples/train/multi-gpu/deepspeed/train_zero2.sh b/examples/train/multi-gpu/deepspeed/train_zero2.sh
@@ -6,7 +6,7 @@ NPROC_PER_NODE=$nproc_per_node \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --torch_dtype bfloat16 \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \

diff --git a/examples/train/multi-gpu/deepspeed/train_zero3.sh b/examples/train/multi-gpu/deepspeed/train_zero3.sh
@@ -6,7 +6,7 @@ NPROC_PER_NODE=$nproc_per_node \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \
     --lora_rank 8 \

diff --git a/examples/train/multi-gpu/fsdp_qlora/train.sh b/examples/train/multi-gpu/fsdp_qlora/train.sh
@@ -6,7 +6,7 @@ accelerate launch --config_file "./examples/train/fsdp_qlora/fsdp_offload.json"
     swift/cli/sft.py \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \
     --max_length 2048 \

diff --git a/examples/train/multi-node/accelerate/train_node1.sh b/examples/train/multi-node/accelerate/train_node1.sh
@@ -4,7 +4,7 @@ accelerate launch --config_file ./examples/train/multi-node/accelerate/multi_nod
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
     --torch_dtype bfloat16 \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --lora_rank 8 \
     --lora_alpha 32 \

diff --git a/examples/train/multi-node/accelerate/train_node2.sh b/examples/train/multi-node/accelerate/train_node2.sh
@@ -4,7 +4,7 @@ accelerate launch --config_file ./examples/train/multi-node/accelerate/multi_nod
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
     --torch_dtype bfloat16 \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --lora_rank 8 \
     --lora_alpha 32 \

diff --git a/examples/train/multi-node/deepspeed/train.sh b/examples/train/multi-node/deepspeed/train.sh
@@ -5,7 +5,7 @@ deepspeed --hostfile=./examples/train/multi-node-deepspeed/host.txt \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
     --torch_dtype bfloat16 \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --lora_rank 8 \
     --lora_alpha 32 \

diff --git a/examples/train/multi-node/dlc/train.sh b/examples/train/multi-node/dlc/train.sh
@@ -3,7 +3,7 @@ NODE_RANK=$RANK \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \
     --lora_rank 8 \

diff --git a/examples/train/multi-node/swift/train_node1.sh b/examples/train/multi-node/swift/train_node1.sh
@@ -7,7 +7,7 @@ swift sft \
       --model Qwen/Qwen2.5-7B-Instruct \
       --train_type lora \
       --torch_dtype bfloat16 \
-      --dataset swift/self-cognition#1000 \
+      --dataset 'swift/self-cognition#1000' \
       --num_train_epochs 1 \
       --lora_rank 8 \
       --lora_alpha 32 \

diff --git a/examples/train/multi-node/swift/train_node2.sh b/examples/train/multi-node/swift/train_node2.sh
@@ -7,7 +7,7 @@ swift sft \
       --model Qwen/Qwen2.5-7B-Instruct \
       --train_type lora \
       --torch_dtype bfloat16 \
-      --dataset swift/self-cognition#1000 \
+      --dataset 'swift/self-cognition#1000' \
       --num_train_epochs 1 \
       --lora_rank 8 \
       --lora_alpha 32 \

diff --git a/examples/train/multi-node/torchrun/train_node1.sh b/examples/train/multi-node/torchrun/train_node1.sh
@@ -4,7 +4,7 @@ torchrun --master_port 29500 --nproc_per_node=4 --nnodes=2 --node_rank=0 --maste
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
     --torch_dtype bfloat16 \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --lora_rank 8 \
     --lora_alpha 32 \

diff --git a/examples/train/multi-node/torchrun/train_node2.sh b/examples/train/multi-node/torchrun/train_node2.sh
@@ -4,7 +4,7 @@ torchrun --master_port 29500 --nproc_per_node=4 --nnodes=2 --node_rank=1 --maste
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
     --torch_dtype bfloat16 \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --lora_rank 8 \
     --lora_alpha 32 \

diff --git a/examples/train/multimodal/grounding.sh b/examples/train/multimodal/grounding.sh
@@ -4,7 +4,7 @@ MAX_PIXELS=1003520 \
 swift sft \
     --model Qwen/Qwen2-VL-7B-Instruct \
     --train_type lora \
-    --dataset swift/refcoco:grounding#1000 \
+    --dataset 'swift/refcoco:grounding#1000' \
     --num_train_epochs 1 \
     --learning_rate 1e-4 \
     --lora_rank 8 \

diff --git a/examples/train/multimodal/ocr.sh b/examples/train/multimodal/ocr.sh
@@ -3,7 +3,7 @@ CUDA_VISIBLE_DEVICES=0,1 \
 MAX_PIXELS=1003520 \
 swift sft \
     --model Qwen/QVQ-72B-Preview \
-    --dataset AI-ModelScope/LaTeX_OCR:human_handwrite#20000 \
+    --dataset 'AI-ModelScope/LaTeX_OCR:human_handwrite#20000' \
     --train_type lora \
     --torch_dtype bfloat16 \
     --num_train_epochs 1 \

diff --git a/examples/train/multimodal/vqa.sh b/examples/train/multimodal/vqa.sh
@@ -6,7 +6,7 @@ MAX_PIXELS=1003520 \
 swift sft \
     --model Qwen/Qwen2-VL-7B-Instruct \
     --train_type lora \
-    --dataset swift/OK-VQA_train#1000 \
+    --dataset 'swift/OK-VQA_train#1000' \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \
     --learning_rate 1e-4 \

diff --git a/examples/train/packing/train.sh b/examples/train/packing/train.sh
@@ -7,7 +7,7 @@ swift sft \
     --packing true \
     --max_length 8192 \
     --max_steps 100 \
-    --dataset swift/self-cognition#5000 \
+    --dataset 'swift/self-cognition#5000' \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \
     --learning_rate 1e-4 \

diff --git a/examples/train/plugins/train_loss_scale.sh b/examples/train/plugins/train_loss_scale.sh
@@ -5,7 +5,7 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \
     --learning_rate 1e-4 \

diff --git a/examples/train/rlhf/kto.sh b/examples/train/rlhf/kto.sh
@@ -6,7 +6,7 @@ swift rlhf \
     --rlhf_type kto \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/ultrafeedback-binarized-preferences-cleaned-kto#10000 \
+    --dataset 'AI-ModelScope/ultrafeedback-binarized-preferences-cleaned-kto#10000' \
     --num_train_epochs 2 \
     --learning_rate 1e-4 \
     --lora_rank 8 \

diff --git a/examples/train/seq_cls/sft.sh b/examples/train/seq_cls/sft.sh
@@ -4,7 +4,7 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-7B \
     --train_type lora \
-    --dataset DAMO_NLP/jd:cls#2000 \
+    --dataset 'DAMO_NLP/jd:cls#2000' \
     --torch_dtype bfloat16 \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \

diff --git a/examples/train/sequence_parallel/train.sh b/examples/train/sequence_parallel/train.sh
@@ -6,7 +6,7 @@ NPROC_PER_NODE=$nproc_per_node \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset AI-ModelScope/LongAlpaca-12k#5000 \
+    --dataset 'AI-ModelScope/LongAlpaca-12k#5000' \
     --num_train_epochs 1 \
     --sequence_parallel_size 2 \
     --learning_rate 1e-4 \

diff --git a/examples/train/streaming/train.sh b/examples/train/streaming/train.sh
@@ -2,7 +2,7 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type lora \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --streaming true \
     --max_steps 1000 \
     --learning_rate 1e-4 \

diff --git a/examples/train/tuners/adalora/train.sh b/examples/train/tuners/adalora/train.sh
@@ -3,7 +3,7 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type adalora \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \
     --learning_rate 1e-4 \

diff --git a/examples/train/tuners/adapter/train.sh b/examples/train/tuners/adapter/train.sh
@@ -3,7 +3,7 @@ CUDA_VISIBLE_DEVICES=0 \
 swift sft \
     --model Qwen/Qwen2.5-7B-Instruct \
     --train_type adapter \
-    --dataset swift/self-cognition#1000 \
+    --dataset 'swift/self-cognition#1000' \
     --num_train_epochs 1 \
     --per_device_train_batch_size 1 \
     --learning_rate 1e-4 \