Amshaker committed on
Commit
5d67d4c
·
verified ·
1 Parent(s): 891cf8b

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +2 -0
  2. qwen3-1.7b-sft/README.md +61 -0
  3. qwen3-1.7b-sft/added_tokens.json +28 -0
  4. qwen3-1.7b-sft/all_results.json +8 -0
  5. qwen3-1.7b-sft/chat_template.jinja +85 -0
  6. qwen3-1.7b-sft/checkpoint-6502/added_tokens.json +28 -0
  7. qwen3-1.7b-sft/checkpoint-6502/chat_template.jinja +85 -0
  8. qwen3-1.7b-sft/checkpoint-6502/config.json +30 -0
  9. qwen3-1.7b-sft/checkpoint-6502/generation_config.json +6 -0
  10. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  11. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
  12. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
  13. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
  14. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
  15. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
  16. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
  17. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
  18. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
  19. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
  20. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
  21. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  22. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
  23. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
  24. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
  25. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
  26. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
  27. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
  28. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
  29. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
  30. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
  31. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
  32. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  33. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
  34. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
  35. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt +3 -0
  36. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt +3 -0
  37. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt +3 -0
  38. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt +3 -0
  39. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt +3 -0
  40. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt +3 -0
  41. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt +3 -0
  42. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt +3 -0
  43. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
  44. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt +3 -0
  45. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt +3 -0
  46. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt +3 -0
  47. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt +3 -0
  48. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt +3 -0
  49. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt +3 -0
  50. qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt +3 -0
.gitattributes CHANGED
@@ -42,3 +42,5 @@ SDPO-train32-alpha0.5-rollout8-lr1e-5-bigmath-Qwen-Qwen3-1.7B/global_step_60/act
42
  SDPO-train32-alpha0.5-rollout8-lr1e-5-bigmath-Qwen-Qwen3-1.7B/global_step_70/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
43
  SDPO-train32-alpha0.5-rollout8-lr1e-5-bigmath-Qwen-Qwen3-1.7B/global_step_80/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
44
  qwen3-1.7b-sft-lora/checkpoint-9752/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
42
  SDPO-train32-alpha0.5-rollout8-lr1e-5-bigmath-Qwen-Qwen3-1.7B/global_step_70/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
43
  SDPO-train32-alpha0.5-rollout8-lr1e-5-bigmath-Qwen-Qwen3-1.7B/global_step_80/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
44
  qwen3-1.7b-sft-lora/checkpoint-9752/tokenizer.json filter=lfs diff=lfs merge=lfs -text
45
+ qwen3-1.7b-sft/checkpoint-6502/tokenizer.json filter=lfs diff=lfs merge=lfs -text
46
+ qwen3-1.7b-sft/tokenizer.json filter=lfs diff=lfs merge=lfs -text
qwen3-1.7b-sft/README.md ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: transformers
3
+ license: other
4
+ base_model: Qwen/Qwen3-1.7B-Base
5
+ tags:
6
+ - llama-factory
7
+ - full
8
+ - generated_from_trainer
9
+ model-index:
10
+ - name: qwen3-1.7b-sft
11
+ results: []
12
+ ---
13
+
14
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
15
+ should probably proofread and complete it, then remove this comment. -->
16
+
17
+ # qwen3-1.7b-sft
18
+
19
+ This model is a fine-tuned version of [Qwen/Qwen3-1.7B-Base](https://huggingface.co/Qwen/Qwen3-1.7B-Base) on the mobilek2_sft1 and the mobilek2_sft2 datasets.
20
+
21
+ ## Model description
22
+
23
+ More information needed
24
+
25
+ ## Intended uses & limitations
26
+
27
+ More information needed
28
+
29
+ ## Training and evaluation data
30
+
31
+ More information needed
32
+
33
+ ## Training procedure
34
+
35
+ ### Training hyperparameters
36
+
37
+ The following hyperparameters were used during training:
38
+ - learning_rate: 5e-05
39
+ - train_batch_size: 1
40
+ - eval_batch_size: 8
41
+ - seed: 42
42
+ - distributed_type: multi-GPU
43
+ - num_devices: 48
44
+ - gradient_accumulation_steps: 2
45
+ - total_train_batch_size: 96
46
+ - total_eval_batch_size: 384
47
+ - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
48
+ - lr_scheduler_type: cosine
49
+ - lr_scheduler_warmup_ratio: 0.05
50
+ - num_epochs: 2.0
51
+
52
+ ### Training results
53
+
54
+
55
+
56
+ ### Framework versions
57
+
58
+ - Transformers 4.52.4
59
+ - Pytorch 2.7.0+rocm6.3
60
+ - Datasets 4.0.0
61
+ - Tokenizers 0.21.4
qwen3-1.7b-sft/added_tokens.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "</think>": 151668,
3
+ "</tool_call>": 151658,
4
+ "</tool_response>": 151666,
5
+ "<think>": 151667,
6
+ "<tool_call>": 151657,
7
+ "<tool_response>": 151665,
8
+ "<|box_end|>": 151649,
9
+ "<|box_start|>": 151648,
10
+ "<|endoftext|>": 151643,
11
+ "<|file_sep|>": 151664,
12
+ "<|fim_middle|>": 151660,
13
+ "<|fim_pad|>": 151662,
14
+ "<|fim_prefix|>": 151659,
15
+ "<|fim_suffix|>": 151661,
16
+ "<|im_end|>": 151645,
17
+ "<|im_start|>": 151644,
18
+ "<|image_pad|>": 151655,
19
+ "<|object_ref_end|>": 151647,
20
+ "<|object_ref_start|>": 151646,
21
+ "<|quad_end|>": 151651,
22
+ "<|quad_start|>": 151650,
23
+ "<|repo_name|>": 151663,
24
+ "<|video_pad|>": 151656,
25
+ "<|vision_end|>": 151653,
26
+ "<|vision_pad|>": 151654,
27
+ "<|vision_start|>": 151652
28
+ }
qwen3-1.7b-sft/all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 2.0,
3
+ "total_flos": 7602235458453504.0,
4
+ "train_loss": 0.4130896302561729,
5
+ "train_runtime": 242271.9548,
6
+ "train_samples_per_second": 2.576,
7
+ "train_steps_per_second": 0.027
8
+ }
qwen3-1.7b-sft/chat_template.jinja ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {%- if tools %}
2
+ {{- '<|im_start|>system\n' }}
3
+ {%- if messages[0].role == 'system' %}
4
+ {{- messages[0].content + '\n\n' }}
5
+ {%- endif %}
6
+ {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
7
+ {%- for tool in tools %}
8
+ {{- "\n" }}
9
+ {{- tool | tojson }}
10
+ {%- endfor %}
11
+ {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
12
+ {%- else %}
13
+ {%- if messages[0].role == 'system' %}
14
+ {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}
15
+ {%- endif %}
16
+ {%- endif %}
17
+ {%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
18
+ {%- for message in messages[::-1] %}
19
+ {%- set index = (messages|length - 1) - loop.index0 %}
20
+ {%- if ns.multi_step_tool and message.role == "user" and not(message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) %}
21
+ {%- set ns.multi_step_tool = false %}
22
+ {%- set ns.last_query_index = index %}
23
+ {%- endif %}
24
+ {%- endfor %}
25
+ {%- for message in messages %}
26
+ {%- if (message.role == "user") or (message.role == "system" and not loop.first) %}
27
+ {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }}
28
+ {%- elif message.role == "assistant" %}
29
+ {%- set content = message.content %}
30
+ {%- set reasoning_content = '' %}
31
+ {%- if message.reasoning_content is defined and message.reasoning_content is not none %}
32
+ {%- set reasoning_content = message.reasoning_content %}
33
+ {%- else %}
34
+ {%- if '</think>' in message.content %}
35
+ {%- set content = message.content.split('</think>')[-1].lstrip('\n') %}
36
+ {%- set reasoning_content = message.content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
37
+ {%- endif %}
38
+ {%- endif %}
39
+ {%- if loop.index0 > ns.last_query_index %}
40
+ {%- if loop.last or (not loop.last and reasoning_content) %}
41
+ {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }}
42
+ {%- else %}
43
+ {{- '<|im_start|>' + message.role + '\n' + content }}
44
+ {%- endif %}
45
+ {%- else %}
46
+ {{- '<|im_start|>' + message.role + '\n' + content }}
47
+ {%- endif %}
48
+ {%- if message.tool_calls %}
49
+ {%- for tool_call in message.tool_calls %}
50
+ {%- if (loop.first and content) or (not loop.first) %}
51
+ {{- '\n' }}
52
+ {%- endif %}
53
+ {%- if tool_call.function %}
54
+ {%- set tool_call = tool_call.function %}
55
+ {%- endif %}
56
+ {{- '<tool_call>\n{"name": "' }}
57
+ {{- tool_call.name }}
58
+ {{- '", "arguments": ' }}
59
+ {%- if tool_call.arguments is string %}
60
+ {{- tool_call.arguments }}
61
+ {%- else %}
62
+ {{- tool_call.arguments | tojson }}
63
+ {%- endif %}
64
+ {{- '}\n</tool_call>' }}
65
+ {%- endfor %}
66
+ {%- endif %}
67
+ {{- '<|im_end|>\n' }}
68
+ {%- elif message.role == "tool" %}
69
+ {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
70
+ {{- '<|im_start|>user' }}
71
+ {%- endif %}
72
+ {{- '\n<tool_response>\n' }}
73
+ {{- message.content }}
74
+ {{- '\n</tool_response>' }}
75
+ {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
76
+ {{- '<|im_end|>\n' }}
77
+ {%- endif %}
78
+ {%- endif %}
79
+ {%- endfor %}
80
+ {%- if add_generation_prompt %}
81
+ {{- '<|im_start|>assistant\n' }}
82
+ {%- if enable_thinking is defined and enable_thinking is false %}
83
+ {{- '<think>\n\n</think>\n\n' }}
84
+ {%- endif %}
85
+ {%- endif %}
qwen3-1.7b-sft/checkpoint-6502/added_tokens.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "</think>": 151668,
3
+ "</tool_call>": 151658,
4
+ "</tool_response>": 151666,
5
+ "<think>": 151667,
6
+ "<tool_call>": 151657,
7
+ "<tool_response>": 151665,
8
+ "<|box_end|>": 151649,
9
+ "<|box_start|>": 151648,
10
+ "<|endoftext|>": 151643,
11
+ "<|file_sep|>": 151664,
12
+ "<|fim_middle|>": 151660,
13
+ "<|fim_pad|>": 151662,
14
+ "<|fim_prefix|>": 151659,
15
+ "<|fim_suffix|>": 151661,
16
+ "<|im_end|>": 151645,
17
+ "<|im_start|>": 151644,
18
+ "<|image_pad|>": 151655,
19
+ "<|object_ref_end|>": 151647,
20
+ "<|object_ref_start|>": 151646,
21
+ "<|quad_end|>": 151651,
22
+ "<|quad_start|>": 151650,
23
+ "<|repo_name|>": 151663,
24
+ "<|video_pad|>": 151656,
25
+ "<|vision_end|>": 151653,
26
+ "<|vision_pad|>": 151654,
27
+ "<|vision_start|>": 151652
28
+ }
qwen3-1.7b-sft/checkpoint-6502/chat_template.jinja ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {%- if tools %}
2
+ {{- '<|im_start|>system\n' }}
3
+ {%- if messages[0].role == 'system' %}
4
+ {{- messages[0].content + '\n\n' }}
5
+ {%- endif %}
6
+ {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
7
+ {%- for tool in tools %}
8
+ {{- "\n" }}
9
+ {{- tool | tojson }}
10
+ {%- endfor %}
11
+ {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
12
+ {%- else %}
13
+ {%- if messages[0].role == 'system' %}
14
+ {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}
15
+ {%- endif %}
16
+ {%- endif %}
17
+ {%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
18
+ {%- for message in messages[::-1] %}
19
+ {%- set index = (messages|length - 1) - loop.index0 %}
20
+ {%- if ns.multi_step_tool and message.role == "user" and not(message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) %}
21
+ {%- set ns.multi_step_tool = false %}
22
+ {%- set ns.last_query_index = index %}
23
+ {%- endif %}
24
+ {%- endfor %}
25
+ {%- for message in messages %}
26
+ {%- if (message.role == "user") or (message.role == "system" and not loop.first) %}
27
+ {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }}
28
+ {%- elif message.role == "assistant" %}
29
+ {%- set content = message.content %}
30
+ {%- set reasoning_content = '' %}
31
+ {%- if message.reasoning_content is defined and message.reasoning_content is not none %}
32
+ {%- set reasoning_content = message.reasoning_content %}
33
+ {%- else %}
34
+ {%- if '</think>' in message.content %}
35
+ {%- set content = message.content.split('</think>')[-1].lstrip('\n') %}
36
+ {%- set reasoning_content = message.content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
37
+ {%- endif %}
38
+ {%- endif %}
39
+ {%- if loop.index0 > ns.last_query_index %}
40
+ {%- if loop.last or (not loop.last and reasoning_content) %}
41
+ {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }}
42
+ {%- else %}
43
+ {{- '<|im_start|>' + message.role + '\n' + content }}
44
+ {%- endif %}
45
+ {%- else %}
46
+ {{- '<|im_start|>' + message.role + '\n' + content }}
47
+ {%- endif %}
48
+ {%- if message.tool_calls %}
49
+ {%- for tool_call in message.tool_calls %}
50
+ {%- if (loop.first and content) or (not loop.first) %}
51
+ {{- '\n' }}
52
+ {%- endif %}
53
+ {%- if tool_call.function %}
54
+ {%- set tool_call = tool_call.function %}
55
+ {%- endif %}
56
+ {{- '<tool_call>\n{"name": "' }}
57
+ {{- tool_call.name }}
58
+ {{- '", "arguments": ' }}
59
+ {%- if tool_call.arguments is string %}
60
+ {{- tool_call.arguments }}
61
+ {%- else %}
62
+ {{- tool_call.arguments | tojson }}
63
+ {%- endif %}
64
+ {{- '}\n</tool_call>' }}
65
+ {%- endfor %}
66
+ {%- endif %}
67
+ {{- '<|im_end|>\n' }}
68
+ {%- elif message.role == "tool" %}
69
+ {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
70
+ {{- '<|im_start|>user' }}
71
+ {%- endif %}
72
+ {{- '\n<tool_response>\n' }}
73
+ {{- message.content }}
74
+ {{- '\n</tool_response>' }}
75
+ {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
76
+ {{- '<|im_end|>\n' }}
77
+ {%- endif %}
78
+ {%- endif %}
79
+ {%- endfor %}
80
+ {%- if add_generation_prompt %}
81
+ {{- '<|im_start|>assistant\n' }}
82
+ {%- if enable_thinking is defined and enable_thinking is false %}
83
+ {{- '<think>\n\n</think>\n\n' }}
84
+ {%- endif %}
85
+ {%- endif %}
qwen3-1.7b-sft/checkpoint-6502/config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen3ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 151643,
8
+ "eos_token_id": 151643,
9
+ "head_dim": 128,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 2048,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 6144,
14
+ "max_position_embeddings": 32768,
15
+ "max_window_layers": 28,
16
+ "model_type": "qwen3",
17
+ "num_attention_heads": 16,
18
+ "num_hidden_layers": 28,
19
+ "num_key_value_heads": 8,
20
+ "rms_norm_eps": 1e-06,
21
+ "rope_scaling": null,
22
+ "rope_theta": 1000000,
23
+ "sliding_window": null,
24
+ "tie_word_embeddings": true,
25
+ "torch_dtype": "bfloat16",
26
+ "transformers_version": "4.52.4",
27
+ "use_cache": false,
28
+ "use_sliding_window": false,
29
+ "vocab_size": 151936
30
+ }
qwen3-1.7b-sft/checkpoint-6502/generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 151643,
3
+ "eos_token_id": 151643,
4
+ "max_new_tokens": 2048,
5
+ "transformers_version": "4.52.4"
6
+ }
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb783c8f298187ac41585f65b50d7c7d960954d24378f2b331c9234f1dabe640
3
+ size 430150469
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b4638b6aea0f339baa807d460f6e4e9b5746dabb18b5b1d8bb872a1b561a614
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:684f021b026eb54f9800a4306738bd2962c288b0f390eae6c59eed121bd79f7e
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d37f19b149205bd4a9e51490df501fa90f40a15f01dd93fb0e6073350c68cc6
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ef7c5a8852f372f03456eba3acdcf837798a16a3066b10d4a76362dcdf5c872
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a10cf0d903270d13b8f6dd0486ff41b10499ddfbf3f5e1b93ff46e9f7a70102
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba359f490230d80bb170385a2d7438d7ac91b791c81811431933971010fdd027
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9197096a8984ac294a322f7608c12d88a2c6aa8735e78f4d1bafa804a0929c3
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8469e7c7a11a55213a1b26ff1ff81e338fb7aabfef5a28d26b009e0f552e0a25
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07e3900ae1f5fc9b813b6d61eb6e2adf648dc219937ca2499c8f7494f602d43f
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06809e973763e16119eac4534e8c35055f95c29a781afbc0e2b173aec37f1acb
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9477232db152287c80188c601e99fa4c35135624f4a2860cee1e4bc01d09439
3
+ size 430150469
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ec36024d9f354a1187099011d21b91fdc03dcc748a4ff35ddfee5f5234e3747
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3340b60acf2dce215d60911e1d10dfe6bf5cb35ada16bd5035053c9b7304ece
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f4edf75aa816e3295d6d28efa6d58e1273ea6e9b224ce39ca5fd6d6475da8a3
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:430c46a07e49ae43b1b9766669e8eebaf3d786d08452613970bed4182a457819
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00652bfede69a7510bb61b3f6f5734b077e54fc2f75d17ac054f77b2b69bf156
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4e657332bd40f454cdc19b64cafbcafc2147dbc2d262448504ce7991d24c4ec
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89876d4d8b907fc7c92fffaa7d37148978b3a8f187d26557fb84724e7864d3ae
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f1417169726a77a0dcc9391d87f07b01e230f640bc002a51dc6c86fbf696f01
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d228a913aae6242124b5d1e977c59987a6f2f8794be1048b69c85a205daa82de
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06b337c29e09c04b3916bf592c0c0100431b62dd0e86c673b1be1b257dcd9344
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:631319f3d95fe3c34a5bb92690042c8fb0238a323d4bff1fbad2881abc41951f
3
+ size 430150469
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d57536d6b2bd36b39ddffa8f5a19d7906551db48cc6834e53a39a562021d659
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61a1cfe5b04796f462952267e55510ecbe279c30af31b63781111c8fa374aaec
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6523180bd30da7e0a47b6757f0d34c4d098f7173e4454f7cd52be434aa713aaa
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7aa63328b40cf564f8da326cbf94dbdc8c4828ae22ad82f987b07c12e76b8fc
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4605eb9ea821f6d5de2034e4490f391111f99e5529aafdb25488bbdc486edcdc
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0308f4040ec2ae950eb2a8568d7344525c4d48475d0e97a46213047fb796b2cb
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0106d82fae0856b78eb44bc22e39392102de48689843f4d3e4c51892adb617d
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8469015ca7d192546b2dbc8a0ceefd64b7a3d497843eeebd1da7a0c9e9035f27
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a62a972526d89730d86c8cdc51ce0055816e533adf8d51642bc003941d8997a
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:380c3afbed633b2b7f4600bc5fd9600de2f77ca9f5713b50f6d143181f7417ed
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5484dc5808786305a2ab99712f043d210fe981f9de05381ec24a2bcfbff6d9e6
3
+ size 430150469
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eecf9d92cd445ef1ef52a58712361bb0236e4f9204cc6960adec9dc501f50a6a
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00912cc19e445b1a215c06a5eab30e46be5ab2acf1507dca2aa4e2cd09a44af7
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9df9e869b8aa7e66ec1cae7233b3062a705ed7a00ccacaea1b9a9dc4cd88a74
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbf39df961241da8b81d3b1cbc92f24d933253957a0a3e3f7ede97a7891ff9d2
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:132db6007792d0377338ab42bcc59a1eb28a537274f0f3e95d66aa4778a56513
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adb68f8bd30cf8dc1ab1e5b4d071cd4839dfb039a37aeedcf86511a32b0aa777
3
+ size 430150483
qwen3-1.7b-sft/checkpoint-6502/global_step6502/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c3ea7fcb8bfca29c6b317eed9ee74d98dbe83fcc916b6cd6523c7c251e87a1b
3
+ size 430150483