Upload task output 1

Browse files

Files changed (10) hide show

README.md +1 -1
adapter_config.json +2 -2
adapter_model.safetensors +2 -2
added_tokens.json +1 -20
chat_template.jinja +6 -54
special_tokens_map.json +1 -12
tokenizer.json +2 -2
tokenizer_config.json +1 -165
trainer_state.json +23 -23
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -3,7 +3,7 @@ base_model: None
 library_name: peft
 pipeline_tag: text-generation
 tags:
-- base_model:adapter:/cache/models/Qwen--Qwen2.5-3B-Instruct
 - grpo
 - lora
 - transformers

 library_name: peft
 pipeline_tag: text-generation
 tags:
+- base_model:adapter:/cache/models/Qwen--Qwen2-7B-Instruct
 - grpo
 - lora
 - transformers

adapter_config.json CHANGED Viewed

@@ -30,11 +30,11 @@
   "revision": null,
   "target_modules": [
     "gate_proj",
     "down_proj",
     "k_proj",
     "v_proj",
-    "o_proj",
-    "up_proj",
     "q_proj"
   ],
   "target_parameters": null,

   "revision": null,
   "target_modules": [
     "gate_proj",
+    "o_proj",
     "down_proj",
+    "up_proj",
     "k_proj",
     "v_proj",
     "q_proj"
   ],
   "target_parameters": null,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c21840f4e747b01282174f4331451ae9581186e575ae9022732c3f5ff5d3b93c
-size 239536272

 version https://git-lfs.github.com/spec/v1
+oid sha256:1d1e0fbd0ec6c150d20f1fa3a376a2cfb2ab4bc5b23e44af2c0452abddf82b6d
+size 323014168

added_tokens.json CHANGED Viewed

@@ -1,24 +1,5 @@
 {
-  "</tool_call>": 151658,
-  "<tool_call>": 151657,
-  "<|box_end|>": 151649,
-  "<|box_start|>": 151648,
   "<|endoftext|>": 151643,
-  "<|file_sep|>": 151664,
-  "<|fim_middle|>": 151660,
-  "<|fim_pad|>": 151662,
-  "<|fim_prefix|>": 151659,
-  "<|fim_suffix|>": 151661,
   "<|im_end|>": 151645,
-  "<|im_start|>": 151644,
-  "<|image_pad|>": 151655,
-  "<|object_ref_end|>": 151647,
-  "<|object_ref_start|>": 151646,
-  "<|quad_end|>": 151651,
-  "<|quad_start|>": 151650,
-  "<|repo_name|>": 151663,
-  "<|video_pad|>": 151656,
-  "<|vision_end|>": 151653,
-  "<|vision_pad|>": 151654,
-  "<|vision_start|>": 151652
 }

 {
   "<|endoftext|>": 151643,
   "<|im_end|>": 151645,
+  "<|im_start|>": 151644
 }

chat_template.jinja CHANGED Viewed

@@ -1,54 +1,6 @@
-{%- if tools %}
-    {{- '<|im_start|>system\n' }}
-    {%- if messages[0]['role'] == 'system' %}
-        {{- messages[0]['content'] }}
-    {%- else %}
-        {{- 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.' }}
-    {%- endif %}
-    {{- "\n\n# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
-    {%- for tool in tools %}
-        {{- "\n" }}
-        {{- tool | tojson }}
-    {%- endfor %}
-    {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
-{%- else %}
-    {%- if messages[0]['role'] == 'system' %}
-        {{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }}
-    {%- else %}
-        {{- '<|im_start|>system\nYou are Qwen, created by Alibaba Cloud. You are a helpful assistant.<|im_end|>\n' }}
-    {%- endif %}
-{%- endif %}
-{%- for message in messages %}
-    {%- if (message.role == "user") or (message.role == "system" and not loop.first) or (message.role == "assistant" and not message.tool_calls) %}
-        {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }}
-    {%- elif message.role == "assistant" %}
-        {{- '<|im_start|>' + message.role }}
-        {%- if message.content %}
-            {{- '\n' + message.content }}
-        {%- endif %}
-        {%- for tool_call in message.tool_calls %}
-            {%- if tool_call.function is defined %}
-                {%- set tool_call = tool_call.function %}
-            {%- endif %}
-            {{- '\n<tool_call>\n{"name": "' }}
-            {{- tool_call.name }}
-            {{- '", "arguments": ' }}
-            {{- tool_call.arguments | tojson }}
-            {{- '}\n</tool_call>' }}
-        {%- endfor %}
-        {{- '<|im_end|>\n' }}
-    {%- elif message.role == "tool" %}
-        {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != "tool") %}
-            {{- '<|im_start|>user' }}
-        {%- endif %}
-        {{- '\n<tool_response>\n' }}
-        {{- message.content }}
-        {{- '\n</tool_response>' }}
-        {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
-            {{- '<|im_end|>\n' }}
-        {%- endif %}
-    {%- endif %}
-{%- endfor %}
-{%- if add_generation_prompt %}
-    {{- '<|im_start|>assistant\n' }}
-{%- endif %}

+{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system
+You are a helpful assistant.<|im_end|>
+' }}{% endif %}{{'<|im_start|>' + message['role'] + '
+' + message['content'] + '<|im_end|>' + '
+'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant
+' }}{% endif %}

special_tokens_map.json CHANGED Viewed

@@ -1,18 +1,7 @@
 {
   "additional_special_tokens": [
     "<|im_start|>",
-    "<|im_end|>",
-    "<|object_ref_start|>",
-    "<|object_ref_end|>",
-    "<|box_start|>",
-    "<|box_end|>",
-    "<|quad_start|>",
-    "<|quad_end|>",
-    "<|vision_start|>",
-    "<|vision_end|>",
-    "<|vision_pad|>",
-    "<|image_pad|>",
-    "<|video_pad|>"
   ],
   "eos_token": {
     "content": "<|im_end|>",

 {
   "additional_special_tokens": [
     "<|im_start|>",
+    "<|im_end|>"
   ],
   "eos_token": {
     "content": "<|im_end|>",

tokenizer.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa
-size 11421896

 version https://git-lfs.github.com/spec/v1
+oid sha256:bcfe42da0a4497e8b2b172c1f9f4ec423a46dc12907f4349c55025f670422ba9
+size 11418266

tokenizer_config.json CHANGED Viewed

@@ -1,5 +1,4 @@
 {
-  "add_bos_token": false,
   "add_prefix_space": false,
   "added_tokens_decoder": {
     "151643": {
@@ -25,174 +24,11 @@
       "rstrip": false,
       "single_word": false,
       "special": true
-    },
-    "151646": {
-      "content": "<|object_ref_start|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151647": {
-      "content": "<|object_ref_end|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151648": {
-      "content": "<|box_start|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151649": {
-      "content": "<|box_end|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151650": {
-      "content": "<|quad_start|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151651": {
-      "content": "<|quad_end|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151652": {
-      "content": "<|vision_start|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151653": {
-      "content": "<|vision_end|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151654": {
-      "content": "<|vision_pad|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151655": {
-      "content": "<|image_pad|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151656": {
-      "content": "<|video_pad|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151657": {
-      "content": "<tool_call>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151658": {
-      "content": "</tool_call>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151659": {
-      "content": "<|fim_prefix|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151660": {
-      "content": "<|fim_middle|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151661": {
-      "content": "<|fim_suffix|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151662": {
-      "content": "<|fim_pad|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151663": {
-      "content": "<|repo_name|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151664": {
-      "content": "<|file_sep|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
     }
   },
   "additional_special_tokens": [
     "<|im_start|>",
-    "<|im_end|>",
-    "<|object_ref_start|>",
-    "<|object_ref_end|>",
-    "<|box_start|>",
-    "<|box_end|>",
-    "<|quad_start|>",
-    "<|quad_end|>",
-    "<|vision_start|>",
-    "<|vision_end|>",
-    "<|vision_pad|>",
-    "<|image_pad|>",
-    "<|video_pad|>"
   ],
   "bos_token": null,
   "clean_up_tokenization_spaces": false,

 {
   "add_prefix_space": false,
   "added_tokens_decoder": {
     "151643": {
       "rstrip": false,
       "single_word": false,
       "special": true
     }
   },
   "additional_special_tokens": [
     "<|im_start|>",
+    "<|im_end|>"
   ],
   "bos_token": null,
   "clean_up_tokenization_spaces": false,

trainer_state.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2e-05,
   "eval_steps": 500,
   "global_step": 1,
   "is_hyper_param_search": false,
@@ -16,36 +16,36 @@
       "clip_ratio/low_min": 0.0,
       "clip_ratio/region_mean": 0.0,
       "completions/clipped_ratio": 0.0,
-      "completions/max_length": 1086.0,
-      "completions/max_terminated_length": 1086.0,
-      "completions/mean_length": 979.09375,
-      "completions/mean_terminated_length": 979.09375,
-      "completions/min_length": 688.0,
-      "completions/min_terminated_length": 688.0,
-      "entropy": 0.179680151399225,
-      "epoch": 2e-05,
       "frac_reward_zero_std": 0.0,
-      "grad_norm": 2.6082828044891357,
       "kl": 0.0,
       "learning_rate": 0.0,
-      "loss": -0.031,
-      "num_tokens": 65935.0,
-      "reward": -0.5424860715866089,
-      "reward_std": 0.18259182572364807,
-      "rewards/rollout_reward_func/mean": -0.5424860715866089,
-      "rewards/rollout_reward_func/std": 0.18774119019508362,
-      "sampling/importance_sampling_ratio/max": 2.453181743621826,
-      "sampling/importance_sampling_ratio/mean": 1.000138282775879,
-      "sampling/importance_sampling_ratio/min": 0.4654485583305359,
-      "sampling/sampling_logp_difference/max": 0.897385835647583,
-      "sampling/sampling_logp_difference/mean": 0.023822877556085587,
       "step": 1,
-      "step_time": 17.349584551999897
     }
   ],
   "logging_steps": 1.0,
   "max_steps": 600,
-  "num_input_tokens_seen": 65935,
   "num_train_epochs": 1,
   "save_steps": 500,
   "stateful_callbacks": {

   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 4e-05,
   "eval_steps": 500,
   "global_step": 1,
   "is_hyper_param_search": false,
       "clip_ratio/low_min": 0.0,
       "clip_ratio/region_mean": 0.0,
       "completions/clipped_ratio": 0.0,
+      "completions/max_length": 1052.0,
+      "completions/max_terminated_length": 1052.0,
+      "completions/mean_length": 939.96875,
+      "completions/mean_terminated_length": 939.96875,
+      "completions/min_length": 286.0,
+      "completions/min_terminated_length": 286.0,
+      "entropy": 0.17989059770479798,
+      "epoch": 4e-05,
       "frac_reward_zero_std": 0.0,
+      "grad_norm": 0.6168491840362549,
       "kl": 0.0,
       "learning_rate": 0.0,
+      "loss": -0.037,
+      "num_tokens": 130829.0,
+      "reward": -0.48928576707839966,
+      "reward_std": 0.16871649026870728,
+      "rewards/rollout_reward_func/mean": -0.48928576707839966,
+      "rewards/rollout_reward_func/std": 0.18516120314598083,
+      "sampling/importance_sampling_ratio/max": 1.2845007181167603,
+      "sampling/importance_sampling_ratio/mean": 0.9977670907974243,
+      "sampling/importance_sampling_ratio/min": 0.6358659267425537,
+      "sampling/sampling_logp_difference/max": 0.452767550945282,
+      "sampling/sampling_logp_difference/mean": 0.012648524716496468,
       "step": 1,
+      "step_time": 24.471392321000167
     }
   ],
   "logging_steps": 1.0,
   "max_steps": 600,
+  "num_input_tokens_seen": 130829,
   "num_train_epochs": 1,
   "save_steps": 500,
   "stateful_callbacks": {

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:679164a463b407a1a65e26213a5a15185afdb00e0f798acff83b9fcfc0a6eea9
 size 8145

 version https://git-lfs.github.com/spec/v1
+oid sha256:62006adb6a5f6ef0ccf535fbf49cda0cd9c458d12dc2ad9e29abaa7fd5f9b059
 size 8145