sujithatz/finbot-quen2.5-merged_adapter

Browse files

Files changed (11) hide show

.gitattributes +1 -0
README.md +258 -0
adapter_config.json +34 -0
adapter_model.safetensors +3 -0
added_tokens.json +24 -0
merges.txt +0 -0
special_tokens_map.json +19 -0
tokenizer.json +3 -0
tokenizer_config.json +207 -0
training_args.bin +3 -0
vocab.json +0 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

README.md ADDED Viewed

	@@ -0,0 +1,258 @@

+---
+base_model: Qwen/Qwen2.5-0.5B-Instruct
+library_name: peft
+license: apache-2.0
+tags:
+- trl
+- sft
+- generated_from_trainer
+model-index:
+- name: quen_2.5_lora
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# quen_2.5_lora
+This model is a fine-tuned version of [Qwen/Qwen2.5-0.5B-Instruct](https://huggingface.co/Qwen/Qwen2.5-0.5B-Instruct) on an unknown dataset.
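+It achieves the following results on the evaluation set (values from the last logged step, 591):
+- Loss: 0.7650
+- Lowest validation loss during training: 0.5917 at step 222 (epoch 3.0). Validation loss rises after that point while training loss keeps falling, which indicates overfitting in the later epochs.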
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 0.0001
+- train_batch_size: 4
+- eval_batch_size: 4
+- seed: 0
+- optimizer: adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 (no additional optimizer arguments)
+- lr_scheduler_type: cosine
+- lr_scheduler_warmup_ratio: 0.01
+- num_epochs: 8
+### Training results
+| Training Loss | Epoch  | Step | Validation Loss |
+|:-------------:|:------:|:----:|:---------------:|
+| 3.1119        | 0.0405 | 3    | 3.1017          |
+| 2.8734        | 0.0811 | 6    | 2.6094          |
+| 2.4188        | 0.1216 | 9    | 2.1546          |
+| 1.9335        | 0.1622 | 12   | 1.7862          |
+| 1.5361        | 0.2027 | 15   | 1.4732          |
+| 1.314         | 0.2432 | 18   | 1.2791          |
+| 1.1747        | 0.2838 | 21   | 1.1653          |
+| 1.1407        | 0.3243 | 24   | 1.1104          |
+| 1.1734        | 0.3649 | 27   | 1.0887          |
+| 1.0495        | 0.4054 | 30   | 1.0401          |
+| 1.0401        | 0.4459 | 33   | 0.9906          |
+| 1.0623        | 0.4865 | 36   | 0.9594          |
+| 0.8152        | 0.5270 | 39   | 0.9367          |
+| 0.9261        | 0.5676 | 42   | 0.9248          |
+| 0.9469        | 0.6081 | 45   | 0.9135          |
+| 0.8381        | 0.6486 | 48   | 0.8871          |
+| 0.8456        | 0.6892 | 51   | 0.8553          |
+| 0.908         | 0.7297 | 54   | 0.8272          |
+| 0.999         | 0.7703 | 57   | 0.8152          |
+| 0.897         | 0.8108 | 60   | 0.8053          |
+| 0.8747        | 0.8514 | 63   | 0.7915          |
+| 1.0646        | 0.8919 | 66   | 0.7873          |
+| 0.6771        | 0.9324 | 69   | 0.7815          |
+| 0.9386        | 0.9730 | 72   | 0.7635          |
+| 0.6348        | 1.0135 | 75   | 0.7552          |
+| 0.5763        | 1.0541 | 78   | 0.7474          |
+| 0.7059        | 1.0946 | 81   | 0.7431          |
+| 0.6111        | 1.1351 | 84   | 0.7394          |
+| 0.6937        | 1.1757 | 87   | 0.7416          |
+| 0.6408        | 1.2162 | 90   | 0.7332          |
+| 0.5931        | 1.2568 | 93   | 0.7319          |
+| 0.5792        | 1.2973 | 96   | 0.7179          |
+| 0.5502        | 1.3378 | 99   | 0.7083          |
+| 0.7356        | 1.3784 | 102  | 0.7049          |
+| 0.5204        | 1.4189 | 105  | 0.6983          |
+| 0.6132        | 1.4595 | 108  | 0.6858          |
+| 0.7527        | 1.5    | 111  | 0.6744          |
+| 0.6798        | 1.5405 | 114  | 0.6716          |
+| 0.7266        | 1.5811 | 117  | 0.6656          |
+| 0.5347        | 1.6216 | 120  | 0.6711          |
+| 0.6522        | 1.6622 | 123  | 0.6680          |
+| 0.8567        | 1.7027 | 126  | 0.6558          |
+| 0.5204        | 1.7432 | 129  | 0.6488          |
+| 0.6443        | 1.7838 | 132  | 0.6393          |
+| 0.5436        | 1.8243 | 135  | 0.6322          |
+| 0.6054        | 1.8649 | 138  | 0.6346          |
+| 0.4488        | 1.9054 | 141  | 0.6389          |
+| 0.7171        | 1.9459 | 144  | 0.6322          |
+| 0.5383        | 1.9865 | 147  | 0.6273          |
+| 0.4812        | 2.0270 | 150  | 0.6235          |
+| 0.7911        | 2.0676 | 153  | 0.6296          |
+| 0.514         | 2.1081 | 156  | 0.6444          |
+| 0.4481        | 2.1486 | 159  | 0.6453          |
+| 0.3983        | 2.1892 | 162  | 0.6357          |
+| 0.2386        | 2.2297 | 165  | 0.6327          |
+| 0.4447        | 2.2703 | 168  | 0.6359          |
+| 0.4302        | 2.3108 | 171  | 0.6387          |
+| 0.4514        | 2.3514 | 174  | 0.6402          |
+| 0.2813        | 2.3919 | 177  | 0.6313          |
+| 0.4747        | 2.4324 | 180  | 0.6259          |
+| 0.547         | 2.4730 | 183  | 0.6257          |
+| 0.3154        | 2.5135 | 186  | 0.6247          |
+| 0.5583        | 2.5541 | 189  | 0.6130          |
+| 0.5726        | 2.5946 | 192  | 0.6087          |
+| 0.4701        | 2.6351 | 195  | 0.6086          |
+| 0.4866        | 2.6757 | 198  | 0.6133          |
+| 0.4015        | 2.7162 | 201  | 0.6213          |
+| 0.4277        | 2.7568 | 204  | 0.6238          |
+| 0.3157        | 2.7973 | 207  | 0.6249          |
+| 0.3883        | 2.8378 | 210  | 0.6210          |
+| 0.5436        | 2.8784 | 213  | 0.6127          |
+| 0.526         | 2.9189 | 216  | 0.6056          |
+| 0.4465        | 2.9595 | 219  | 0.5982          |
+| 0.3692        | 3.0    | 222  | 0.5917          |
+| 0.3022        | 3.0405 | 225  | 0.5956          |
+| 0.2875        | 3.0811 | 228  | 0.6153          |
+| 0.5544        | 3.1216 | 231  | 0.6343          |
+| 0.4159        | 3.1622 | 234  | 0.6370          |
+| 0.4963        | 3.2027 | 237  | 0.6289          |
+| 0.3248        | 3.2432 | 240  | 0.6190          |
+| 0.349         | 3.2838 | 243  | 0.6111          |
+| 0.3107        | 3.3243 | 246  | 0.6121          |
+| 0.2219        | 3.3649 | 249  | 0.6196          |
+| 0.251         | 3.4054 | 252  | 0.6273          |
+| 0.3366        | 3.4459 | 255  | 0.6259          |
+| 0.3182        | 3.4865 | 258  | 0.6243          |
+| 0.4133        | 3.5270 | 261  | 0.6260          |
+| 0.3297        | 3.5676 | 264  | 0.6303          |
+| 0.2276        | 3.6081 | 267  | 0.6365          |
+| 0.1842        | 3.6486 | 270  | 0.6383          |
+| 0.4961        | 3.6892 | 273  | 0.6314          |
+| 0.3785        | 3.7297 | 276  | 0.6240          |
+| 0.2834        | 3.7703 | 279  | 0.6189          |
+| 0.3397        | 3.8108 | 282  | 0.6139          |
+| 0.2795        | 3.8514 | 285  | 0.6104          |
+| 0.3114        | 3.8919 | 288  | 0.6078          |
+| 0.2395        | 3.9324 | 291  | 0.6111          |
+| 0.1948        | 3.9730 | 294  | 0.6142          |
+| 0.2284        | 4.0135 | 297  | 0.6194          |
+| 0.2638        | 4.0541 | 300  | 0.6303          |
+| 0.252         | 4.0946 | 303  | 0.6517          |
+| 0.183         | 4.1351 | 306  | 0.6645          |
+| 0.2415        | 4.1757 | 309  | 0.6604          |
+| 0.1791        | 4.2162 | 312  | 0.6530          |
+| 0.2013        | 4.2568 | 315  | 0.6489          |
+| 0.1827        | 4.2973 | 318  | 0.6532          |
+| 0.1792        | 4.3378 | 321  | 0.6585          |
+| 0.2568        | 4.3784 | 324  | 0.6628          |
+| 0.1682        | 4.4189 | 327  | 0.6650          |
+| 0.25          | 4.4595 | 330  | 0.6730          |
+| 0.2664        | 4.5    | 333  | 0.6741          |
+| 0.2316        | 4.5405 | 336  | 0.6773          |
+| 0.3467        | 4.5811 | 339  | 0.6705          |
+| 0.2426        | 4.6216 | 342  | 0.6681          |
+| 0.2421        | 4.6622 | 345  | 0.6622          |
+| 0.4063        | 4.7027 | 348  | 0.6609          |
+| 0.2255        | 4.7432 | 351  | 0.6569          |
+| 0.1933        | 4.7838 | 354  | 0.6534          |
+| 0.1975        | 4.8243 | 357  | 0.6497          |
+| 0.3065        | 4.8649 | 360  | 0.6491          |
+| 0.1641        | 4.9054 | 363  | 0.6513          |
+| 0.2032        | 4.9459 | 366  | 0.6553          |
+| 0.1886        | 4.9865 | 369  | 0.6590          |
+| 0.2539        | 5.0270 | 372  | 0.6677          |
+| 0.1464        | 5.0676 | 375  | 0.6879          |
+| 0.2295        | 5.1081 | 378  | 0.7066          |
+| 0.1438        | 5.1486 | 381  | 0.7167          |
+| 0.1603        | 5.1892 | 384  | 0.7135          |
+| 0.1379        | 5.2297 | 387  | 0.7095          |
+| 0.2783        | 5.2703 | 390  | 0.7103          |
+| 0.1575        | 5.3108 | 393  | 0.7042          |
+| 0.1743        | 5.3514 | 396  | 0.7114          |
+| 0.1168        | 5.3919 | 399  | 0.7083          |
+| 0.284         | 5.4324 | 402  | 0.7072          |
+| 0.1013        | 5.4730 | 405  | 0.7063          |
+| 0.2612        | 5.5135 | 408  | 0.7051          |
+| 0.1343        | 5.5541 | 411  | 0.7103          |
+| 0.1009        | 5.5946 | 414  | 0.7105          |
+| 0.3127        | 5.6351 | 417  | 0.7090          |
+| 0.1355        | 5.6757 | 420  | 0.7060          |
+| 0.1345        | 5.7162 | 423  | 0.7057          |
+| 0.1865        | 5.7568 | 426  | 0.7039          |
+| 0.119         | 5.7973 | 429  | 0.7067          |
+| 0.149         | 5.8378 | 432  | 0.7120          |
+| 0.1748        | 5.8784 | 435  | 0.7123          |
+| 0.1781        | 5.9189 | 438  | 0.7113          |
+| 0.2075        | 5.9595 | 441  | 0.7118          |
+| 0.1591        | 6.0    | 444  | 0.7112          |
+| 0.1224        | 6.0405 | 447  | 0.7118          |
+| 0.2234        | 6.0811 | 450  | 0.7171          |
+| 0.1165        | 6.1216 | 453  | 0.7227          |
+| 0.2518        | 6.1622 | 456  | 0.7326          |
+| 0.1288        | 6.2027 | 459  | 0.7431          |
+| 0.1176        | 6.2432 | 462  | 0.7481          |
+| 0.1231        | 6.2838 | 465  | 0.7511          |
+| 0.146         | 6.3243 | 468  | 0.7530          |
+| 0.1169        | 6.3649 | 471  | 0.7518          |
+| 0.1048        | 6.4054 | 474  | 0.7541          |
+| 0.1092        | 6.4459 | 477  | 0.7507          |
+| 0.1458        | 6.4865 | 480  | 0.7518          |
+| 0.2177        | 6.5270 | 483  | 0.7509          |
+| 0.1585        | 6.5676 | 486  | 0.7510          |
+| 0.1337        | 6.6081 | 489  | 0.7546          |
+| 0.122         | 6.6486 | 492  | 0.7524          |
+| 0.0793        | 6.6892 | 495  | 0.7554          |
+| 0.1544        | 6.7297 | 498  | 0.7521          |
+| 0.1387        | 6.7703 | 501  | 0.7529          |
+| 0.1253        | 6.8108 | 504  | 0.7529          |
+| 0.1296        | 6.8514 | 507  | 0.7542          |
+| 0.1094        | 6.8919 | 510  | 0.7516          |
+| 0.1009        | 6.9324 | 513  | 0.7512          |
+| 0.1871        | 6.9730 | 516  | 0.7526          |
+| 0.1017        | 7.0135 | 519  | 0.7538          |
+| 0.1536        | 7.0541 | 522  | 0.7529          |
+| 0.0886        | 7.0946 | 525  | 0.7565          |
+| 0.0983        | 7.1351 | 528  | 0.7576          |
+| 0.084         | 7.1757 | 531  | 0.7586          |
+| 0.099         | 7.2162 | 534  | 0.7564          |
+| 0.1089        | 7.2568 | 537  | 0.7592          |
+| 0.1145        | 7.2973 | 540  | 0.7612          |
+| 0.1823        | 7.3378 | 543  | 0.7615          |
+| 0.2784        | 7.3784 | 546  | 0.7602          |
+| 0.0887        | 7.4189 | 549  | 0.7617          |
+| 0.1133        | 7.4595 | 552  | 0.7640          |
+| 0.1207        | 7.5    | 555  | 0.7630          |
+| 0.0954        | 7.5405 | 558  | 0.7643          |
+| 0.1135        | 7.5811 | 561  | 0.7629          |
+| 0.096         | 7.6216 | 564  | 0.7637          |
+| 0.1088        | 7.6622 | 567  | 0.7655          |
+| 0.1628        | 7.7027 | 570  | 0.7655          |
+| 0.1431        | 7.7432 | 573  | 0.7650          |
+| 0.1034        | 7.7838 | 576  | 0.7639          |
+| 0.181         | 7.8243 | 579  | 0.7637          |
+| 0.062         | 7.8649 | 582  | 0.7649          |
+| 0.0769        | 7.9054 | 585  | 0.7654          |
+| 0.1951        | 7.9459 | 588  | 0.7647          |
+| 0.1175        | 7.9865 | 591  | 0.7650          |
+### Framework versions
+- PEFT 0.13.2
+- Transformers 4.46.0
+- Pytorch 2.4.0
+- Datasets 3.0.2
+- Tokenizers 0.20.0

adapter_config.json ADDED Viewed

	@@ -0,0 +1,34 @@

+{
+  "alpha_pattern": {},
+  "auto_mapping": null,
+  "base_model_name_or_path": "Qwen/Qwen2.5-0.5B-Instruct",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layer_replication": null,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "loftq_config": {},
+  "lora_alpha": 32,
+  "lora_dropout": 0.05,
+  "megatron_config": null,
+  "megatron_core": "megatron.core",
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 16,
+  "rank_pattern": {},
+  "revision": null,
+  "target_modules": [
+    "down_proj",
+    "gate_proj",
+    "o_proj",
+    "up_proj",
+    "q_proj",
+    "v_proj",
+    "k_proj"
+  ],
+  "task_type": "CAUSAL_LM",
+  "use_dora": false,
+  "use_rslora": false
+}

adapter_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2b036d3c4044bc3c7152cfdc35c1edc67b951d0c35baaea7351ca546fb5e6283
+size 35237104

added_tokens.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "</tool_call>": 151658,
+  "<tool_call>": 151657,
+  "<|box_end|>": 151649,
+  "<|box_start|>": 151648,
+  "<|endoftext|>": 151643,
+  "<|file_sep|>": 151664,
+  "<|fim_middle|>": 151660,
+  "<|fim_pad|>": 151662,
+  "<|fim_prefix|>": 151659,
+  "<|fim_suffix|>": 151661,
+  "<|im_end|>": 151645,
+  "<|im_start|>": 151644,
+  "<|image_pad|>": 151655,
+  "<|object_ref_end|>": 151647,
+  "<|object_ref_start|>": 151646,
+  "<|quad_end|>": 151651,
+  "<|quad_start|>": 151650,
+  "<|repo_name|>": 151663,
+  "<|video_pad|>": 151656,
+  "<|vision_end|>": 151653,
+  "<|vision_pad|>": 151654,
+  "<|vision_start|>": 151652
+}

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,19 @@

+{
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>",
+    "<|object_ref_start|>",
+    "<|object_ref_end|>",
+    "<|box_start|>",
+    "<|box_end|>",
+    "<|quad_start|>",
+    "<|quad_end|>",
+    "<|vision_start|>",
+    "<|vision_end|>",
+    "<|vision_pad|>",
+    "<|image_pad|>",
+    "<|video_pad|>"
+  ],
+  "eos_token": "<|endoftext|>",
+  "pad_token": "<|endoftext|>"
+}

tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3511c9b326fec6a1b23dbf63767a672c911fbee5b2145ad0099a5bd8aff458b5
+size 11421994

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,207 @@

+{
+  "add_bos_token": false,
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "151643": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151644": {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151645": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151646": {
+      "content": "<|object_ref_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151647": {
+      "content": "<|object_ref_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151648": {
+      "content": "<|box_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151649": {
+      "content": "<|box_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151650": {
+      "content": "<|quad_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151651": {
+      "content": "<|quad_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151652": {
+      "content": "<|vision_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151653": {
+      "content": "<|vision_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151654": {
+      "content": "<|vision_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151655": {
+      "content": "<|image_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151656": {
+      "content": "<|video_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151657": {
+      "content": "<tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151658": {
+      "content": "</tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151659": {
+      "content": "<|fim_prefix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151660": {
+      "content": "<|fim_middle|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151661": {
+      "content": "<|fim_suffix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151662": {
+      "content": "<|fim_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151663": {
+      "content": "<|repo_name|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151664": {
+      "content": "<|file_sep|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    }
+  },
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>",
+    "<|object_ref_start|>",
+    "<|object_ref_end|>",
+    "<|box_start|>",
+    "<|box_end|>",
+    "<|quad_start|>",
+    "<|quad_end|>",
+    "<|vision_start|>",
+    "<|vision_end|>",
+    "<|vision_pad|>",
+    "<|image_pad|>",
+    "<|video_pad|>"
+  ],
+  "bos_token": null,
+  "chat_template": "{%- if tools %}\n    {{- '<|im_start|>system\\n' }}\n    {%- if messages[0]['role'] == 'system' %}\n        {{- messages[0]['content'] }}\n    {%- else %}\n        {{- 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.' }}\n    {%- endif %}\n    {{- \"\\n\\n# Tools\\n\\nYou may call one or more functions to assist with the user query.\\n\\nYou are provided with function signatures within <tools></tools> XML tags:\\n<tools>\" }}\n    {%- for tool in tools %}\n        {{- \"\\n\" }}\n        {{- tool | tojson }}\n    {%- endfor %}\n    {{- \"\\n</tools>\\n\\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\\n<tool_call>\\n{\\\"name\\\": <function-name>, \\\"arguments\\\": <args-json-object>}\\n</tool_call><|im_end|>\\n\" }}\n{%- else %}\n    {%- if messages[0]['role'] == 'system' %}\n        {{- '<|im_start|>system\\n' + messages[0]['content'] + '<|im_end|>\\n' }}\n    {%- else %}\n        {{- '<|im_start|>system\\nYou are Qwen, created by Alibaba Cloud. You are a helpful assistant.<|im_end|>\\n' }}\n    {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n    {%- if (message.role == \"user\") or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and not message.tool_calls) %}\n        {{- '<|im_start|>' + message.role + '\\n' + message.content + '<|im_end|>' + '\\n' }}\n    {%- elif message.role == \"assistant\" %}\n        {{- '<|im_start|>' + message.role }}\n        {%- if message.content %}\n            {{- '\\n' + message.content }}\n        {%- endif %}\n        {%- for tool_call in message.tool_calls %}\n            {%- if tool_call.function is defined %}\n                {%- set tool_call = tool_call.function %}\n            {%- endif %}\n            {{- '\\n<tool_call>\\n{\"name\": \"' }}\n            {{- tool_call.name }}\n            {{- '\", \"arguments\": ' }}\n            {{- tool_call.arguments | tojson }}\n            {{- '}\\n</tool_call>' }}\n        {%- endfor %}\n        {{- '<|im_end|>\\n' }}\n    {%- elif message.role == \"tool\" %}\n        {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != \"tool\") %}\n            {{- '<|im_start|>user' }}\n        {%- endif %}\n        {{- '\\n<tool_response>\\n' }}\n        {{- message.content }}\n        {{- '\\n</tool_response>' }}\n        {%- if loop.last or (messages[loop.index0 + 1].role != \"tool\") %}\n            {{- '<|im_end|>\\n' }}\n        {%- endif %}\n    {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n    {{- '<|im_start|>assistant\\n' }}\n{%- endif %}\n",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|endoftext|>",
+  "errors": "replace",
+  "model_max_length": 300,
+  "pad_token": "<|endoftext|>",
+  "split_special_tokens": false,
+  "tokenizer_class": "Qwen2Tokenizer",
+  "unk_token": null
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a5d717faee84e567649c08b8e6fc776fbd52823ae864a482fe19d98642a27aca
+size 5496

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff