Training in progress, epoch 2

Files changed (13) hide show

adapter_config.json ADDED Viewed

+{
+  "alpha_pattern": {},
+  "auto_mapping": null,
+  "base_model_name_or_path": "Qwen/Qwen1.5-0.5B",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layer_replication": null,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "loftq_config": {},
+  "lora_alpha": 128,
+  "lora_dropout": 0.05,
+  "megatron_config": null,
+  "megatron_core": "megatron.core",
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "rank_pattern": {},
+  "revision": null,
+  "target_modules": [
+    "v_proj",
+    "q_proj",
+    "k_proj",
+    "gate_proj",
+    "o_proj",
+    "up_proj",
+    "down_proj"
+  ],
+  "task_type": "CAUSAL_LM",
+  "use_dora": false,
+  "use_rslora": false
+}

adapter_model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:75a2aba6d280e6dda56e7f0ea1705194515a20f771cfe630c9a20c94bb8ebb7f
+size 1726772784

added_tokens.json ADDED Viewed

+{
+  "<|endoftext|>": 151643,
+  "<|im_end|>": 151645,
+  "<|im_start|>": 151644
+}

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

runs/Jun06_07-45-29_20aaf702f238/events.out.tfevents.1717660442.20aaf702f238.4083.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:1c4ae326a2fcd3a58c211ace78f9eebffbad86e1918d8c8d866955a91738f3e6
+size 9542

runs/Jun06_07-57-41_20aaf702f238/events.out.tfevents.1717660678.20aaf702f238.4083.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:f4af82d57db03021f06ef2e077554ef517c92587e62786af52f28f2b1f512ae6
+size 4814

runs/Jun06_07-59-49_20aaf702f238/events.out.tfevents.1717660802.20aaf702f238.4083.2 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:595383c5622e5ca9e3c2bf34c006eaabc084d20e220506359635f2f0a7b3e752
+size 4184

runs/Jun06_08-05-22_20aaf702f238/events.out.tfevents.1717661152.20aaf702f238.8982.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:b08d23c4d157ccb07d10e4204ae89a9edd9a4b2ffec40c861a5b9f63e0076df1
+size 9645

special_tokens_map.json ADDED Viewed

+{
+  "additional_special_tokens": [
+    {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    }
+  ],
+  "bos_token": "<|im_start|>",
+  "eos_token": "<|im_end|>",
+  "pad_token": "<|im_end|>"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "151643": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151644": {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151645": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>"
+  ],
+  "bos_token": "<|im_start|>",
+  "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|im_end|>",
+  "errors": "replace",
+  "model_max_length": 32768,
+  "pad_token": "<|im_end|>",
+  "split_special_tokens": false,
+  "tokenizer_class": "Qwen2Tokenizer",
+  "unk_token": null
+}

training_args.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a3701d5e53772d546579ca723f8c472bc43db19e2cecc434e820881ad38f4611
+size 4728

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff