Training in progress, epoch 1

Files changed (8) hide show

config.json CHANGED Viewed

@@ -1,6 +1,5 @@
 {
-  "_name_or_path": "distilbert/distilgpt2",
-  "_num_labels": 1,
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"
@@ -9,6 +8,7 @@
   "bos_token_id": 50256,
   "embd_pdrop": 0.1,
   "eos_token_id": 50256,
   "id2label": {
     "0": "LABEL_0"
   },
@@ -22,7 +22,7 @@
   "n_embd": 768,
   "n_head": 12,
   "n_inner": null,
-  "n_layer": 6,
   "n_positions": 1024,
   "reorder_and_upcast_attn": false,
   "resid_pdrop": 0.1,

 {
+  "_name_or_path": "danghuy1999/gpt2-viwiki",
   "activation_function": "gelu_new",
   "architectures": [
     "GPT2LMHeadModel"
   "bos_token_id": 50256,
   "embd_pdrop": 0.1,
   "eos_token_id": 50256,
+  "gradient_checkpointing": false,
   "id2label": {
     "0": "LABEL_0"
   },
   "n_embd": 768,
   "n_head": 12,
   "n_inner": null,
+  "n_layer": 12,
   "n_positions": 1024,
   "reorder_and_upcast_attn": false,
   "resid_pdrop": 0.1,

merges.txt CHANGED Viewed

The diff for this file is too large to render. See raw diff

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9b7fba3a89b65ee3870f21bac29b8896350b5d55df4808fade5a93bb6e17b8ce
-size 327657928

 version https://git-lfs.github.com/spec/v1
+oid sha256:9a8091262bfd50437b7ed94384a26af05d2a3b1049a1e8a4c3e2d8955bd0579e
+size 497774208

runs/Feb25_14-51-53_6146ee6a12f6/events.out.tfevents.1708872713.6146ee6a12f6.205.7 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:911531e32509a908d0338ba1e12de74530a945884685e4bbfede2dddc8d845a3
+size 4488

runs/Feb25_14-56-54_6146ee6a12f6/events.out.tfevents.1708873015.6146ee6a12f6.18958.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:aba29ab1a1eb0c90b864b80f16d0185484ee3d5d0a0f09ca1e26d1e928f1545f
+size 4184

tokenizer_config.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "add_bos_token": false,
   "add_prefix_space": false,
   "added_tokens_decoder": {
-    "50256": {
       "content": "<|endoftext|>",
       "lstrip": false,
       "normalized": true,
@@ -15,7 +15,7 @@
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|endoftext|>",
   "errors": "replace",
-  "model_max_length": 1024,
   "pad_token": "<|endoftext|>",
   "tokenizer_class": "GPT2Tokenizer",
   "unk_token": "<|endoftext|>"

   "add_bos_token": false,
   "add_prefix_space": false,
   "added_tokens_decoder": {
+    "0": {
       "content": "<|endoftext|>",
       "lstrip": false,
       "normalized": true,
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|endoftext|>",
   "errors": "replace",
+  "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<|endoftext|>",
   "tokenizer_class": "GPT2Tokenizer",
   "unk_token": "<|endoftext|>"

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dcda92f4a204ad67aba73ab29a009870ac26be55110e0a787e8aa0a7b3586783
 size 4600

 version https://git-lfs.github.com/spec/v1
+oid sha256:504d3df164819552907cc38bc6870730e29c517d9d5b43f66c271a40313a1243
 size 4600

vocab.json CHANGED Viewed

The diff for this file is too large to render. See raw diff