Model save
Browse files
README.md
CHANGED
@@ -39,14 +39,18 @@ The following hyperparameters were used during training:
|
|
39 |
- train_batch_size: 2
|
40 |
- eval_batch_size: 8
|
41 |
- seed: 42
|
42 |
-
- optimizer:
|
43 |
- lr_scheduler_type: linear
|
44 |
- num_epochs: 3
|
45 |
- mixed_precision_training: Native AMP
|
46 |
|
|
|
|
|
|
|
|
|
47 |
### Framework versions
|
48 |
|
49 |
-
- Transformers 4.
|
50 |
- Pytorch 2.4.0+cu121
|
51 |
- Datasets 3.0.1
|
52 |
- Tokenizers 0.20.1
|
|
|
39 |
- train_batch_size: 2
|
40 |
- eval_batch_size: 8
|
41 |
- seed: 42
|
42 |
+
- optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
|
43 |
- lr_scheduler_type: linear
|
44 |
- num_epochs: 3
|
45 |
- mixed_precision_training: Native AMP
|
46 |
|
47 |
+
### Training results
|
48 |
+
|
49 |
+
|
50 |
+
|
51 |
### Framework versions
|
52 |
|
53 |
+
- Transformers 4.46.0.dev0
|
54 |
- Pytorch 2.4.0+cu121
|
55 |
- Datasets 3.0.1
|
56 |
- Tokenizers 0.20.1
|
generation_config.json
CHANGED
@@ -4,5 +4,5 @@
|
|
4 |
"eos_token_id": 2,
|
5 |
"forced_eos_token_id": 2,
|
6 |
"pad_token_id": 1,
|
7 |
-
"transformers_version": "4.
|
8 |
}
|
|
|
4 |
"eos_token_id": 2,
|
5 |
"forced_eos_token_id": 2,
|
6 |
"pad_token_id": 1,
|
7 |
+
"transformers_version": "4.46.0.dev0"
|
8 |
}
|
runs/Oct22_04-59-01_c71da081ab17/events.out.tfevents.1729573148.c71da081ab17.81.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b5e7ff657319fb1450e8f0094ce6f2d0a67cffd00ccad620de405d4c38e96d7
|
3 |
+
size 11407
|