HiTZ
/

Token Classification
Transformers
Safetensors
bert
Inference Endpoints
anaryegen committed on
Commit
89e71af
·
1 Parent(s): 780a12c

update model

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
- "train_loss": 0.27864328904585406,
4
- "train_runtime": 413.6435,
5
  "train_samples": 17598,
6
- "train_samples_per_second": 127.632,
7
- "train_steps_per_second": 7.978
8
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "train_loss": 0.2811542418508819,
4
+ "train_runtime": 449.7464,
5
  "train_samples": 17598,
6
+ "train_samples_per_second": 117.386,
7
+ "train_steps_per_second": 7.337
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b94a2b7dc1b945a12c97f126d710acab219fcdb45dd98e053089eeb5cb23ba9f
3
  size 709090132
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:548c1d2c4a14d27c96fe8163e38824d2b8d6f48e3a7f00fdae61ccd0e2036514
3
  size 709090132
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
- "train_loss": 0.27864328904585406,
4
- "train_runtime": 413.6435,
5
  "train_samples": 17598,
6
- "train_samples_per_second": 127.632,
7
- "train_steps_per_second": 7.978
8
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "train_loss": 0.2811542418508819,
4
+ "train_runtime": 449.7464,
5
  "train_samples": 17598,
6
+ "train_samples_per_second": 117.386,
7
+ "train_steps_per_second": 7.337
8
  }
trainer_state.json CHANGED
@@ -10,54 +10,54 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.45,
13
- "grad_norm": 3.782728910446167,
14
  "learning_rate": 4.242424242424243e-05,
15
- "loss": 0.532,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.91,
20
- "grad_norm": 3.925285816192627,
21
  "learning_rate": 3.484848484848485e-05,
22
- "loss": 0.4013,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 1.36,
27
- "grad_norm": 7.782624244689941,
28
  "learning_rate": 2.7272727272727273e-05,
29
- "loss": 0.281,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 1.82,
34
- "grad_norm": 3.6547534465789795,
35
  "learning_rate": 1.9696969696969697e-05,
36
- "loss": 0.2454,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 2.27,
41
- "grad_norm": 0.9583206176757812,
42
  "learning_rate": 1.2121212121212122e-05,
43
- "loss": 0.1696,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 2.73,
48
- "grad_norm": 11.225361824035645,
49
  "learning_rate": 4.5454545454545455e-06,
50
- "loss": 0.1393,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 3.0,
55
  "step": 3300,
56
  "total_flos": 2871828253461180.0,
57
- "train_loss": 0.27864328904585406,
58
- "train_runtime": 413.6435,
59
- "train_samples_per_second": 127.632,
60
- "train_steps_per_second": 7.978
61
  }
62
  ],
63
  "logging_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.45,
13
+ "grad_norm": 4.830384254455566,
14
  "learning_rate": 4.242424242424243e-05,
15
+ "loss": 0.5576,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.91,
20
+ "grad_norm": 2.6578476428985596,
21
  "learning_rate": 3.484848484848485e-05,
22
+ "loss": 0.4035,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 1.36,
27
+ "grad_norm": 6.386310577392578,
28
  "learning_rate": 2.7272727272727273e-05,
29
+ "loss": 0.2828,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 1.82,
34
+ "grad_norm": 1.7881163358688354,
35
  "learning_rate": 1.9696969696969697e-05,
36
+ "loss": 0.2468,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 2.27,
41
+ "grad_norm": 2.0737249851226807,
42
  "learning_rate": 1.2121212121212122e-05,
43
+ "loss": 0.1608,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 2.73,
48
+ "grad_norm": 0.20467181503772736,
49
  "learning_rate": 4.5454545454545455e-06,
50
+ "loss": 0.1321,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 3.0,
55
  "step": 3300,
56
  "total_flos": 2871828253461180.0,
57
+ "train_loss": 0.2811542418508819,
58
+ "train_runtime": 449.7464,
59
+ "train_samples_per_second": 117.386,
60
+ "train_steps_per_second": 7.337
61
  }
62
  ],
63
  "logging_steps": 500,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33f26567c9db33a95d0e6f1ccfebacde8b5cba77cf3ea0f0c2923835aa7ee837
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ad5b11cedb8c71b7172a119a539a49b00c9933a10cf45529cf47a37ef6a7c46
3
  size 4984