model
Browse files
- scripts/model.yaml +2 -1
scripts/model.yaml
CHANGED
@@ -61,7 +61,8 @@ train:
|
|
61 |
global_batch_size: 512
|
62 |
|
63 |
# Number of samples per data-parallel rank (type: int, default: 4)
|
64 |
-
micro_batch_size:
|
|
|
65 |
# micro_batch_size: 14
|
66 |
|
67 |
# Number of iterations with learning rate warmup active (type: int, default: 2000)
|
|
|
61 |
global_batch_size: 512
|
62 |
|
63 |
# Number of samples per data-parallel rank (type: int, default: 4)
|
64 |
+
micro_batch_size: 1
|
65 |
+
# micro_batch_size: 16
|
66 |
# micro_batch_size: 14
|
67 |
|
68 |
# Number of iterations with learning rate warmup active (type: int, default: 2000)
|