diff --git "a/logs/44k/diffusion/log_info.txt" "b/logs/44k/diffusion/log_info.txt" --- "a/logs/44k/diffusion/log_info.txt" +++ "b/logs/44k/diffusion/log_info.txt" @@ -2,118 +2,3307 @@ model: 55,192,704 ======= start training ======= epoch|batch_idx/num_batches|output_dir|batch/s|lr|time|step -epoch: 0 | 9/ 47 | logs/44k/diffusion | batch/s: 2.01 | lr: 0.0002 | loss: 0.996 | time: 0:00:05.2 | step: 10 -epoch: 0 | 19/ 47 | logs/44k/diffusion | batch/s: 2.06 | lr: 0.0002 | loss: 0.981 | time: 0:00:10.1 | step: 20 -epoch: 0 | 29/ 47 | logs/44k/diffusion | batch/s: 2.04 | lr: 0.0002 | loss: 0.944 | time: 0:00:15.0 | step: 30 -epoch: 0 | 39/ 47 | logs/44k/diffusion | batch/s: 1.99 | lr: 0.0002 | loss: 0.908 | time: 0:00:20.0 | step: 40 -epoch: 1 | 2/ 47 | logs/44k/diffusion | batch/s: 2.03 | lr: 0.0002 | loss: 0.874 | time: 0:00:24.9 | step: 50 -epoch: 1 | 12/ 47 | logs/44k/diffusion | batch/s: 2.00 | lr: 0.0002 | loss: 0.828 | time: 0:00:30.0 | step: 60 -epoch: 1 | 22/ 47 | logs/44k/diffusion | batch/s: 1.98 | lr: 0.0002 | loss: 0.781 | time: 0:00:35.0 | step: 70 -epoch: 1 | 32/ 47 | logs/44k/diffusion | batch/s: 1.95 | lr: 0.0002 | loss: 0.760 | time: 0:00:40.1 | step: 80 -epoch: 1 | 42/ 47 | logs/44k/diffusion | batch/s: 1.88 | lr: 0.0002 | loss: 0.737 | time: 0:00:45.5 | step: 90 -epoch: 2 | 5/ 47 | logs/44k/diffusion | batch/s: 1.92 | lr: 0.0002 | loss: 0.711 | time: 0:00:50.7 | step: 100 -epoch: 2 | 15/ 47 | logs/44k/diffusion | batch/s: 1.84 | lr: 0.0002 | loss: 0.692 | time: 0:00:56.2 | step: 110 -epoch: 2 | 25/ 47 | logs/44k/diffusion | batch/s: 1.91 | lr: 0.0002 | loss: 0.643 | time: 0:01:01.4 | step: 120 -epoch: 2 | 35/ 47 | logs/44k/diffusion | batch/s: 1.94 | lr: 0.0002 | loss: 0.626 | time: 0:01:06.5 | step: 130 -epoch: 2 | 45/ 47 | logs/44k/diffusion | batch/s: 1.96 | lr: 0.0002 | loss: 0.621 | time: 0:01:11.6 | step: 140 -epoch: 3 | 8/ 47 | logs/44k/diffusion | batch/s: 2.04 | lr: 0.0002 | loss: 0.582 | time: 0:01:16.5 | step: 150 -epoch: 3 | 18/ 47 | logs/44k/diffusion | batch/s: 1.95 | lr: 0.0002 | loss: 0.550 | time: 0:01:21.7 | step: 160 -epoch: 3 | 28/ 47 | logs/44k/diffusion | batch/s: 1.95 | lr: 0.0002 | loss: 0.539 | time: 0:01:26.8 | step: 170 -epoch: 3 | 38/ 47 | logs/44k/diffusion | batch/s: 1.82 | lr: 0.0002 | loss: 0.521 | time: 0:01:32.3 | step: 180 -epoch: 4 | 1/ 47 | logs/44k/diffusion | batch/s: 1.86 | lr: 0.0002 | loss: 0.508 | time: 0:01:37.7 | step: 190 -epoch: 4 | 11/ 47 | logs/44k/diffusion | batch/s: 1.84 | lr: 0.0002 | loss: 0.516 | time: 0:01:43.1 | step: 200 -epoch: 4 | 21/ 47 | logs/44k/diffusion | batch/s: 1.85 | lr: 0.0002 | loss: 0.512 | time: 0:01:48.6 | step: 210 -epoch: 4 | 31/ 47 | logs/44k/diffusion | batch/s: 1.73 | lr: 0.0002 | loss: 0.463 | time: 0:01:54.3 | step: 220 -epoch: 4 | 41/ 47 | logs/44k/diffusion | batch/s: 1.84 | lr: 0.0002 | loss: 0.447 | time: 0:01:59.7 | step: 230 -epoch: 5 | 4/ 47 | logs/44k/diffusion | batch/s: 1.83 | lr: 0.0002 | loss: 0.446 | time: 0:02:05.2 | step: 240 -epoch: 5 | 14/ 47 | logs/44k/diffusion | batch/s: 1.83 | lr: 0.0002 | loss: 0.417 | time: 0:02:10.7 | step: 250 -epoch: 5 | 24/ 47 | logs/44k/diffusion | batch/s: 1.84 | lr: 0.0002 | loss: 0.388 | time: 0:02:16.1 | step: 260 -epoch: 5 | 34/ 47 | logs/44k/diffusion | batch/s: 1.83 | lr: 0.0002 | loss: 0.396 | time: 0:02:21.6 | step: 270 -epoch: 5 | 44/ 47 | logs/44k/diffusion | batch/s: 1.85 | lr: 0.0002 | loss: 0.391 | time: 0:02:27.0 | step: 280 -epoch: 6 | 7/ 47 | logs/44k/diffusion | batch/s: 1.91 | lr: 0.0002 | loss: 0.385 | time: 0:02:32.2 | step: 290 -epoch: 6 | 17/ 47 | logs/44k/diffusion | batch/s: 1.81 | lr: 0.0002 | loss: 0.365 | time: 0:02:37.7 | step: 300 -epoch: 6 | 27/ 47 | logs/44k/diffusion | batch/s: 1.83 | lr: 0.0002 | loss: 0.372 | time: 0:02:43.2 | step: 310 -epoch: 6 | 37/ 47 | logs/44k/diffusion | batch/s: 1.81 | lr: 0.0002 | loss: 0.361 | time: 0:02:48.7 | step: 320 -epoch: 7 | 0/ 47 | logs/44k/diffusion | batch/s: 1.91 | lr: 0.0002 | loss: 0.335 | time: 0:02:53.9 | step: 330 -epoch: 7 | 10/ 47 | logs/44k/diffusion | batch/s: 1.82 | lr: 0.0002 | loss: 0.329 | time: 0:02:59.4 | step: 340 -epoch: 7 | 20/ 47 | logs/44k/diffusion | batch/s: 1.82 | lr: 0.0002 | loss: 0.343 | time: 0:03:04.9 | step: 350 -epoch: 7 | 30/ 47 | logs/44k/diffusion | batch/s: 1.75 | lr: 0.0002 | loss: 0.309 | time: 0:03:10.7 | step: 360 -epoch: 7 | 40/ 47 | logs/44k/diffusion | batch/s: 1.80 | lr: 0.0002 | loss: 0.334 | time: 0:03:16.2 | step: 370 -epoch: 8 | 3/ 47 | logs/44k/diffusion | batch/s: 1.91 | lr: 0.0002 | loss: 0.280 | time: 0:03:21.5 | step: 380 -epoch: 8 | 13/ 47 | logs/44k/diffusion | batch/s: 1.86 | lr: 0.0002 | loss: 0.281 | time: 0:03:26.8 | step: 390 -epoch: 8 | 23/ 47 | logs/44k/diffusion | batch/s: 1.82 | lr: 0.0002 | loss: 0.293 | time: 0:03:32.3 | step: 400 -epoch: 8 | 33/ 47 | logs/44k/diffusion | batch/s: 1.78 | lr: 0.0002 | loss: 0.266 | time: 0:03:38.0 | step: 410 -epoch: 8 | 43/ 47 | logs/44k/diffusion | batch/s: 1.83 | lr: 0.0002 | loss: 0.262 | time: 0:03:43.4 | step: 420 -epoch: 9 | 6/ 47 | logs/44k/diffusion | batch/s: 1.92 | lr: 0.0002 | loss: 0.256 | time: 0:03:48.6 | step: 430 -epoch: 9 | 16/ 47 | logs/44k/diffusion | batch/s: 1.84 | lr: 0.0002 | loss: 0.247 | time: 0:03:54.1 | step: 440 -epoch: 9 | 26/ 47 | logs/44k/diffusion | batch/s: 1.84 | lr: 0.0002 | loss: 0.253 | time: 0:03:59.5 | step: 450 -epoch: 9 | 36/ 47 | logs/44k/diffusion | batch/s: 1.82 | lr: 0.0002 | loss: 0.236 | time: 0:04:05.0 | step: 460 -epoch: 9 | 46/ 47 | logs/44k/diffusion | batch/s: 1.83 | lr: 0.0002 | loss: 0.239 | time: 0:04:10.3 | step: 470 -epoch: 10 | 9/ 47 | logs/44k/diffusion | batch/s: 1.87 | lr: 0.0002 | loss: 0.211 | time: 0:04:15.8 | step: 480 -epoch: 10 | 19/ 47 | logs/44k/diffusion | batch/s: 1.87 | lr: 0.0002 | loss: 0.219 | time: 0:04:21.2 | step: 490 -epoch: 10 | 29/ 47 | logs/44k/diffusion | batch/s: 1.83 | lr: 0.0002 | loss: 0.244 | time: 0:04:26.6 | step: 500 -epoch: 10 | 39/ 47 | logs/44k/diffusion | batch/s: 1.81 | lr: 0.0002 | loss: 0.192 | time: 0:04:32.2 | step: 510 -epoch: 11 | 2/ 47 | logs/44k/diffusion | batch/s: 1.80 | lr: 0.0002 | loss: 0.203 | time: 0:04:37.7 | step: 520 -epoch: 11 | 12/ 47 | logs/44k/diffusion | batch/s: 1.83 | lr: 0.0002 | loss: 0.195 | time: 0:04:43.2 | step: 530 -epoch: 11 | 22/ 47 | logs/44k/diffusion | batch/s: 1.77 | lr: 0.0002 | loss: 0.205 | time: 0:04:48.8 | step: 540 -epoch: 11 | 32/ 47 | logs/44k/diffusion | batch/s: 1.77 | lr: 0.0002 | loss: 0.203 | time: 0:04:54.5 | step: 550 -epoch: 11 | 42/ 47 | logs/44k/diffusion | batch/s: 1.88 | lr: 0.0002 | loss: 0.192 | time: 0:04:59.7 | step: 560 -epoch: 12 | 5/ 47 | logs/44k/diffusion | batch/s: 2.05 | lr: 0.0002 | loss: 0.180 | time: 0:05:04.6 | step: 570 -epoch: 12 | 15/ 47 | logs/44k/diffusion | batch/s: 1.97 | lr: 0.0002 | loss: 0.183 | time: 0:05:09.7 | step: 580 -epoch: 12 | 25/ 47 | logs/44k/diffusion | batch/s: 1.87 | lr: 0.0002 | loss: 0.178 | time: 0:05:15.1 | step: 590 -epoch: 12 | 35/ 47 | logs/44k/diffusion | batch/s: 2.02 | lr: 0.0002 | loss: 0.179 | time: 0:05:20.0 | step: 600 -epoch: 12 | 45/ 47 | logs/44k/diffusion | batch/s: 2.02 | lr: 0.0002 | loss: 0.161 | time: 0:05:25.0 | step: 610 -epoch: 13 | 8/ 47 | logs/44k/diffusion | batch/s: 2.08 | lr: 0.0002 | loss: 0.148 | time: 0:05:29.8 | step: 620 -epoch: 13 | 18/ 47 | logs/44k/diffusion | batch/s: 2.02 | lr: 0.0002 | loss: 0.167 | time: 0:05:34.7 | step: 630 -epoch: 13 | 28/ 47 | logs/44k/diffusion | batch/s: 2.01 | lr: 0.0002 | loss: 0.173 | time: 0:05:39.7 | step: 640 -epoch: 13 | 38/ 47 | logs/44k/diffusion | batch/s: 2.03 | lr: 0.0002 | loss: 0.157 | time: 0:05:44.6 | step: 650 -epoch: 14 | 1/ 47 | logs/44k/diffusion | batch/s: 2.10 | lr: 0.0002 | loss: 0.152 | time: 0:05:49.4 | step: 660 -epoch: 14 | 11/ 47 | logs/44k/diffusion | batch/s: 2.02 | lr: 0.0002 | loss: 0.138 | time: 0:05:54.3 | step: 670 -epoch: 14 | 21/ 47 | logs/44k/diffusion | batch/s: 2.00 | lr: 0.0002 | loss: 0.129 | time: 0:05:59.4 | step: 680 -epoch: 14 | 31/ 47 | logs/44k/diffusion | batch/s: 1.93 | lr: 0.0002 | loss: 0.134 | time: 0:06:04.5 | step: 690 -epoch: 14 | 41/ 47 | logs/44k/diffusion | batch/s: 1.99 | lr: 0.0002 | loss: 0.132 | time: 0:06:09.6 | step: 700 -epoch: 15 | 4/ 47 | logs/44k/diffusion | batch/s: 2.08 | lr: 0.0002 | loss: 0.154 | time: 0:06:14.4 | step: 710 -epoch: 15 | 14/ 47 | logs/44k/diffusion | batch/s: 1.98 | lr: 0.0002 | loss: 0.162 | time: 0:06:19.5 | step: 720 -epoch: 15 | 24/ 47 | logs/44k/diffusion | batch/s: 1.83 | lr: 0.0002 | loss: 0.125 | time: 0:06:24.9 | step: 730 -epoch: 15 | 34/ 47 | logs/44k/diffusion | batch/s: 1.96 | lr: 0.0002 | loss: 0.130 | time: 0:06:30.0 | step: 740 -epoch: 15 | 44/ 47 | logs/44k/diffusion | batch/s: 1.94 | lr: 0.0002 | loss: 0.116 | time: 0:06:35.2 | step: 750 -epoch: 16 | 7/ 47 | logs/44k/diffusion | batch/s: 2.03 | lr: 0.0002 | loss: 0.130 | time: 0:06:40.1 | step: 760 -epoch: 16 | 17/ 47 | logs/44k/diffusion | batch/s: 1.96 | lr: 0.0002 | loss: 0.117 | time: 0:06:45.2 | step: 770 -epoch: 16 | 27/ 47 | logs/44k/diffusion | batch/s: 1.92 | lr: 0.0002 | loss: 0.124 | time: 0:06:50.4 | step: 780 -epoch: 16 | 37/ 47 | logs/44k/diffusion | batch/s: 1.94 | lr: 0.0002 | loss: 0.122 | time: 0:06:55.5 | step: 790 -epoch: 17 | 0/ 47 | logs/44k/diffusion | batch/s: 2.05 | lr: 0.0002 | loss: 0.100 | time: 0:07:00.4 | step: 800 -epoch: 17 | 10/ 47 | logs/44k/diffusion | batch/s: 1.95 | lr: 0.0002 | loss: 0.106 | time: 0:07:05.5 | step: 810 -epoch: 17 | 20/ 47 | logs/44k/diffusion | batch/s: 1.93 | lr: 0.0002 | loss: 0.093 | time: 0:07:10.7 | step: 820 -epoch: 17 | 30/ 47 | logs/44k/diffusion | batch/s: 1.90 | lr: 0.0002 | loss: 0.117 | time: 0:07:16.0 | step: 830 -epoch: 17 | 40/ 47 | logs/44k/diffusion | batch/s: 1.95 | lr: 0.0002 | loss: 0.125 | time: 0:07:21.1 | step: 840 -epoch: 18 | 3/ 47 | logs/44k/diffusion | batch/s: 1.99 | lr: 0.0002 | loss: 0.101 | time: 0:07:26.1 | step: 850 -epoch: 18 | 13/ 47 | logs/44k/diffusion | batch/s: 1.93 | lr: 0.0002 | loss: 0.102 | time: 0:07:31.3 | step: 860 -epoch: 18 | 23/ 47 | logs/44k/diffusion | batch/s: 1.94 | lr: 0.0002 | loss: 0.110 | time: 0:07:36.4 | step: 870 -epoch: 18 | 33/ 47 | logs/44k/diffusion | batch/s: 1.86 | lr: 0.0002 | loss: 0.115 | time: 0:07:41.8 | step: 880 +epoch: 0 | 9/ 47 | logs/44k/diffusion | batch/s: 0.69 | lr: 0.0002 | loss: 0.040 | time: 0:00:15.1 | step: 10 +epoch: 0 | 19/ 47 | logs/44k/diffusion | batch/s: 1.22 | lr: 0.0002 | loss: 0.018 | time: 0:00:23.3 | step: 20 +epoch: 0 | 29/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.028 | time: 0:00:31.5 | step: 30 +epoch: 0 | 39/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.025 | time: 0:00:39.9 | step: 40 +epoch: 1 | 2/ 47 | logs/44k/diffusion | batch/s: 1.24 | lr: 0.0002 | loss: 0.007 | time: 0:00:48.0 | step: 50 +epoch: 1 | 12/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.014 | time: 0:00:56.5 | step: 60 +epoch: 1 | 22/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.023 | time: 0:01:05.1 | step: 70 +epoch: 1 | 32/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.029 | time: 0:01:13.7 | step: 80 +epoch: 1 | 42/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.025 | time: 0:01:22.5 | step: 90 +epoch: 2 | 5/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.013 | time: 0:01:30.9 | step: 100 +epoch: 2 | 15/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 0:01:39.8 | step: 110 +epoch: 2 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:01:48.9 | step: 120 +epoch: 2 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.039 | time: 0:01:57.9 | step: 130 +epoch: 2 | 45/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:02:06.8 | step: 140 +epoch: 3 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.011 | time: 0:02:15.1 | step: 150 +epoch: 3 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.034 | time: 0:02:23.9 | step: 160 +epoch: 3 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 0:02:32.7 | step: 170 +epoch: 3 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:02:41.5 | step: 180 +epoch: 4 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.028 | time: 0:02:49.9 | step: 190 +epoch: 4 | 11/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 0:02:58.8 | step: 200 +epoch: 4 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:03:07.7 | step: 210 +epoch: 4 | 31/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.014 | time: 0:03:16.5 | step: 220 +epoch: 4 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.031 | time: 0:03:25.4 | step: 230 +epoch: 5 | 4/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.014 | time: 0:03:33.8 | step: 240 +epoch: 5 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.043 | time: 0:03:42.7 | step: 250 +epoch: 5 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:03:51.5 | step: 260 +epoch: 5 | 34/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.020 | time: 0:04:00.4 | step: 270 +epoch: 5 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 0:04:09.3 | step: 280 +epoch: 6 | 7/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.024 | time: 0:04:17.7 | step: 290 +epoch: 6 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 0:04:26.6 | step: 300 +epoch: 6 | 27/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.041 | time: 0:04:35.4 | step: 310 +epoch: 6 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.024 | time: 0:04:44.3 | step: 320 +epoch: 7 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.017 | time: 0:04:52.8 | step: 330 +epoch: 7 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 0:05:01.7 | step: 340 +epoch: 7 | 20/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.049 | time: 0:05:10.5 | step: 350 +epoch: 7 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:05:19.4 | step: 360 +epoch: 7 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 0:05:28.3 | step: 370 +epoch: 8 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.019 | time: 0:05:36.7 | step: 380 +epoch: 8 | 13/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.017 | time: 0:05:45.6 | step: 390 +epoch: 8 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:05:54.5 | step: 400 +epoch: 8 | 33/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.034 | time: 0:06:03.4 | step: 410 +epoch: 8 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 0:06:12.3 | step: 420 +epoch: 9 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.027 | time: 0:06:20.7 | step: 430 +epoch: 9 | 16/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.026 | time: 0:06:29.6 | step: 440 +epoch: 9 | 26/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:06:38.5 | step: 450 +epoch: 9 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:06:47.4 | step: 460 +epoch: 9 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:06:55.8 | step: 470 +epoch: 10 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.042 | time: 0:07:04.7 | step: 480 +epoch: 10 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 0:07:13.6 | step: 490 +epoch: 10 | 29/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.034 | time: 0:07:22.4 | step: 500 +epoch: 10 | 39/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 0:07:31.3 | step: 510 +epoch: 11 | 2/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.017 | time: 0:07:39.7 | step: 520 +epoch: 11 | 12/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:07:48.6 | step: 530 +epoch: 11 | 22/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.005 | time: 0:07:57.4 | step: 540 +epoch: 11 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.020 | time: 0:08:06.3 | step: 550 +epoch: 11 | 42/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.013 | time: 0:08:15.2 | step: 560 +epoch: 12 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.022 | time: 0:08:23.7 | step: 570 +epoch: 12 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.006 | time: 0:08:32.6 | step: 580 +epoch: 12 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.058 | time: 0:08:41.4 | step: 590 +epoch: 12 | 35/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 0:08:50.3 | step: 600 +epoch: 12 | 45/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 0:08:59.2 | step: 610 +epoch: 13 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.025 | time: 0:09:07.6 | step: 620 +epoch: 13 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.031 | time: 0:09:16.4 | step: 630 +epoch: 13 | 28/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:09:25.3 | step: 640 +epoch: 13 | 38/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:09:34.2 | step: 650 +epoch: 14 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.028 | time: 0:09:42.6 | step: 660 +epoch: 14 | 11/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 0:09:51.5 | step: 670 +epoch: 14 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 0:10:00.4 | step: 680 +epoch: 14 | 31/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:10:09.3 | step: 690 +epoch: 14 | 41/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 0:10:18.2 | step: 700 +epoch: 15 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.013 | time: 0:10:26.6 | step: 710 +epoch: 15 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.038 | time: 0:10:35.5 | step: 720 +epoch: 15 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.029 | time: 0:10:44.4 | step: 730 +epoch: 15 | 34/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.025 | time: 0:10:53.2 | step: 740 +epoch: 15 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 0:11:02.1 | step: 750 +epoch: 16 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.017 | time: 0:11:10.5 | step: 760 +epoch: 16 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 0:11:19.4 | step: 770 +epoch: 16 | 27/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 0:11:28.3 | step: 780 +epoch: 16 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 0:11:37.2 | step: 790 +epoch: 17 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.011 | time: 0:11:45.7 | step: 800 +epoch: 17 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:11:54.5 | step: 810 +epoch: 17 | 20/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.032 | time: 0:12:03.4 | step: 820 +epoch: 17 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:12:12.3 | step: 830 +epoch: 17 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 0:12:21.2 | step: 840 +epoch: 18 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.019 | time: 0:12:29.6 | step: 850 +epoch: 18 | 13/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.039 | time: 0:12:38.5 | step: 860 +epoch: 18 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:12:47.4 | step: 870 +epoch: 18 | 33/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.050 | time: 0:12:56.3 | step: 880 +epoch: 18 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:13:05.2 | step: 890 +epoch: 19 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.031 | time: 0:13:13.6 | step: 900 +epoch: 19 | 16/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.019 | time: 0:13:22.5 | step: 910 +epoch: 19 | 26/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.054 | time: 0:13:31.4 | step: 920 +epoch: 19 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:13:40.3 | step: 930 +epoch: 19 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:13:48.7 | step: 940 +epoch: 20 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.026 | time: 0:13:57.7 | step: 950 +epoch: 20 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 0:14:06.6 | step: 960 +epoch: 20 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.044 | time: 0:14:15.4 | step: 970 +epoch: 20 | 39/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 0:14:24.3 | step: 980 +epoch: 21 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.026 | time: 0:14:32.8 | step: 990 +epoch: 21 | 12/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.030 | time: 0:14:41.7 | step: 1000 +epoch: 21 | 22/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 0:14:50.5 | step: 1010 +epoch: 21 | 32/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.025 | time: 0:14:59.5 | step: 1020 +epoch: 21 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.037 | time: 0:15:08.3 | step: 1030 +epoch: 22 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.023 | time: 0:15:16.8 | step: 1040 +epoch: 22 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:15:25.7 | step: 1050 +epoch: 22 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.022 | time: 0:15:34.5 | step: 1060 +epoch: 22 | 35/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.008 | time: 0:15:43.4 | step: 1070 +epoch: 22 | 45/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:15:52.3 | step: 1080 +epoch: 23 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.025 | time: 0:16:00.7 | step: 1090 +epoch: 23 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:16:09.6 | step: 1100 +epoch: 23 | 28/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 0:16:18.4 | step: 1110 +epoch: 23 | 38/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 0:16:27.3 | step: 1120 +epoch: 24 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.018 | time: 0:16:35.7 | step: 1130 +epoch: 24 | 11/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.020 | time: 0:16:44.6 | step: 1140 +epoch: 24 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 0:16:53.4 | step: 1150 +epoch: 24 | 31/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.029 | time: 0:17:02.3 | step: 1160 +epoch: 24 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 0:17:11.2 | step: 1170 +epoch: 25 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.032 | time: 0:17:19.6 | step: 1180 +epoch: 25 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.024 | time: 0:17:28.5 | step: 1190 +epoch: 25 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 0:17:37.4 | step: 1200 +epoch: 25 | 34/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 0:17:46.3 | step: 1210 +epoch: 25 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 0:17:55.1 | step: 1220 +epoch: 26 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.028 | time: 0:18:03.6 | step: 1230 +epoch: 26 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.039 | time: 0:18:12.5 | step: 1240 +epoch: 26 | 27/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.028 | time: 0:18:21.4 | step: 1250 +epoch: 26 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 0:18:30.2 | step: 1260 +epoch: 27 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.036 | time: 0:18:38.7 | step: 1270 +epoch: 27 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 0:18:47.6 | step: 1280 +epoch: 27 | 20/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 0:18:56.5 | step: 1290 +epoch: 27 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.029 | time: 0:19:05.3 | step: 1300 +epoch: 27 | 40/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.049 | time: 0:19:14.2 | step: 1310 +epoch: 28 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.122 | time: 0:19:22.7 | step: 1320 +epoch: 28 | 13/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.036 | time: 0:19:31.6 | step: 1330 +epoch: 28 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.043 | time: 0:19:40.4 | step: 1340 +epoch: 28 | 33/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.035 | time: 0:19:49.3 | step: 1350 +epoch: 28 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.079 | time: 0:19:58.2 | step: 1360 +epoch: 29 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.024 | time: 0:20:06.7 | step: 1370 +epoch: 29 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.039 | time: 0:20:15.6 | step: 1380 +epoch: 29 | 26/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:20:24.4 | step: 1390 +epoch: 29 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:20:33.3 | step: 1400 +epoch: 29 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 0:20:41.7 | step: 1410 +epoch: 30 | 9/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.014 | time: 0:20:50.7 | step: 1420 +epoch: 30 | 19/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.025 | time: 0:20:59.6 | step: 1430 +epoch: 30 | 29/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.042 | time: 0:21:08.5 | step: 1440 +epoch: 30 | 39/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.026 | time: 0:21:17.4 | step: 1450 +epoch: 31 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.025 | time: 0:21:25.9 | step: 1460 +epoch: 31 | 12/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:21:34.7 | step: 1470 +epoch: 31 | 22/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 0:21:43.6 | step: 1480 +epoch: 31 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 0:21:52.5 | step: 1490 +epoch: 31 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 0:22:01.4 | step: 1500 +epoch: 32 | 5/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.009 | time: 0:22:09.8 | step: 1510 +epoch: 32 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:22:18.7 | step: 1520 +epoch: 32 | 25/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 0:22:27.5 | step: 1530 +epoch: 32 | 35/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.037 | time: 0:22:36.4 | step: 1540 +epoch: 32 | 45/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:22:45.2 | step: 1550 +epoch: 33 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.010 | time: 0:22:53.6 | step: 1560 +epoch: 33 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.039 | time: 0:23:02.5 | step: 1570 +epoch: 33 | 28/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.005 | time: 0:23:11.3 | step: 1580 +epoch: 33 | 38/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.024 | time: 0:23:20.2 | step: 1590 +epoch: 34 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.047 | time: 0:23:28.6 | step: 1600 +epoch: 34 | 11/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 0:23:37.4 | step: 1610 +epoch: 34 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 0:23:46.3 | step: 1620 +epoch: 34 | 31/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 0:23:55.1 | step: 1630 +epoch: 34 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:24:04.0 | step: 1640 +epoch: 35 | 4/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.027 | time: 0:24:12.4 | step: 1650 +epoch: 35 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.017 | time: 0:24:21.3 | step: 1660 +epoch: 35 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 0:24:30.1 | step: 1670 +epoch: 35 | 34/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 0:24:39.0 | step: 1680 +epoch: 35 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 0:24:47.9 | step: 1690 +epoch: 36 | 7/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.006 | time: 0:24:56.3 | step: 1700 +epoch: 36 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.017 | time: 0:25:05.2 | step: 1710 +epoch: 36 | 27/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.025 | time: 0:25:14.0 | step: 1720 +epoch: 36 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.036 | time: 0:25:22.9 | step: 1730 +epoch: 37 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.040 | time: 0:25:31.3 | step: 1740 +epoch: 37 | 10/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.035 | time: 0:25:40.2 | step: 1750 +epoch: 37 | 20/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 0:25:49.1 | step: 1760 +epoch: 37 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:25:58.0 | step: 1770 +epoch: 37 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.027 | time: 0:26:06.8 | step: 1780 +epoch: 38 | 3/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.022 | time: 0:26:15.3 | step: 1790 +epoch: 38 | 13/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.025 | time: 0:26:24.2 | step: 1800 +epoch: 38 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 0:26:33.0 | step: 1810 +epoch: 38 | 33/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.030 | time: 0:26:41.9 | step: 1820 +epoch: 38 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:26:50.8 | step: 1830 +epoch: 39 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.043 | time: 0:26:59.3 | step: 1840 +epoch: 39 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 0:27:08.1 | step: 1850 +epoch: 39 | 26/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 0:27:17.0 | step: 1860 +epoch: 39 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 0:27:25.9 | step: 1870 +epoch: 39 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:27:34.3 | step: 1880 +epoch: 40 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.014 | time: 0:27:43.3 | step: 1890 +epoch: 40 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 0:27:52.2 | step: 1900 +epoch: 40 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.028 | time: 0:28:01.0 | step: 1910 +epoch: 40 | 39/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:28:09.9 | step: 1920 +epoch: 41 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.031 | time: 0:28:18.4 | step: 1930 +epoch: 41 | 12/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 0:28:27.3 | step: 1940 +epoch: 41 | 22/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 0:28:36.1 | step: 1950 +epoch: 41 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 0:28:45.0 | step: 1960 +epoch: 41 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 0:28:53.9 | step: 1970 +epoch: 42 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.024 | time: 0:29:02.3 | step: 1980 +epoch: 42 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:29:11.2 | step: 1990 +epoch: 42 | 25/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 0:29:20.1 | step: 2000 --- model size --- model: 55,192,704 ======= start training ======= epoch|batch_idx/num_batches|output_dir|batch/s|lr|time|step +epoch: 0 | 9/ 47 | logs/44k/diffusion | batch/s: 0.66 | lr: 0.0002 | loss: 0.026 | time: 0:00:15.7 | step: 2010 +epoch: 0 | 19/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.022 | time: 0:00:24.0 | step: 2020 +epoch: 0 | 29/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.034 | time: 0:00:32.4 | step: 2030 +epoch: 0 | 39/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.032 | time: 0:00:40.9 | step: 2040 +epoch: 1 | 2/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.025 | time: 0:00:49.1 | step: 2050 +epoch: 1 | 12/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.029 | time: 0:00:57.8 | step: 2060 +epoch: 1 | 22/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.038 | time: 0:01:06.5 | step: 2070 +epoch: 1 | 32/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.037 | time: 0:01:15.5 | step: 2080 +epoch: 1 | 42/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.040 | time: 0:01:24.6 | step: 2090 +epoch: 2 | 5/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 0:01:33.4 | step: 2100 +epoch: 2 | 15/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.041 | time: 0:01:42.7 | step: 2110 +epoch: 2 | 25/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.024 | time: 0:01:51.8 | step: 2120 +epoch: 2 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.034 | time: 0:02:00.8 | step: 2130 +epoch: 2 | 45/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 0:02:09.7 | step: 2140 +epoch: 3 | 8/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.009 | time: 0:02:18.2 | step: 2150 +epoch: 3 | 18/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.019 | time: 0:02:27.1 | step: 2160 +epoch: 3 | 28/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.030 | time: 0:02:36.1 | step: 2170 +epoch: 3 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:02:45.1 | step: 2180 +epoch: 4 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.020 | time: 0:02:53.7 | step: 2190 +epoch: 4 | 11/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.027 | time: 0:03:02.8 | step: 2200 +epoch: 4 | 21/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.026 | time: 0:03:11.9 | step: 2210 +epoch: 4 | 31/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.009 | time: 0:03:20.9 | step: 2220 +epoch: 4 | 41/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.009 | time: 0:03:30.0 | step: 2230 +epoch: 5 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.043 | time: 0:03:38.6 | step: 2240 +epoch: 5 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:03:47.6 | step: 2250 +epoch: 5 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:03:56.7 | step: 2260 +epoch: 5 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.031 | time: 0:04:05.7 | step: 2270 +epoch: 5 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.042 | time: 0:04:14.7 | step: 2280 +epoch: 6 | 7/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.020 | time: 0:04:23.3 | step: 2290 +epoch: 6 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 0:04:32.3 | step: 2300 +epoch: 6 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:04:41.3 | step: 2310 +epoch: 6 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:04:50.3 | step: 2320 +epoch: 7 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.006 | time: 0:04:58.9 | step: 2330 +epoch: 7 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:05:07.9 | step: 2340 +epoch: 7 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:05:16.9 | step: 2350 +epoch: 7 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:05:26.0 | step: 2360 +epoch: 7 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:05:35.0 | step: 2370 +epoch: 8 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.014 | time: 0:05:43.6 | step: 2380 +epoch: 8 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:05:52.6 | step: 2390 +epoch: 8 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:06:01.6 | step: 2400 +epoch: 8 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:06:10.7 | step: 2410 +epoch: 8 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:06:19.7 | step: 2420 +epoch: 9 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.025 | time: 0:06:28.2 | step: 2430 +epoch: 9 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:06:37.3 | step: 2440 +epoch: 9 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:06:46.3 | step: 2450 +epoch: 9 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.035 | time: 0:06:55.3 | step: 2460 +epoch: 9 | 46/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 0:07:03.8 | step: 2470 +epoch: 10 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:07:12.9 | step: 2480 +epoch: 10 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:07:21.9 | step: 2490 +epoch: 10 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.040 | time: 0:07:31.0 | step: 2500 +epoch: 10 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:07:40.0 | step: 2510 +epoch: 11 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.015 | time: 0:07:48.6 | step: 2520 +epoch: 11 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.033 | time: 0:07:57.7 | step: 2530 +epoch: 11 | 22/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.028 | time: 0:08:06.7 | step: 2540 +epoch: 11 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:08:15.8 | step: 2550 +epoch: 11 | 42/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 0:08:24.8 | step: 2560 +epoch: 12 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.004 | time: 0:08:33.4 | step: 2570 +epoch: 12 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:08:42.5 | step: 2580 +epoch: 12 | 25/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.025 | time: 0:08:51.6 | step: 2590 +epoch: 12 | 35/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.030 | time: 0:09:00.6 | step: 2600 +epoch: 12 | 45/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.032 | time: 0:09:09.7 | step: 2610 +epoch: 13 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.010 | time: 0:09:18.3 | step: 2620 +epoch: 13 | 18/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.031 | time: 0:09:27.4 | step: 2630 +epoch: 13 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:09:36.4 | step: 2640 +epoch: 13 | 38/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.031 | time: 0:09:45.5 | step: 2650 +epoch: 14 | 1/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.025 | time: 0:09:54.1 | step: 2660 +epoch: 14 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:10:03.1 | step: 2670 +epoch: 14 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:10:12.1 | step: 2680 +epoch: 14 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:10:21.1 | step: 2690 +epoch: 14 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 0:10:30.1 | step: 2700 +epoch: 15 | 4/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.020 | time: 0:10:38.7 | step: 2710 +epoch: 15 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.030 | time: 0:10:47.7 | step: 2720 +epoch: 15 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:10:56.7 | step: 2730 +epoch: 15 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.005 | time: 0:11:05.7 | step: 2740 +epoch: 15 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:11:14.7 | step: 2750 +epoch: 16 | 7/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.006 | time: 0:11:23.3 | step: 2760 +epoch: 16 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.039 | time: 0:11:32.3 | step: 2770 +epoch: 16 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:11:41.3 | step: 2780 +epoch: 16 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:11:50.3 | step: 2790 +epoch: 17 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.041 | time: 0:11:58.9 | step: 2800 +epoch: 17 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:12:07.9 | step: 2810 +epoch: 17 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:12:17.0 | step: 2820 +epoch: 17 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:12:26.0 | step: 2830 +epoch: 17 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 0:12:35.0 | step: 2840 +epoch: 18 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.021 | time: 0:12:43.6 | step: 2850 +epoch: 18 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:12:52.7 | step: 2860 +epoch: 18 | 23/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.030 | time: 0:13:01.7 | step: 2870 +epoch: 18 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:13:10.8 | step: 2880 +epoch: 18 | 43/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 0:13:19.8 | step: 2890 +epoch: 19 | 6/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.014 | time: 0:13:28.4 | step: 2900 +epoch: 19 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:13:37.5 | step: 2910 +epoch: 19 | 26/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.012 | time: 0:13:46.5 | step: 2920 +epoch: 19 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:13:55.6 | step: 2930 +epoch: 19 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.014 | time: 0:14:04.2 | step: 2940 +epoch: 20 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.034 | time: 0:14:13.3 | step: 2950 +epoch: 20 | 19/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.024 | time: 0:14:22.4 | step: 2960 +epoch: 20 | 29/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.013 | time: 0:14:31.4 | step: 2970 +epoch: 20 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.037 | time: 0:14:40.5 | step: 2980 +epoch: 21 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.008 | time: 0:14:49.1 | step: 2990 +epoch: 21 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:14:58.2 | step: 3000 +epoch: 21 | 22/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.038 | time: 0:15:07.2 | step: 3010 +epoch: 21 | 32/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.044 | time: 0:15:16.3 | step: 3020 +epoch: 21 | 42/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.022 | time: 0:15:25.3 | step: 3030 +epoch: 22 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.017 | time: 0:15:33.9 | step: 3040 +epoch: 22 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:15:43.0 | step: 3050 +epoch: 22 | 25/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.049 | time: 0:15:52.0 | step: 3060 +epoch: 22 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:16:01.1 | step: 3070 +epoch: 22 | 45/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.016 | time: 0:16:10.1 | step: 3080 +epoch: 23 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.020 | time: 0:16:18.7 | step: 3090 +epoch: 23 | 18/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.029 | time: 0:16:27.8 | step: 3100 +epoch: 23 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:16:36.9 | step: 3110 +epoch: 23 | 38/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.022 | time: 0:16:45.9 | step: 3120 +epoch: 24 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.005 | time: 0:16:54.5 | step: 3130 +epoch: 24 | 11/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.027 | time: 0:17:03.6 | step: 3140 +epoch: 24 | 21/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.006 | time: 0:17:12.6 | step: 3150 +epoch: 24 | 31/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.020 | time: 0:17:21.7 | step: 3160 +epoch: 24 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:17:30.8 | step: 3170 +epoch: 25 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.012 | time: 0:17:39.4 | step: 3180 +epoch: 25 | 14/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.026 | time: 0:17:48.4 | step: 3190 +epoch: 25 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 0:17:57.5 | step: 3200 +epoch: 25 | 34/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.012 | time: 0:18:06.5 | step: 3210 +epoch: 25 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:18:15.6 | step: 3220 +epoch: 26 | 7/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.038 | time: 0:18:24.2 | step: 3230 +epoch: 26 | 17/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.027 | time: 0:18:33.3 | step: 3240 +epoch: 26 | 27/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.028 | time: 0:18:42.4 | step: 3250 +epoch: 26 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:18:51.4 | step: 3260 +epoch: 27 | 0/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.027 | time: 0:19:00.0 | step: 3270 +epoch: 27 | 10/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.012 | time: 0:19:09.1 | step: 3280 +epoch: 27 | 20/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.016 | time: 0:19:18.1 | step: 3290 +epoch: 27 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:19:27.2 | step: 3300 +epoch: 27 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:19:36.2 | step: 3310 +epoch: 28 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.024 | time: 0:19:44.8 | step: 3320 +epoch: 28 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 0:19:53.8 | step: 3330 +epoch: 28 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:20:02.8 | step: 3340 +epoch: 28 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:20:11.8 | step: 3350 +epoch: 28 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.032 | time: 0:20:20.8 | step: 3360 +epoch: 29 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.012 | time: 0:20:29.3 | step: 3370 +epoch: 29 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:20:38.3 | step: 3380 +epoch: 29 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:20:47.3 | step: 3390 +epoch: 29 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.043 | time: 0:20:56.3 | step: 3400 +epoch: 29 | 46/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 0:21:04.9 | step: 3410 +epoch: 30 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.025 | time: 0:21:14.0 | step: 3420 +epoch: 30 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:21:23.0 | step: 3430 +epoch: 30 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 0:21:32.0 | step: 3440 +epoch: 30 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:21:41.0 | step: 3450 +epoch: 31 | 2/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.012 | time: 0:21:49.5 | step: 3460 +epoch: 31 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:21:58.6 | step: 3470 +epoch: 31 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:22:07.6 | step: 3480 +epoch: 31 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:22:16.6 | step: 3490 +epoch: 31 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.005 | time: 0:22:25.6 | step: 3500 +epoch: 32 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.022 | time: 0:22:34.2 | step: 3510 +epoch: 32 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 0:22:43.2 | step: 3520 +epoch: 32 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:22:52.2 | step: 3530 +epoch: 32 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:23:01.2 | step: 3540 +epoch: 32 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.037 | time: 0:23:10.2 | step: 3550 +epoch: 33 | 8/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.009 | time: 0:23:18.8 | step: 3560 +epoch: 33 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:23:27.9 | step: 3570 +epoch: 33 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:23:36.9 | step: 3580 +epoch: 33 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.030 | time: 0:23:45.9 | step: 3590 +epoch: 34 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.019 | time: 0:23:54.5 | step: 3600 +epoch: 34 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:24:03.5 | step: 3610 +epoch: 34 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:24:12.6 | step: 3620 +epoch: 34 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.005 | time: 0:24:21.6 | step: 3630 +epoch: 34 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:24:30.6 | step: 3640 +epoch: 35 | 4/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.045 | time: 0:24:39.2 | step: 3650 +epoch: 35 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:24:48.2 | step: 3660 +epoch: 35 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:24:57.3 | step: 3670 +epoch: 35 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:25:06.3 | step: 3680 +epoch: 35 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:25:15.4 | step: 3690 +epoch: 36 | 7/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.014 | time: 0:25:24.0 | step: 3700 +epoch: 36 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:25:33.0 | step: 3710 +epoch: 36 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.005 | time: 0:25:42.0 | step: 3720 +epoch: 36 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:25:51.1 | step: 3730 +epoch: 37 | 0/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.031 | time: 0:25:59.7 | step: 3740 +epoch: 37 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:26:08.7 | step: 3750 +epoch: 37 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.041 | time: 0:26:17.7 | step: 3760 +epoch: 37 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:26:26.8 | step: 3770 +epoch: 37 | 40/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 0:26:35.8 | step: 3780 +epoch: 38 | 3/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.040 | time: 0:26:44.4 | step: 3790 +epoch: 38 | 13/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.015 | time: 0:26:53.5 | step: 3800 +epoch: 38 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:27:02.5 | step: 3810 +epoch: 38 | 33/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.021 | time: 0:27:11.5 | step: 3820 +epoch: 38 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 0:27:20.6 | step: 3830 +epoch: 39 | 6/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.006 | time: 0:27:29.2 | step: 3840 +epoch: 39 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:27:38.2 | step: 3850 +epoch: 39 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:27:47.2 | step: 3860 +epoch: 39 | 36/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.021 | time: 0:27:56.3 | step: 3870 +epoch: 39 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 0:28:04.9 | step: 3880 +epoch: 40 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:28:14.0 | step: 3890 +epoch: 40 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:28:23.0 | step: 3900 +epoch: 40 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:28:32.0 | step: 3910 +epoch: 40 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:28:41.1 | step: 3920 +epoch: 41 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.019 | time: 0:28:49.7 | step: 3930 +epoch: 41 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.039 | time: 0:28:58.7 | step: 3940 +epoch: 41 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:29:07.7 | step: 3950 +epoch: 41 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:29:16.8 | step: 3960 +epoch: 41 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.058 | time: 0:29:25.8 | step: 3970 +epoch: 42 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.008 | time: 0:29:34.4 | step: 3980 +epoch: 42 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:29:43.4 | step: 3990 +epoch: 42 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:29:52.5 | step: 4000 +epoch: 42 | 35/ 47 | logs/44k/diffusion | batch/s: 0.33 | lr: 0.0002 | loss: 0.015 | time: 0:30:23.0 | step: 4010 +epoch: 42 | 45/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.009 | time: 0:30:32.1 | step: 4020 +epoch: 43 | 8/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.039 | time: 0:30:41.0 | step: 4030 +epoch: 43 | 18/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.033 | time: 0:30:50.5 | step: 4040 +epoch: 43 | 28/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.024 | time: 0:30:59.7 | step: 4050 +epoch: 43 | 38/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.019 | time: 0:31:08.8 | step: 4060 +epoch: 44 | 1/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.016 | time: 0:31:17.3 | step: 4070 +epoch: 44 | 11/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.013 | time: 0:31:26.2 | step: 4080 +epoch: 44 | 21/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 0:31:35.1 | step: 4090 +epoch: 44 | 31/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.026 | time: 0:31:44.1 | step: 4100 +epoch: 44 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.049 | time: 0:31:53.1 | step: 4110 +epoch: 45 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.023 | time: 0:32:01.7 | step: 4120 +epoch: 45 | 14/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.022 | time: 0:32:10.8 | step: 4130 +epoch: 45 | 24/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.015 | time: 0:32:19.9 | step: 4140 +epoch: 45 | 34/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 0:32:29.0 | step: 4150 +epoch: 45 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:32:38.0 | step: 4160 +epoch: 46 | 7/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.010 | time: 0:32:46.6 | step: 4170 +epoch: 46 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:32:55.6 | step: 4180 +epoch: 46 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:33:04.6 | step: 4190 +epoch: 46 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:33:13.6 | step: 4200 +epoch: 47 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.012 | time: 0:33:22.1 | step: 4210 +epoch: 47 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 0:33:31.1 | step: 4220 +epoch: 47 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:33:40.2 | step: 4230 +epoch: 47 | 30/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 0:33:49.2 | step: 4240 +epoch: 47 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:33:58.2 | step: 4250 +epoch: 48 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.014 | time: 0:34:06.9 | step: 4260 +epoch: 48 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:34:15.9 | step: 4270 +epoch: 48 | 23/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.012 | time: 0:34:25.0 | step: 4280 +epoch: 48 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:34:34.0 | step: 4290 +epoch: 48 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:34:43.1 | step: 4300 +epoch: 49 | 6/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.025 | time: 0:34:51.7 | step: 4310 +epoch: 49 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 0:35:00.7 | step: 4320 +epoch: 49 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:35:09.7 | step: 4330 +epoch: 49 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.033 | time: 0:35:18.8 | step: 4340 +epoch: 49 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 0:35:27.4 | step: 4350 +epoch: 50 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:35:36.5 | step: 4360 +epoch: 50 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:35:45.5 | step: 4370 +epoch: 50 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.035 | time: 0:35:54.6 | step: 4380 +epoch: 50 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:36:03.6 | step: 4390 +epoch: 51 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.011 | time: 0:36:12.2 | step: 4400 +epoch: 51 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:36:21.2 | step: 4410 +epoch: 51 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:36:30.2 | step: 4420 +epoch: 51 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.030 | time: 0:36:39.2 | step: 4430 +epoch: 51 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:36:48.3 | step: 4440 +epoch: 52 | 5/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.007 | time: 0:36:56.8 | step: 4450 +epoch: 52 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:37:05.9 | step: 4460 +epoch: 52 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:37:14.9 | step: 4470 +epoch: 52 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:37:23.9 | step: 4480 +epoch: 52 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.032 | time: 0:37:33.0 | step: 4490 +epoch: 53 | 8/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.038 | time: 0:37:41.5 | step: 4500 +epoch: 53 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.038 | time: 0:37:50.6 | step: 4510 +epoch: 53 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:37:59.6 | step: 4520 +epoch: 53 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:38:08.6 | step: 4530 +epoch: 54 | 1/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.022 | time: 0:38:17.2 | step: 4540 +epoch: 54 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:38:26.2 | step: 4550 +epoch: 54 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:38:35.2 | step: 4560 +epoch: 54 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.044 | time: 0:38:44.3 | step: 4570 +epoch: 54 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.036 | time: 0:38:53.3 | step: 4580 +epoch: 55 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.020 | time: 0:39:01.8 | step: 4590 +epoch: 55 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:39:10.8 | step: 4600 +epoch: 55 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.031 | time: 0:39:19.9 | step: 4610 +epoch: 55 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:39:28.9 | step: 4620 +epoch: 55 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:39:37.9 | step: 4630 +epoch: 56 | 7/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.020 | time: 0:39:46.4 | step: 4640 +epoch: 56 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:39:55.4 | step: 4650 +epoch: 56 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.048 | time: 0:40:04.4 | step: 4660 +epoch: 56 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:40:13.5 | step: 4670 +epoch: 57 | 0/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.021 | time: 0:40:22.0 | step: 4680 +epoch: 57 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:40:31.0 | step: 4690 +epoch: 57 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 0:40:40.0 | step: 4700 +epoch: 57 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.055 | time: 0:40:49.0 | step: 4710 +epoch: 57 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.063 | time: 0:40:58.0 | step: 4720 +epoch: 58 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.008 | time: 0:41:06.6 | step: 4730 +epoch: 58 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 0:41:15.6 | step: 4740 +epoch: 58 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:41:24.6 | step: 4750 +epoch: 58 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:41:33.7 | step: 4760 +epoch: 58 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.030 | time: 0:41:42.7 | step: 4770 +epoch: 59 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.020 | time: 0:41:51.2 | step: 4780 +epoch: 59 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:42:00.2 | step: 4790 +epoch: 59 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:42:09.2 | step: 4800 +epoch: 59 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:42:18.2 | step: 4810 +epoch: 59 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.005 | time: 0:42:26.8 | step: 4820 +epoch: 60 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.024 | time: 0:42:35.9 | step: 4830 +epoch: 60 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:42:44.9 | step: 4840 +epoch: 60 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:42:53.9 | step: 4850 +epoch: 60 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:43:02.9 | step: 4860 +epoch: 61 | 2/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.030 | time: 0:43:11.5 | step: 4870 +epoch: 61 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:43:20.5 | step: 4880 +epoch: 61 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 0:43:29.5 | step: 4890 +epoch: 61 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 0:43:38.5 | step: 4900 +epoch: 61 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:43:47.5 | step: 4910 +epoch: 62 | 5/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.034 | time: 0:43:56.1 | step: 4920 +epoch: 62 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:44:05.1 | step: 4930 +epoch: 62 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:44:14.1 | step: 4940 +epoch: 62 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:44:23.1 | step: 4950 +epoch: 62 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:44:32.1 | step: 4960 +epoch: 63 | 8/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.012 | time: 0:44:40.7 | step: 4970 +epoch: 63 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 0:44:49.7 | step: 4980 +epoch: 63 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:44:58.7 | step: 4990 +epoch: 63 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.030 | time: 0:45:07.7 | step: 5000 +epoch: 64 | 1/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.013 | time: 0:45:16.3 | step: 5010 +epoch: 64 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:45:25.3 | step: 5020 +epoch: 64 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:45:34.3 | step: 5030 +epoch: 64 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:45:43.3 | step: 5040 +epoch: 64 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:45:52.3 | step: 5050 +epoch: 65 | 4/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.006 | time: 0:46:00.9 | step: 5060 +epoch: 65 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:46:09.9 | step: 5070 +epoch: 65 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.031 | time: 0:46:18.9 | step: 5080 +epoch: 65 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 0:46:27.9 | step: 5090 +epoch: 65 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:46:36.9 | step: 5100 +epoch: 66 | 7/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.009 | time: 0:46:45.4 | step: 5110 +epoch: 66 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:46:54.4 | step: 5120 +epoch: 66 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.036 | time: 0:47:03.4 | step: 5130 +epoch: 66 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:47:12.4 | step: 5140 +epoch: 67 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.016 | time: 0:47:21.0 | step: 5150 +epoch: 67 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.041 | time: 0:47:30.0 | step: 5160 +epoch: 67 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 0:47:39.0 | step: 5170 +epoch: 67 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:47:48.0 | step: 5180 +epoch: 67 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:47:57.0 | step: 5190 +epoch: 68 | 3/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.024 | time: 0:48:05.6 | step: 5200 +epoch: 68 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:48:14.6 | step: 5210 +epoch: 68 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:48:23.6 | step: 5220 +epoch: 68 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:48:32.6 | step: 5230 +epoch: 68 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:48:41.6 | step: 5240 +epoch: 69 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.027 | time: 0:48:50.2 | step: 5250 +epoch: 69 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:48:59.2 | step: 5260 +epoch: 69 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:49:08.2 | step: 5270 +epoch: 69 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:49:17.2 | step: 5280 +epoch: 69 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.006 | time: 0:49:25.7 | step: 5290 +epoch: 70 | 9/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.029 | time: 0:49:34.8 | step: 5300 +epoch: 70 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:49:43.8 | step: 5310 +epoch: 70 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:49:52.8 | step: 5320 +epoch: 70 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:50:01.8 | step: 5330 +epoch: 71 | 2/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.008 | time: 0:50:10.4 | step: 5340 +epoch: 71 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:50:19.4 | step: 5350 +epoch: 71 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:50:28.4 | step: 5360 +epoch: 71 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:50:37.4 | step: 5370 +epoch: 71 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:50:46.4 | step: 5380 +epoch: 72 | 5/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.016 | time: 0:50:55.0 | step: 5390 +epoch: 72 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:51:04.0 | step: 5400 +epoch: 72 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:51:13.0 | step: 5410 +epoch: 72 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:51:22.0 | step: 5420 +epoch: 72 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:51:31.0 | step: 5430 +epoch: 73 | 8/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.011 | time: 0:51:39.6 | step: 5440 +epoch: 73 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.041 | time: 0:51:48.6 | step: 5450 +epoch: 73 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:51:57.6 | step: 5460 +epoch: 73 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.049 | time: 0:52:06.6 | step: 5470 +epoch: 74 | 1/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.044 | time: 0:52:15.2 | step: 5480 +epoch: 74 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:52:24.2 | step: 5490 +epoch: 74 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:52:33.3 | step: 5500 +epoch: 74 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:52:42.3 | step: 5510 +epoch: 74 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.030 | time: 0:52:51.3 | step: 5520 +epoch: 75 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.023 | time: 0:52:59.9 | step: 5530 +epoch: 75 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:53:08.9 | step: 5540 +epoch: 75 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 0:53:17.9 | step: 5550 +epoch: 75 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.039 | time: 0:53:26.9 | step: 5560 +epoch: 75 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.032 | time: 0:53:35.9 | step: 5570 +epoch: 76 | 7/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.024 | time: 0:53:44.5 | step: 5580 +epoch: 76 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:53:53.6 | step: 5590 +epoch: 76 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.030 | time: 0:54:02.6 | step: 5600 +epoch: 76 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:54:11.6 | step: 5610 +epoch: 77 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.040 | time: 0:54:20.2 | step: 5620 +epoch: 77 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:54:29.2 | step: 5630 +epoch: 77 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.033 | time: 0:54:38.2 | step: 5640 +epoch: 77 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.039 | time: 0:54:47.2 | step: 5650 +epoch: 77 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:54:56.2 | step: 5660 +epoch: 78 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.019 | time: 0:55:04.8 | step: 5670 +epoch: 78 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:55:13.8 | step: 5680 +epoch: 78 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:55:22.9 | step: 5690 +epoch: 78 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:55:31.9 | step: 5700 +epoch: 78 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:55:40.9 | step: 5710 +epoch: 79 | 6/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.021 | time: 0:55:49.5 | step: 5720 +epoch: 79 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:55:58.5 | step: 5730 +epoch: 79 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.044 | time: 0:56:07.5 | step: 5740 +epoch: 79 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:56:16.6 | step: 5750 +epoch: 79 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.006 | time: 0:56:25.1 | step: 5760 +epoch: 80 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 0:56:34.3 | step: 5770 +epoch: 80 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.036 | time: 0:56:43.3 | step: 5780 +epoch: 80 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:56:52.3 | step: 5790 +epoch: 80 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:57:01.3 | step: 5800 +epoch: 81 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.023 | time: 0:57:09.9 | step: 5810 +epoch: 81 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:57:19.0 | step: 5820 +epoch: 81 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.050 | time: 0:57:28.0 | step: 5830 +epoch: 81 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:57:37.0 | step: 5840 +epoch: 81 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:57:46.0 | step: 5850 +epoch: 82 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.019 | time: 0:57:54.6 | step: 5860 +epoch: 82 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:58:03.7 | step: 5870 +epoch: 82 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:58:12.7 | step: 5880 +epoch: 82 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:58:21.7 | step: 5890 +epoch: 82 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:58:30.8 | step: 5900 +epoch: 83 | 8/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.018 | time: 0:58:39.4 | step: 5910 +epoch: 83 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.040 | time: 0:58:48.4 | step: 5920 +epoch: 83 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.004 | time: 0:58:57.4 | step: 5930 +epoch: 83 | 38/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.019 | time: 0:59:06.5 | step: 5940 +epoch: 84 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.007 | time: 0:59:15.1 | step: 5950 +epoch: 84 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:59:24.1 | step: 5960 +epoch: 84 | 21/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.015 | time: 0:59:33.2 | step: 5970 +epoch: 84 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:59:42.2 | step: 5980 +epoch: 84 | 41/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.010 | time: 0:59:51.2 | step: 5990 +epoch: 85 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.017 | time: 0:59:59.9 | step: 6000 +epoch: 85 | 14/ 47 | logs/44k/diffusion | batch/s: 0.48 | lr: 0.0002 | loss: 0.028 | time: 1:00:20.8 | step: 6010 +epoch: 85 | 24/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.032 | time: 1:00:29.9 | step: 6020 +epoch: 85 | 34/ 47 | logs/44k/diffusion | batch/s: 1.07 | lr: 0.0002 | loss: 0.016 | time: 1:00:39.3 | step: 6030 +epoch: 85 | 44/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.014 | time: 1:00:48.7 | step: 6040 +epoch: 86 | 7/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.005 | time: 1:00:57.4 | step: 6050 +epoch: 86 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 1:01:06.4 | step: 6060 +epoch: 86 | 27/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.024 | time: 1:01:15.3 | step: 6070 +epoch: 86 | 37/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 1:01:24.3 | step: 6080 +epoch: 87 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.009 | time: 1:01:32.8 | step: 6090 +epoch: 87 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 1:01:41.7 | step: 6100 +epoch: 87 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 1:01:50.7 | step: 6110 +epoch: 87 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 1:01:59.8 | step: 6120 +epoch: 87 | 40/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.007 | time: 1:02:08.9 | step: 6130 +epoch: 88 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.041 | time: 1:02:17.5 | step: 6140 +epoch: 88 | 13/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.031 | time: 1:02:26.5 | step: 6150 +epoch: 88 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 1:02:35.6 | step: 6160 +epoch: 88 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 1:02:44.5 | step: 6170 +epoch: 88 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 1:02:53.5 | step: 6180 +epoch: 89 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.004 | time: 1:03:02.1 | step: 6190 +epoch: 89 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.030 | time: 1:03:11.1 | step: 6200 +epoch: 89 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 1:03:20.1 | step: 6210 +epoch: 89 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 1:03:29.1 | step: 6220 +epoch: 89 | 46/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 1:03:37.6 | step: 6230 +epoch: 90 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.050 | time: 1:03:46.7 | step: 6240 +epoch: 90 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.049 | time: 1:03:55.8 | step: 6250 +epoch: 90 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 1:04:04.8 | step: 6260 +epoch: 90 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.035 | time: 1:04:13.8 | step: 6270 +epoch: 91 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.028 | time: 1:04:22.4 | step: 6280 +epoch: 91 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 1:04:31.4 | step: 6290 +epoch: 91 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 1:04:40.4 | step: 6300 +epoch: 91 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 1:04:49.5 | step: 6310 +epoch: 91 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 1:04:58.5 | step: 6320 +epoch: 92 | 5/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.015 | time: 1:05:07.1 | step: 6330 +epoch: 92 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 1:05:16.1 | step: 6340 +epoch: 92 | 25/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.029 | time: 1:05:25.2 | step: 6350 +epoch: 92 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 1:05:34.2 | step: 6360 +epoch: 92 | 45/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.027 | time: 1:05:43.2 | step: 6370 +epoch: 93 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.028 | time: 1:05:51.8 | step: 6380 +epoch: 93 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 1:06:00.9 | step: 6390 +epoch: 93 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 1:06:09.9 | step: 6400 +epoch: 93 | 38/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.006 | time: 1:06:19.0 | step: 6410 +epoch: 94 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.011 | time: 1:06:27.6 | step: 6420 +epoch: 94 | 11/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.010 | time: 1:06:36.6 | step: 6430 +epoch: 94 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 1:06:45.7 | step: 6440 +epoch: 94 | 31/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.008 | time: 1:06:54.7 | step: 6450 +epoch: 94 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 1:07:03.8 | step: 6460 +epoch: 95 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.016 | time: 1:07:12.4 | step: 6470 +epoch: 95 | 14/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.005 | time: 1:07:21.4 | step: 6480 +epoch: 95 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.004 | time: 1:07:30.5 | step: 6490 +epoch: 95 | 34/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.019 | time: 1:07:39.5 | step: 6500 +epoch: 95 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 1:07:48.5 | step: 6510 +epoch: 96 | 7/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.015 | time: 1:07:57.2 | step: 6520 +epoch: 96 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 1:08:06.2 | step: 6530 +epoch: 96 | 27/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 1:08:15.3 | step: 6540 +epoch: 96 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 1:08:24.3 | step: 6550 +epoch: 97 | 0/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.009 | time: 1:08:32.9 | step: 6560 +epoch: 97 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 1:08:42.0 | step: 6570 +epoch: 97 | 20/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.011 | time: 1:08:51.0 | step: 6580 +epoch: 97 | 30/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.020 | time: 1:09:00.1 | step: 6590 +epoch: 97 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 1:09:09.1 | step: 6600 +epoch: 98 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.012 | time: 1:09:17.7 | step: 6610 +epoch: 98 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.040 | time: 1:09:26.8 | step: 6620 +epoch: 98 | 23/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.020 | time: 1:09:35.8 | step: 6630 +epoch: 98 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 1:09:44.9 | step: 6640 +epoch: 98 | 43/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.025 | time: 1:09:53.9 | step: 6650 +epoch: 99 | 6/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.026 | time: 1:10:02.5 | step: 6660 +epoch: 99 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 1:10:11.6 | step: 6670 +epoch: 99 | 26/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.019 | time: 1:10:20.6 | step: 6680 +epoch: 99 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 1:10:29.7 | step: 6690 +epoch: 99 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 1:10:38.3 | step: 6700 +epoch: 100 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 1:10:47.4 | step: 6710 +epoch: 100 | 19/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.020 | time: 1:10:56.4 | step: 6720 +epoch: 100 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 1:11:05.5 | step: 6730 +epoch: 100 | 39/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.038 | time: 1:11:14.5 | step: 6740 +epoch: 101 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.027 | time: 1:11:23.1 | step: 6750 +epoch: 101 | 12/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.022 | time: 1:11:32.2 | step: 6760 +epoch: 101 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 1:11:41.3 | step: 6770 +epoch: 101 | 32/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 1:11:50.3 | step: 6780 +epoch: 101 | 42/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.008 | time: 1:11:59.4 | step: 6790 +epoch: 102 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.010 | time: 1:12:08.0 | step: 6800 +epoch: 102 | 15/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.055 | time: 1:12:17.0 | step: 6810 +epoch: 102 | 25/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.015 | time: 1:12:26.1 | step: 6820 +epoch: 102 | 35/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.013 | time: 1:12:35.2 | step: 6830 +epoch: 102 | 45/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.025 | time: 1:12:44.3 | step: 6840 +epoch: 103 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.016 | time: 1:12:52.9 | step: 6850 +epoch: 103 | 18/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.010 | time: 1:13:02.0 | step: 6860 +epoch: 103 | 28/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.017 | time: 1:13:11.0 | step: 6870 +epoch: 103 | 38/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.045 | time: 1:13:20.1 | step: 6880 +epoch: 104 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.023 | time: 1:13:28.7 | step: 6890 +epoch: 104 | 11/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.047 | time: 1:13:37.8 | step: 6900 +epoch: 104 | 21/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.037 | time: 1:13:46.8 | step: 6910 +epoch: 104 | 31/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.026 | time: 1:13:55.9 | step: 6920 +epoch: 104 | 41/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.022 | time: 1:14:04.9 | step: 6930 +epoch: 105 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.026 | time: 1:14:13.6 | step: 6940 +epoch: 105 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 1:14:22.6 | step: 6950 +epoch: 105 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 1:14:31.6 | step: 6960 +epoch: 105 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 1:14:40.7 | step: 6970 +epoch: 105 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.044 | time: 1:14:49.7 | step: 6980 +epoch: 106 | 7/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.038 | time: 1:14:58.3 | step: 6990 +epoch: 106 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.032 | time: 1:15:07.4 | step: 7000 +epoch: 106 | 27/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.021 | time: 1:15:16.4 | step: 7010 +epoch: 106 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 1:15:25.4 | step: 7020 +epoch: 107 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.027 | time: 1:15:34.0 | step: 7030 +epoch: 107 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.041 | time: 1:15:43.0 | step: 7040 +epoch: 107 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 1:15:52.0 | step: 7050 +epoch: 107 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 1:16:01.0 | step: 7060 +epoch: 107 | 40/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.045 | time: 1:16:10.1 | step: 7070 +epoch: 108 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.018 | time: 1:16:18.7 | step: 7080 +epoch: 108 | 13/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.023 | time: 1:16:27.8 | step: 7090 +epoch: 108 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 1:16:36.8 | step: 7100 +epoch: 108 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 1:16:45.8 | step: 7110 +epoch: 108 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.033 | time: 1:16:54.8 | step: 7120 +epoch: 109 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.009 | time: 1:17:03.4 | step: 7130 +epoch: 109 | 16/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.004 | time: 1:17:12.4 | step: 7140 +epoch: 109 | 26/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.033 | time: 1:17:21.5 | step: 7150 +epoch: 109 | 36/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.009 | time: 1:17:30.6 | step: 7160 +epoch: 109 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.008 | time: 1:17:39.2 | step: 7170 +epoch: 110 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.026 | time: 1:17:48.4 | step: 7180 +epoch: 110 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 1:17:57.4 | step: 7190 +epoch: 110 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 1:18:06.4 | step: 7200 +epoch: 110 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.005 | time: 1:18:15.4 | step: 7210 +epoch: 111 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.034 | time: 1:18:24.0 | step: 7220 +epoch: 111 | 12/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 1:18:33.0 | step: 7230 +epoch: 111 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 1:18:42.1 | step: 7240 +epoch: 111 | 32/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.032 | time: 1:18:51.1 | step: 7250 +epoch: 111 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.036 | time: 1:19:00.2 | step: 7260 +epoch: 112 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.019 | time: 1:19:08.8 | step: 7270 +epoch: 112 | 15/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.024 | time: 1:19:17.8 | step: 7280 +epoch: 112 | 25/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.028 | time: 1:19:26.9 | step: 7290 +epoch: 112 | 35/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.005 | time: 1:19:36.0 | step: 7300 +epoch: 112 | 45/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.016 | time: 1:19:45.1 | step: 7310 +epoch: 113 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.033 | time: 1:19:53.7 | step: 7320 +epoch: 113 | 18/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.044 | time: 1:20:02.8 | step: 7330 +epoch: 113 | 28/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.023 | time: 1:20:11.8 | step: 7340 +epoch: 113 | 38/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.004 | time: 1:20:20.9 | step: 7350 +epoch: 114 | 1/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.010 | time: 1:20:29.6 | step: 7360 +epoch: 114 | 11/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.011 | time: 1:20:38.6 | step: 7370 +epoch: 114 | 21/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.026 | time: 1:20:47.7 | step: 7380 +epoch: 114 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.035 | time: 1:20:56.7 | step: 7390 +epoch: 114 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 1:21:05.7 | step: 7400 +epoch: 115 | 4/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.011 | time: 1:21:14.3 | step: 7410 +epoch: 115 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.032 | time: 1:21:23.3 | step: 7420 +epoch: 115 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 1:21:32.3 | step: 7430 +epoch: 115 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 1:21:41.3 | step: 7440 +epoch: 115 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 1:21:50.4 | step: 7450 +epoch: 116 | 7/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.015 | time: 1:21:58.9 | step: 7460 +epoch: 116 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 1:22:08.0 | step: 7470 +epoch: 116 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 1:22:17.0 | step: 7480 +epoch: 116 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 1:22:26.0 | step: 7490 +epoch: 117 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.019 | time: 1:22:34.6 | step: 7500 +epoch: 117 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 1:22:43.7 | step: 7510 +epoch: 117 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.050 | time: 1:22:52.7 | step: 7520 +epoch: 117 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 1:23:01.7 | step: 7530 +epoch: 117 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.005 | time: 1:23:10.8 | step: 7540 +epoch: 118 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.042 | time: 1:23:19.4 | step: 7550 +epoch: 118 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.048 | time: 1:23:28.4 | step: 7560 +epoch: 118 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 1:23:37.5 | step: 7570 +epoch: 118 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.032 | time: 1:23:46.5 | step: 7580 +epoch: 118 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 1:23:55.6 | step: 7590 +epoch: 119 | 6/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.012 | time: 1:24:04.2 | step: 7600 +epoch: 119 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.031 | time: 1:24:13.2 | step: 7610 +epoch: 119 | 26/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.032 | time: 1:24:22.3 | step: 7620 +epoch: 119 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 1:24:31.3 | step: 7630 +epoch: 119 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.014 | time: 1:24:39.9 | step: 7640 +epoch: 120 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 1:24:49.0 | step: 7650 +epoch: 120 | 19/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 1:24:58.0 | step: 7660 +epoch: 120 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 1:25:07.0 | step: 7670 +epoch: 120 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.034 | time: 1:25:16.1 | step: 7680 +epoch: 121 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.009 | time: 1:25:24.7 | step: 7690 +epoch: 121 | 12/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.025 | time: 1:25:33.8 | step: 7700 +epoch: 121 | 22/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.012 | time: 1:25:42.9 | step: 7710 +epoch: 121 | 32/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.009 | time: 1:25:51.9 | step: 7720 +epoch: 121 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 1:26:01.0 | step: 7730 +epoch: 122 | 5/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.012 | time: 1:26:09.5 | step: 7740 +epoch: 122 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 1:26:18.5 | step: 7750 +epoch: 122 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 1:26:27.6 | step: 7760 +epoch: 122 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 1:26:36.6 | step: 7770 +epoch: 122 | 45/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.047 | time: 1:26:45.7 | step: 7780 +epoch: 123 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.014 | time: 1:26:54.3 | step: 7790 +epoch: 123 | 18/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 1:27:03.4 | step: 7800 +epoch: 123 | 28/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.034 | time: 1:27:12.5 | step: 7810 +epoch: 123 | 38/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.024 | time: 1:27:21.6 | step: 7820 +epoch: 124 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.023 | time: 1:27:30.2 | step: 7830 +epoch: 124 | 11/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.027 | time: 1:27:39.2 | step: 7840 +epoch: 124 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.005 | time: 1:27:48.3 | step: 7850 +epoch: 124 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.035 | time: 1:27:57.3 | step: 7860 +epoch: 124 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 1:28:06.4 | step: 7870 +epoch: 125 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.028 | time: 1:28:15.0 | step: 7880 +epoch: 125 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 1:28:24.0 | step: 7890 +epoch: 125 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 1:28:33.0 | step: 7900 +epoch: 125 | 34/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.008 | time: 1:28:42.1 | step: 7910 +epoch: 125 | 44/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 1:28:51.2 | step: 7920 +epoch: 126 | 7/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.014 | time: 1:28:59.9 | step: 7930 +epoch: 126 | 17/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.012 | time: 1:29:08.9 | step: 7940 +epoch: 126 | 27/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.009 | time: 1:29:18.0 | step: 7950 +epoch: 126 | 37/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.011 | time: 1:29:27.1 | step: 7960 +epoch: 127 | 0/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.026 | time: 1:29:35.7 | step: 7970 +epoch: 127 | 10/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.030 | time: 1:29:44.8 | step: 7980 +epoch: 127 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 1:29:53.8 | step: 7990 +epoch: 127 | 30/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 1:30:02.9 | step: 8000 +epoch: 127 | 40/ 47 | logs/44k/diffusion | batch/s: 0.37 | lr: 0.0002 | loss: 0.019 | time: 1:30:29.6 | step: 8010 +epoch: 128 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.003 | time: 1:30:38.2 | step: 8020 +epoch: 128 | 13/ 47 | logs/44k/diffusion | batch/s: 1.07 | lr: 0.0002 | loss: 0.009 | time: 1:30:47.6 | step: 8030 +epoch: 128 | 23/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.014 | time: 1:30:57.1 | step: 8040 +epoch: 128 | 33/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.012 | time: 1:31:06.3 | step: 8050 +epoch: 128 | 43/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.009 | time: 1:31:15.4 | step: 8060 +epoch: 129 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.018 | time: 1:31:23.9 | step: 8070 +epoch: 129 | 16/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 1:31:32.7 | step: 8080 +epoch: 129 | 26/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 1:31:41.6 | step: 8090 +epoch: 129 | 36/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.027 | time: 1:31:50.6 | step: 8100 +epoch: 129 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.019 | time: 1:31:59.1 | step: 8110 +epoch: 130 | 9/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.025 | time: 1:32:08.3 | step: 8120 +epoch: 130 | 19/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.012 | time: 1:32:17.5 | step: 8130 +epoch: 130 | 29/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.010 | time: 1:32:26.6 | step: 8140 +epoch: 130 | 39/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.006 | time: 1:32:35.7 | step: 8150 +epoch: 131 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.014 | time: 1:32:44.3 | step: 8160 +epoch: 131 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 1:32:53.4 | step: 8170 +epoch: 131 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.036 | time: 1:33:02.3 | step: 8180 +epoch: 131 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 1:33:11.4 | step: 8190 +epoch: 131 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 1:33:20.4 | step: 8200 +epoch: 132 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.022 | time: 1:33:29.0 | step: 8210 +epoch: 132 | 15/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.042 | time: 1:33:38.0 | step: 8220 +epoch: 132 | 25/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.012 | time: 1:33:47.1 | step: 8230 +epoch: 132 | 35/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 1:33:56.2 | step: 8240 +epoch: 132 | 45/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.028 | time: 1:34:05.2 | step: 8250 +epoch: 133 | 8/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.018 | time: 1:34:13.9 | step: 8260 +epoch: 133 | 18/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.023 | time: 1:34:23.0 | step: 8270 +epoch: 133 | 28/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.016 | time: 1:34:32.0 | step: 8280 +epoch: 133 | 38/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.015 | time: 1:34:41.1 | step: 8290 +epoch: 134 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.019 | time: 1:34:49.8 | step: 8300 +epoch: 134 | 11/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.017 | time: 1:34:58.8 | step: 8310 +epoch: 134 | 21/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.019 | time: 1:35:07.9 | step: 8320 +epoch: 134 | 31/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.021 | time: 1:35:17.0 | step: 8330 +epoch: 134 | 41/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.024 | time: 1:35:26.0 | step: 8340 +epoch: 135 | 4/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.028 | time: 1:35:34.7 | step: 8350 +epoch: 135 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 1:35:43.8 | step: 8360 +epoch: 135 | 24/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.017 | time: 1:35:52.8 | step: 8370 +epoch: 135 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.045 | time: 1:36:01.9 | step: 8380 +epoch: 135 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 1:36:10.9 | step: 8390 +epoch: 136 | 7/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.010 | time: 1:36:19.5 | step: 8400 +epoch: 136 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 1:36:28.5 | step: 8410 +epoch: 136 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 1:36:37.5 | step: 8420 +epoch: 136 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 1:36:46.5 | step: 8430 +epoch: 137 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.044 | time: 1:36:55.1 | step: 8440 +epoch: 137 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 1:37:04.1 | step: 8450 +epoch: 137 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 1:37:13.1 | step: 8460 +epoch: 137 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 1:37:22.1 | step: 8470 +epoch: 137 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 1:37:31.1 | step: 8480 +epoch: 138 | 3/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.016 | time: 1:37:39.7 | step: 8490 +epoch: 138 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 1:37:48.7 | step: 8500 +epoch: 138 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 1:37:57.8 | step: 8510 +epoch: 138 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 1:38:06.8 | step: 8520 +epoch: 138 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 1:38:15.8 | step: 8530 +epoch: 139 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.040 | time: 1:38:24.4 | step: 8540 +epoch: 139 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.004 | time: 1:38:33.4 | step: 8550 +epoch: 139 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 1:38:42.4 | step: 8560 +epoch: 139 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 1:38:51.4 | step: 8570 +epoch: 139 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.007 | time: 1:39:00.0 | step: 8580 +epoch: 140 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 1:39:09.2 | step: 8590 +epoch: 140 | 19/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.025 | time: 1:39:18.3 | step: 8600 +epoch: 140 | 29/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.031 | time: 1:39:27.3 | step: 8610 +epoch: 140 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.033 | time: 1:39:36.4 | step: 8620 +epoch: 141 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.062 | time: 1:39:45.0 | step: 8630 +epoch: 141 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.037 | time: 1:39:54.0 | step: 8640 +epoch: 141 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.035 | time: 1:40:03.0 | step: 8650 +epoch: 141 | 32/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.038 | time: 1:40:12.0 | step: 8660 +epoch: 141 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.037 | time: 1:40:21.1 | step: 8670 +epoch: 142 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.056 | time: 1:40:29.7 | step: 8680 +epoch: 142 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 1:40:38.7 | step: 8690 +epoch: 142 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 1:40:47.7 | step: 8700 +epoch: 142 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.045 | time: 1:40:56.8 | step: 8710 +epoch: 142 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 1:41:05.8 | step: 8720 +epoch: 143 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.009 | time: 1:41:14.4 | step: 8730 +epoch: 143 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 1:41:23.4 | step: 8740 +epoch: 143 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.005 | time: 1:41:32.5 | step: 8750 +epoch: 143 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 1:41:41.5 | step: 8760 +epoch: 144 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.009 | time: 1:41:50.1 | step: 8770 +epoch: 144 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 1:41:59.1 | step: 8780 +epoch: 144 | 21/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.012 | time: 1:42:08.2 | step: 8790 --- model size --- model: 55,192,704 ======= start training ======= epoch|batch_idx/num_batches|output_dir|batch/s|lr|time|step -epoch: 0 | 9/ 47 | logs/44k/diffusion | batch/s: 2.14 | lr: 0.0002 | loss: 0.031 | time: 0:00:04.9 | step: 10 -epoch: 0 | 19/ 47 | logs/44k/diffusion | batch/s: 2.19 | lr: 0.0002 | loss: 0.042 | time: 0:00:09.5 | step: 20 -epoch: 0 | 29/ 47 | logs/44k/diffusion | batch/s: 2.21 | lr: 0.0002 | loss: 0.022 | time: 0:00:14.0 | step: 30 -epoch: 0 | 39/ 47 | logs/44k/diffusion | batch/s: 2.21 | lr: 0.0002 | loss: 0.017 | time: 0:00:18.5 | step: 40 -epoch: 1 | 2/ 47 | logs/44k/diffusion | batch/s: 2.22 | lr: 0.0002 | loss: 0.016 | time: 0:00:23.0 | step: 50 -epoch: 1 | 12/ 47 | logs/44k/diffusion | batch/s: 2.09 | lr: 0.0002 | loss: 0.031 | time: 0:00:27.9 | step: 60 -epoch: 1 | 22/ 47 | logs/44k/diffusion | batch/s: 2.09 | lr: 0.0002 | loss: 0.018 | time: 0:00:32.6 | step: 70 -epoch: 1 | 32/ 47 | logs/44k/diffusion | batch/s: 2.03 | lr: 0.0002 | loss: 0.011 | time: 0:00:37.6 | step: 80 -epoch: 1 | 42/ 47 | logs/44k/diffusion | batch/s: 1.98 | lr: 0.0002 | loss: 0.018 | time: 0:00:42.6 | step: 90 -epoch: 2 | 5/ 47 | logs/44k/diffusion | batch/s: 2.01 | lr: 0.0002 | loss: 0.048 | time: 0:00:47.6 | step: 100 -epoch: 2 | 15/ 47 | logs/44k/diffusion | batch/s: 1.93 | lr: 0.0002 | loss: 0.015 | time: 0:00:52.8 | step: 110 -epoch: 2 | 25/ 47 | logs/44k/diffusion | batch/s: 1.95 | lr: 0.0002 | loss: 0.009 | time: 0:00:57.9 | step: 120 -epoch: 2 | 35/ 47 | logs/44k/diffusion | batch/s: 1.91 | lr: 0.0002 | loss: 0.016 | time: 0:01:03.1 | step: 130 -epoch: 2 | 45/ 47 | logs/44k/diffusion | batch/s: 1.91 | lr: 0.0002 | loss: 0.008 | time: 0:01:08.4 | step: 140 -epoch: 3 | 8/ 47 | logs/44k/diffusion | batch/s: 2.00 | lr: 0.0002 | loss: 0.024 | time: 0:01:13.4 | step: 150 -epoch: 3 | 18/ 47 | logs/44k/diffusion | batch/s: 1.90 | lr: 0.0002 | loss: 0.025 | time: 0:01:18.7 | step: 160 -epoch: 3 | 28/ 47 | logs/44k/diffusion | batch/s: 1.77 | lr: 0.0002 | loss: 0.025 | time: 0:01:24.3 | step: 170 -epoch: 3 | 38/ 47 | logs/44k/diffusion | batch/s: 1.89 | lr: 0.0002 | loss: 0.024 | time: 0:01:29.6 | step: 180 -epoch: 4 | 1/ 47 | logs/44k/diffusion | batch/s: 1.88 | lr: 0.0002 | loss: 0.010 | time: 0:01:34.9 | step: 190 +epoch: 0 | 9/ 47 | logs/44k/diffusion | batch/s: 0.63 | lr: 0.0002 | loss: 0.011 | time: 0:00:16.4 | step: 8010 +epoch: 0 | 19/ 47 | logs/44k/diffusion | batch/s: 1.23 | lr: 0.0002 | loss: 0.007 | time: 0:00:24.5 | step: 8020 +epoch: 0 | 29/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.008 | time: 0:00:32.8 | step: 8030 +epoch: 0 | 39/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.025 | time: 0:00:41.1 | step: 8040 +epoch: 1 | 2/ 47 | logs/44k/diffusion | batch/s: 1.23 | lr: 0.0002 | loss: 0.011 | time: 0:00:49.3 | step: 8050 +epoch: 1 | 12/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.011 | time: 0:00:57.8 | step: 8060 +epoch: 1 | 22/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.045 | time: 0:01:06.5 | step: 8070 +epoch: 1 | 32/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.012 | time: 0:01:15.1 | step: 8080 +epoch: 1 | 42/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.010 | time: 0:01:23.6 | step: 8090 +epoch: 2 | 5/ 47 | logs/44k/diffusion | batch/s: 1.24 | lr: 0.0002 | loss: 0.023 | time: 0:01:31.7 | step: 8100 +epoch: 2 | 15/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.008 | time: 0:01:40.1 | step: 8110 +epoch: 2 | 25/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.007 | time: 0:01:48.6 | step: 8120 +epoch: 2 | 35/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.024 | time: 0:01:57.0 | step: 8130 +epoch: 2 | 45/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.014 | time: 0:02:05.6 | step: 8140 +epoch: 3 | 8/ 47 | logs/44k/diffusion | batch/s: 1.22 | lr: 0.0002 | loss: 0.011 | time: 0:02:13.7 | step: 8150 +epoch: 3 | 18/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.021 | time: 0:02:22.3 | step: 8160 +epoch: 3 | 28/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.017 | time: 0:02:31.0 | step: 8170 +epoch: 3 | 38/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.015 | time: 0:02:39.7 | step: 8180 +epoch: 4 | 1/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.020 | time: 0:02:48.0 | step: 8190 +epoch: 4 | 11/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.021 | time: 0:02:56.6 | step: 8200 +epoch: 4 | 21/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.017 | time: 0:03:05.3 | step: 8210 +epoch: 4 | 31/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.019 | time: 0:03:13.9 | step: 8220 +epoch: 4 | 41/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.024 | time: 0:03:22.6 | step: 8230 +epoch: 5 | 4/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.042 | time: 0:03:30.8 | step: 8240 +epoch: 5 | 14/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.011 | time: 0:03:39.5 | step: 8250 +epoch: 5 | 24/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.014 | time: 0:03:48.2 | step: 8260 +epoch: 5 | 34/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.019 | time: 0:03:56.9 | step: 8270 +epoch: 5 | 44/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.031 | time: 0:04:05.6 | step: 8280 +epoch: 6 | 7/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.040 | time: 0:04:13.9 | step: 8290 +epoch: 6 | 17/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.025 | time: 0:04:22.6 | step: 8300 +epoch: 6 | 27/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.011 | time: 0:04:31.3 | step: 8310 +epoch: 6 | 37/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.019 | time: 0:04:40.0 | step: 8320 +epoch: 7 | 0/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.046 | time: 0:04:48.3 | step: 8330 +epoch: 7 | 10/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.024 | time: 0:04:57.1 | step: 8340 +epoch: 7 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:05:05.8 | step: 8350 +epoch: 7 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 0:05:14.6 | step: 8360 +epoch: 7 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:05:23.3 | step: 8370 +epoch: 8 | 3/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.047 | time: 0:05:31.6 | step: 8380 +epoch: 8 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:05:40.4 | step: 8390 +epoch: 8 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 0:05:49.1 | step: 8400 +epoch: 8 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.033 | time: 0:05:57.9 | step: 8410 +epoch: 8 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 0:06:06.7 | step: 8420 +epoch: 9 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.017 | time: 0:06:15.2 | step: 8430 +epoch: 9 | 16/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.009 | time: 0:06:24.2 | step: 8440 +epoch: 9 | 26/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.021 | time: 0:06:33.4 | step: 8450 +epoch: 9 | 36/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.022 | time: 0:06:42.5 | step: 8460 +epoch: 9 | 46/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:06:51.2 | step: 8470 +epoch: 10 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:07:00.3 | step: 8480 +epoch: 10 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:07:09.3 | step: 8490 +epoch: 10 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.036 | time: 0:07:18.3 | step: 8500 +epoch: 10 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.033 | time: 0:07:27.3 | step: 8510 +epoch: 11 | 2/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.024 | time: 0:07:35.8 | step: 8520 +epoch: 11 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:07:44.9 | step: 8530 +epoch: 11 | 22/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.021 | time: 0:07:53.9 | step: 8540 +epoch: 11 | 32/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.012 | time: 0:08:03.0 | step: 8550 +epoch: 11 | 42/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 0:08:12.0 | step: 8560 +epoch: 12 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.012 | time: 0:08:20.7 | step: 8570 +epoch: 12 | 15/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.022 | time: 0:08:29.7 | step: 8580 +epoch: 12 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.030 | time: 0:08:38.8 | step: 8590 +epoch: 12 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:08:47.8 | step: 8600 +epoch: 12 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:08:56.9 | step: 8610 +epoch: 13 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.033 | time: 0:09:05.5 | step: 8620 +epoch: 13 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:09:14.5 | step: 8630 +epoch: 13 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:09:23.5 | step: 8640 +epoch: 13 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.041 | time: 0:09:32.5 | step: 8650 +epoch: 14 | 1/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.023 | time: 0:09:41.1 | step: 8660 +epoch: 14 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:09:50.1 | step: 8670 +epoch: 14 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:09:59.1 | step: 8680 +epoch: 14 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 0:10:08.1 | step: 8690 +epoch: 14 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:10:17.1 | step: 8700 +epoch: 15 | 4/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.028 | time: 0:10:25.6 | step: 8710 +epoch: 15 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:10:34.6 | step: 8720 +epoch: 15 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:10:43.6 | step: 8730 +epoch: 15 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.031 | time: 0:10:52.6 | step: 8740 +epoch: 15 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:11:01.7 | step: 8750 +epoch: 16 | 7/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.036 | time: 0:11:10.3 | step: 8760 +epoch: 16 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.054 | time: 0:11:19.3 | step: 8770 +epoch: 16 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:11:28.3 | step: 8780 +epoch: 16 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.031 | time: 0:11:37.4 | step: 8790 +epoch: 17 | 0/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.014 | time: 0:11:46.0 | step: 8800 +epoch: 17 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:11:55.0 | step: 8810 +epoch: 17 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:12:04.0 | step: 8820 +epoch: 17 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:12:13.0 | step: 8830 +epoch: 17 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:12:22.0 | step: 8840 +epoch: 18 | 3/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.017 | time: 0:12:30.6 | step: 8850 +epoch: 18 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.031 | time: 0:12:39.6 | step: 8860 +epoch: 18 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:12:48.6 | step: 8870 +epoch: 18 | 33/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.005 | time: 0:12:57.7 | step: 8880 +epoch: 18 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:13:06.7 | step: 8890 +epoch: 19 | 6/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.017 | time: 0:13:15.3 | step: 8900 +epoch: 19 | 16/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.046 | time: 0:13:24.4 | step: 8910 +epoch: 19 | 26/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.024 | time: 0:13:33.5 | step: 8920 +epoch: 19 | 36/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.011 | time: 0:13:42.6 | step: 8930 +epoch: 19 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.026 | time: 0:13:51.2 | step: 8940 +epoch: 20 | 9/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 0:14:00.3 | step: 8950 +epoch: 20 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:14:09.4 | step: 8960 +epoch: 20 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:14:18.4 | step: 8970 +epoch: 20 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:14:27.5 | step: 8980 +epoch: 21 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.020 | time: 0:14:36.1 | step: 8990 +epoch: 21 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:14:45.1 | step: 9000 +epoch: 21 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:14:54.1 | step: 9010 +epoch: 21 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:15:03.2 | step: 9020 +epoch: 21 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:15:12.2 | step: 9030 +epoch: 22 | 5/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.014 | time: 0:15:20.8 | step: 9040 +epoch: 22 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:15:29.8 | step: 9050 +epoch: 22 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:15:38.8 | step: 9060 +epoch: 22 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:15:47.9 | step: 9070 +epoch: 22 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:15:56.9 | step: 9080 +epoch: 23 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.014 | time: 0:16:05.5 | step: 9090 +epoch: 23 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:16:14.5 | step: 9100 +epoch: 23 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:16:23.5 | step: 9110 +epoch: 23 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:16:32.5 | step: 9120 +epoch: 24 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.021 | time: 0:16:41.1 | step: 9130 +epoch: 24 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 0:16:50.2 | step: 9140 +epoch: 24 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 0:16:59.2 | step: 9150 +epoch: 24 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:17:08.2 | step: 9160 +epoch: 24 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.045 | time: 0:17:17.2 | step: 9170 +epoch: 25 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.031 | time: 0:17:25.8 | step: 9180 +epoch: 25 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:17:34.9 | step: 9190 +epoch: 25 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:17:43.9 | step: 9200 +epoch: 25 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.042 | time: 0:17:52.9 | step: 9210 +epoch: 25 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:18:01.9 | step: 9220 +epoch: 26 | 7/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.017 | time: 0:18:10.5 | step: 9230 +epoch: 26 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.004 | time: 0:18:19.6 | step: 9240 +epoch: 26 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:18:28.6 | step: 9250 +epoch: 26 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:18:37.6 | step: 9260 +epoch: 27 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.028 | time: 0:18:46.2 | step: 9270 +epoch: 27 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:18:55.2 | step: 9280 +epoch: 27 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:19:04.2 | step: 9290 +epoch: 27 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 0:19:13.1 | step: 9300 +epoch: 27 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.007 | time: 0:19:22.1 | step: 9310 +epoch: 28 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.029 | time: 0:19:30.6 | step: 9320 +epoch: 28 | 13/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.052 | time: 0:19:39.5 | step: 9330 +epoch: 28 | 23/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 0:19:48.4 | step: 9340 +epoch: 28 | 33/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 0:19:57.3 | step: 9350 +epoch: 28 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 0:20:06.2 | step: 9360 +epoch: 29 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.043 | time: 0:20:14.7 | step: 9370 +epoch: 29 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.008 | time: 0:20:23.5 | step: 9380 +epoch: 29 | 26/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:20:32.3 | step: 9390 +epoch: 29 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:20:41.1 | step: 9400 +epoch: 29 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.008 | time: 0:20:49.5 | step: 9410 +epoch: 30 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.038 | time: 0:20:58.4 | step: 9420 +epoch: 30 | 19/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:21:07.2 | step: 9430 +epoch: 30 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:21:16.0 | step: 9440 +epoch: 30 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.047 | time: 0:21:24.8 | step: 9450 +epoch: 31 | 2/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.035 | time: 0:21:33.1 | step: 9460 +epoch: 31 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 0:21:41.9 | step: 9470 +epoch: 31 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 0:21:50.7 | step: 9480 +epoch: 31 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:21:59.5 | step: 9490 +epoch: 31 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:22:08.3 | step: 9500 +epoch: 32 | 5/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.027 | time: 0:22:16.7 | step: 9510 +epoch: 32 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 0:22:25.6 | step: 9520 +epoch: 32 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.027 | time: 0:22:34.5 | step: 9530 +epoch: 32 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:22:43.6 | step: 9540 +epoch: 32 | 45/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.012 | time: 0:22:52.7 | step: 9550 +epoch: 33 | 8/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.004 | time: 0:23:01.3 | step: 9560 +epoch: 33 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:23:10.4 | step: 9570 +epoch: 33 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:23:19.4 | step: 9580 +epoch: 33 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:23:28.4 | step: 9590 +epoch: 34 | 1/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.021 | time: 0:23:36.9 | step: 9600 +epoch: 34 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:23:45.9 | step: 9610 +epoch: 34 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:23:54.9 | step: 9620 +epoch: 34 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:24:03.9 | step: 9630 +epoch: 34 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.035 | time: 0:24:12.9 | step: 9640 +epoch: 35 | 4/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.018 | time: 0:24:21.4 | step: 9650 +epoch: 35 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:24:30.4 | step: 9660 +epoch: 35 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:24:39.4 | step: 9670 +epoch: 35 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:24:48.4 | step: 9680 +epoch: 35 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:24:57.4 | step: 9690 +epoch: 36 | 7/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.016 | time: 0:25:06.0 | step: 9700 +epoch: 36 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:25:15.0 | step: 9710 +epoch: 36 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.035 | time: 0:25:24.1 | step: 9720 +epoch: 36 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:25:33.1 | step: 9730 +epoch: 37 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.008 | time: 0:25:41.6 | step: 9740 +epoch: 37 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:25:50.7 | step: 9750 +epoch: 37 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:25:59.7 | step: 9760 +epoch: 37 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:26:08.7 | step: 9770 +epoch: 37 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:26:17.7 | step: 9780 +epoch: 38 | 3/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.011 | time: 0:26:26.3 | step: 9790 +epoch: 38 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:26:35.3 | step: 9800 +epoch: 38 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:26:44.3 | step: 9810 +epoch: 38 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:26:53.3 | step: 9820 +epoch: 38 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:27:02.3 | step: 9830 +epoch: 39 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.031 | time: 0:27:10.9 | step: 9840 +epoch: 39 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:27:19.9 | step: 9850 +epoch: 39 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.036 | time: 0:27:28.9 | step: 9860 +epoch: 39 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:27:37.9 | step: 9870 +epoch: 39 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 0:27:46.5 | step: 9880 +epoch: 40 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:27:55.5 | step: 9890 +epoch: 40 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:28:04.6 | step: 9900 +epoch: 40 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.039 | time: 0:28:13.6 | step: 9910 +epoch: 40 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 0:28:22.6 | step: 9920 +epoch: 41 | 2/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.016 | time: 0:28:31.1 | step: 9930 +epoch: 41 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:28:40.1 | step: 9940 +epoch: 41 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.005 | time: 0:28:49.2 | step: 9950 +epoch: 41 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:28:58.2 | step: 9960 +epoch: 41 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:29:07.2 | step: 9970 +epoch: 42 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.029 | time: 0:29:15.8 | step: 9980 +epoch: 42 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:29:24.8 | step: 9990 +epoch: 42 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:29:33.8 | step: 10000 +epoch: 42 | 35/ 47 | logs/44k/diffusion | batch/s: 0.24 | lr: 0.0002 | loss: 0.014 | time: 0:30:16.3 | step: 10010 +epoch: 42 | 45/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.023 | time: 0:30:25.0 | step: 10020 +epoch: 43 | 8/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.024 | time: 0:30:33.3 | step: 10030 +epoch: 43 | 18/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.027 | time: 0:30:42.0 | step: 10040 +epoch: 43 | 28/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.010 | time: 0:30:50.7 | step: 10050 +epoch: 43 | 38/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.017 | time: 0:30:59.4 | step: 10060 +epoch: 44 | 1/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.023 | time: 0:31:07.6 | step: 10070 +epoch: 44 | 11/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.024 | time: 0:31:16.3 | step: 10080 +epoch: 44 | 21/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.042 | time: 0:31:25.0 | step: 10090 +epoch: 44 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:31:33.8 | step: 10100 +epoch: 44 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:31:42.5 | step: 10110 +epoch: 45 | 4/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.021 | time: 0:31:50.9 | step: 10120 +epoch: 45 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:31:59.7 | step: 10130 +epoch: 45 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.044 | time: 0:32:08.4 | step: 10140 +epoch: 45 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.044 | time: 0:32:17.2 | step: 10150 +epoch: 45 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.039 | time: 0:32:26.0 | step: 10160 +epoch: 46 | 7/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.021 | time: 0:32:34.3 | step: 10170 +epoch: 46 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.039 | time: 0:32:43.1 | step: 10180 +epoch: 46 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.045 | time: 0:32:51.8 | step: 10190 +epoch: 46 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:33:00.6 | step: 10200 +epoch: 47 | 0/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.010 | time: 0:33:08.9 | step: 10210 +epoch: 47 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 0:33:17.7 | step: 10220 +epoch: 47 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.037 | time: 0:33:26.4 | step: 10230 +epoch: 47 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:33:35.2 | step: 10240 +epoch: 47 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:33:44.0 | step: 10250 +epoch: 48 | 3/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.023 | time: 0:33:52.3 | step: 10260 +epoch: 48 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 0:34:01.1 | step: 10270 +epoch: 48 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:34:09.8 | step: 10280 +epoch: 48 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.026 | time: 0:34:18.6 | step: 10290 +epoch: 48 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:34:27.4 | step: 10300 +epoch: 49 | 6/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.012 | time: 0:34:35.7 | step: 10310 +epoch: 49 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:34:44.5 | step: 10320 +epoch: 49 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 0:34:53.2 | step: 10330 +epoch: 49 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:35:02.0 | step: 10340 +epoch: 49 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:35:10.5 | step: 10350 +epoch: 50 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.048 | time: 0:35:19.7 | step: 10360 +epoch: 50 | 19/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.026 | time: 0:35:28.8 | step: 10370 +epoch: 50 | 29/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.020 | time: 0:35:37.9 | step: 10380 +epoch: 50 | 39/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.023 | time: 0:35:47.0 | step: 10390 +epoch: 51 | 2/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.046 | time: 0:35:55.7 | step: 10400 +epoch: 51 | 12/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.008 | time: 0:36:04.7 | step: 10410 +epoch: 51 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.035 | time: 0:36:13.7 | step: 10420 +epoch: 51 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.039 | time: 0:36:22.7 | step: 10430 +epoch: 51 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:36:31.7 | step: 10440 +epoch: 52 | 5/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.016 | time: 0:36:40.2 | step: 10450 +epoch: 52 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:36:49.2 | step: 10460 +epoch: 52 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:36:58.2 | step: 10470 +epoch: 52 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:37:07.2 | step: 10480 +epoch: 52 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:37:16.3 | step: 10490 +epoch: 53 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.008 | time: 0:37:24.8 | step: 10500 +epoch: 53 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 0:37:33.8 | step: 10510 +epoch: 53 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:37:42.8 | step: 10520 +epoch: 53 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.032 | time: 0:37:51.9 | step: 10530 +epoch: 54 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.018 | time: 0:38:00.5 | step: 10540 +epoch: 54 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.037 | time: 0:38:09.5 | step: 10550 +epoch: 54 | 21/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 0:38:18.5 | step: 10560 +epoch: 54 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:38:27.6 | step: 10570 +epoch: 54 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:38:36.6 | step: 10580 +epoch: 55 | 4/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.010 | time: 0:38:45.2 | step: 10590 +epoch: 55 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.004 | time: 0:38:54.2 | step: 10600 +epoch: 55 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:39:03.2 | step: 10610 +epoch: 55 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:39:12.3 | step: 10620 +epoch: 55 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.041 | time: 0:39:21.3 | step: 10630 +epoch: 56 | 7/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.028 | time: 0:39:29.9 | step: 10640 +epoch: 56 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:39:38.9 | step: 10650 +epoch: 56 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:39:47.9 | step: 10660 +epoch: 56 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:39:57.0 | step: 10670 +epoch: 57 | 0/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.008 | time: 0:40:05.6 | step: 10680 +epoch: 57 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:40:14.6 | step: 10690 +epoch: 57 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.031 | time: 0:40:23.6 | step: 10700 +epoch: 57 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 0:40:32.6 | step: 10710 +epoch: 57 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:40:41.7 | step: 10720 +epoch: 58 | 3/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.011 | time: 0:40:50.3 | step: 10730 +epoch: 58 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:40:59.3 | step: 10740 +epoch: 58 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:41:08.3 | step: 10750 +epoch: 58 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:41:17.3 | step: 10760 +epoch: 58 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:41:26.3 | step: 10770 +epoch: 59 | 6/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.010 | time: 0:41:34.9 | step: 10780 +epoch: 59 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:41:43.9 | step: 10790 +epoch: 59 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:41:52.9 | step: 10800 +epoch: 59 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.030 | time: 0:42:01.9 | step: 10810 +epoch: 59 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.024 | time: 0:42:10.5 | step: 10820 +epoch: 60 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:42:19.6 | step: 10830 +epoch: 60 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:42:28.6 | step: 10840 +epoch: 60 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:42:37.6 | step: 10850 +epoch: 60 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:42:46.6 | step: 10860 +epoch: 61 | 2/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.025 | time: 0:42:55.2 | step: 10870 +epoch: 61 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:43:04.2 | step: 10880 +epoch: 61 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.045 | time: 0:43:13.2 | step: 10890 +epoch: 61 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.005 | time: 0:43:22.2 | step: 10900 +epoch: 61 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 0:43:31.2 | step: 10910 +epoch: 62 | 5/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.009 | time: 0:43:39.8 | step: 10920 +epoch: 62 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:43:48.8 | step: 10930 +epoch: 62 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:43:57.8 | step: 10940 +epoch: 62 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:44:06.8 | step: 10950 +epoch: 62 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:44:15.8 | step: 10960 +epoch: 63 | 8/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.028 | time: 0:44:24.3 | step: 10970 +epoch: 63 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:44:33.3 | step: 10980 +epoch: 63 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:44:42.3 | step: 10990 +epoch: 63 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.036 | time: 0:44:51.4 | step: 11000 +epoch: 64 | 1/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.008 | time: 0:44:59.9 | step: 11010 +epoch: 64 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:45:09.0 | step: 11020 +epoch: 64 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.042 | time: 0:45:18.0 | step: 11030 +epoch: 64 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:45:27.0 | step: 11040 +epoch: 64 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 0:45:36.0 | step: 11050 +epoch: 65 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.038 | time: 0:45:44.6 | step: 11060 +epoch: 65 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 0:45:53.6 | step: 11070 +epoch: 65 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.041 | time: 0:46:02.6 | step: 11080 +epoch: 65 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.032 | time: 0:46:11.6 | step: 11090 +epoch: 65 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:46:20.7 | step: 11100 +epoch: 66 | 7/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.013 | time: 0:46:29.3 | step: 11110 +epoch: 66 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:46:38.3 | step: 11120 +epoch: 66 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:46:47.3 | step: 11130 +epoch: 66 | 37/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.015 | time: 0:46:56.4 | step: 11140 +epoch: 67 | 0/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.019 | time: 0:47:05.0 | step: 11150 +epoch: 67 | 10/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.004 | time: 0:47:14.0 | step: 11160 +epoch: 67 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:47:23.1 | step: 11170 +epoch: 67 | 30/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.015 | time: 0:47:32.1 | step: 11180 +epoch: 67 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.032 | time: 0:47:41.1 | step: 11190 +epoch: 68 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.044 | time: 0:47:49.8 | step: 11200 +epoch: 68 | 13/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.036 | time: 0:47:58.8 | step: 11210 +epoch: 68 | 23/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.015 | time: 0:48:07.9 | step: 11220 +epoch: 68 | 33/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 0:48:17.0 | step: 11230 +epoch: 68 | 43/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.028 | time: 0:48:26.0 | step: 11240 +epoch: 69 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.048 | time: 0:48:34.6 | step: 11250 +epoch: 69 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.037 | time: 0:48:43.6 | step: 11260 +epoch: 69 | 26/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 0:48:52.6 | step: 11270 +epoch: 69 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:49:01.5 | step: 11280 +epoch: 69 | 46/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.008 | time: 0:49:10.0 | step: 11290 +epoch: 70 | 9/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.031 | time: 0:49:19.1 | step: 11300 +epoch: 70 | 19/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 0:49:28.0 | step: 11310 +epoch: 70 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.004 | time: 0:49:36.9 | step: 11320 +epoch: 70 | 39/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.021 | time: 0:49:45.8 | step: 11330 +epoch: 71 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.007 | time: 0:49:54.3 | step: 11340 +epoch: 71 | 12/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.017 | time: 0:50:03.1 | step: 11350 +epoch: 71 | 22/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 0:50:12.0 | step: 11360 +epoch: 71 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:50:20.9 | step: 11370 +epoch: 71 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 0:50:29.7 | step: 11380 +epoch: 72 | 5/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.024 | time: 0:50:38.1 | step: 11390 +epoch: 72 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 0:50:47.0 | step: 11400 +epoch: 72 | 25/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:50:55.8 | step: 11410 +epoch: 72 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.024 | time: 0:51:04.6 | step: 11420 +epoch: 72 | 45/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:51:13.4 | step: 11430 +epoch: 73 | 8/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.012 | time: 0:51:21.8 | step: 11440 +epoch: 73 | 18/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.024 | time: 0:51:30.6 | step: 11450 +epoch: 73 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 0:51:39.4 | step: 11460 +epoch: 73 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 0:51:48.2 | step: 11470 +epoch: 74 | 1/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.021 | time: 0:51:56.6 | step: 11480 +epoch: 74 | 11/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.039 | time: 0:52:05.4 | step: 11490 +epoch: 74 | 21/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 0:52:14.1 | step: 11500 +epoch: 74 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:52:22.9 | step: 11510 +epoch: 74 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:52:31.7 | step: 11520 +epoch: 75 | 4/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.029 | time: 0:52:40.0 | step: 11530 +epoch: 75 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:52:48.8 | step: 11540 +epoch: 75 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 0:52:57.5 | step: 11550 +epoch: 75 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:53:06.3 | step: 11560 +epoch: 75 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 0:53:15.0 | step: 11570 +epoch: 76 | 7/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.048 | time: 0:53:23.4 | step: 11580 +epoch: 76 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:53:32.2 | step: 11590 +epoch: 76 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 0:53:40.9 | step: 11600 +epoch: 76 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:53:49.7 | step: 11610 +epoch: 77 | 0/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.014 | time: 0:53:58.1 | step: 11620 +epoch: 77 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:54:06.9 | step: 11630 +epoch: 77 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:54:15.6 | step: 11640 +epoch: 77 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 0:54:24.4 | step: 11650 +epoch: 77 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:54:33.2 | step: 11660 +epoch: 78 | 3/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.005 | time: 0:54:41.6 | step: 11670 +epoch: 78 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 0:54:50.3 | step: 11680 +epoch: 78 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.028 | time: 0:54:59.1 | step: 11690 +epoch: 78 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:55:07.9 | step: 11700 +epoch: 78 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:55:16.6 | step: 11710 +epoch: 79 | 6/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.043 | time: 0:55:25.0 | step: 11720 +epoch: 79 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.024 | time: 0:55:33.7 | step: 11730 +epoch: 79 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.035 | time: 0:55:42.5 | step: 11740 +epoch: 79 | 36/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.015 | time: 0:55:51.2 | step: 11750 +epoch: 79 | 46/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.013 | time: 0:55:59.6 | step: 11760 +epoch: 80 | 9/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.023 | time: 0:56:08.4 | step: 11770 +epoch: 80 | 19/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.033 | time: 0:56:17.1 | step: 11780 +epoch: 80 | 29/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.035 | time: 0:56:25.9 | step: 11790 +epoch: 80 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.036 | time: 0:56:34.6 | step: 11800 +epoch: 81 | 2/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.014 | time: 0:56:42.9 | step: 11810 +epoch: 81 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.038 | time: 0:56:51.7 | step: 11820 +epoch: 81 | 22/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.032 | time: 0:57:00.4 | step: 11830 +epoch: 81 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:57:09.2 | step: 11840 +epoch: 81 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:57:17.9 | step: 11850 +epoch: 82 | 5/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.026 | time: 0:57:26.3 | step: 11860 +epoch: 82 | 15/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:57:35.1 | step: 11870 +epoch: 82 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 0:57:43.8 | step: 11880 +epoch: 82 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:57:52.6 | step: 11890 +epoch: 82 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 0:58:01.4 | step: 11900 +epoch: 83 | 8/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.028 | time: 0:58:09.8 | step: 11910 +epoch: 83 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:58:18.5 | step: 11920 +epoch: 83 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:58:27.3 | step: 11930 +epoch: 83 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.039 | time: 0:58:36.0 | step: 11940 +epoch: 84 | 1/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.016 | time: 0:58:44.4 | step: 11950 +epoch: 84 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:58:53.1 | step: 11960 +epoch: 84 | 21/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.031 | time: 0:59:01.9 | step: 11970 +epoch: 84 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:59:10.6 | step: 11980 +epoch: 84 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:59:19.4 | step: 11990 +epoch: 85 | 4/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.013 | time: 0:59:27.7 | step: 12000 +epoch: 85 | 14/ 47 | logs/44k/diffusion | batch/s: 0.29 | lr: 0.0002 | loss: 0.011 | time: 1:00:02.7 | step: 12010 +--- model size --- +model: 55,192,704 +======= start training ======= +epoch|batch_idx/num_batches|output_dir|batch/s|lr|time|step +epoch: 0 | 9/ 47 | logs/44k/diffusion | batch/s: 1.00 | lr: 0.0002 | loss: 0.020 | time: 0:00:10.5 | step: 12010 +epoch: 0 | 19/ 47 | logs/44k/diffusion | batch/s: 1.24 | lr: 0.0002 | loss: 0.040 | time: 0:00:18.5 | step: 12020 +epoch: 0 | 29/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.043 | time: 0:00:26.7 | step: 12030 +epoch: 0 | 39/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.018 | time: 0:00:35.1 | step: 12040 +epoch: 1 | 2/ 47 | logs/44k/diffusion | batch/s: 1.24 | lr: 0.0002 | loss: 0.016 | time: 0:00:43.1 | step: 12050 +epoch: 1 | 12/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.014 | time: 0:00:51.7 | step: 12060 +epoch: 1 | 22/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.009 | time: 0:01:00.3 | step: 12070 +epoch: 1 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 0:01:09.0 | step: 12080 +epoch: 1 | 42/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.007 | time: 0:01:17.9 | step: 12090 +epoch: 2 | 5/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.017 | time: 0:01:26.6 | step: 12100 +epoch: 2 | 15/ 47 | logs/44k/diffusion | batch/s: 1.07 | lr: 0.0002 | loss: 0.024 | time: 0:01:36.0 | step: 12110 +epoch: 2 | 25/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.009 | time: 0:01:45.2 | step: 12120 +epoch: 2 | 35/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.028 | time: 0:01:54.3 | step: 12130 +epoch: 2 | 45/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.033 | time: 0:02:03.2 | step: 12140 +epoch: 3 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.012 | time: 0:02:11.7 | step: 12150 +epoch: 3 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 0:02:20.5 | step: 12160 +epoch: 3 | 28/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 0:02:29.4 | step: 12170 +epoch: 3 | 38/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 0:02:38.4 | step: 12180 +epoch: 4 | 1/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.005 | time: 0:02:46.9 | step: 12190 +epoch: 4 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:02:56.0 | step: 12200 +epoch: 4 | 21/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 0:03:05.1 | step: 12210 +epoch: 4 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:03:14.1 | step: 12220 +epoch: 4 | 41/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.011 | time: 0:03:23.2 | step: 12230 +epoch: 5 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.023 | time: 0:03:31.8 | step: 12240 +epoch: 5 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:03:40.8 | step: 12250 +epoch: 5 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 0:03:49.8 | step: 12260 +epoch: 5 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:03:58.8 | step: 12270 +epoch: 5 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:04:07.8 | step: 12280 +epoch: 6 | 7/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.015 | time: 0:04:16.3 | step: 12290 +epoch: 6 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.040 | time: 0:04:25.3 | step: 12300 +epoch: 6 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:04:34.4 | step: 12310 +epoch: 6 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:04:43.4 | step: 12320 +epoch: 7 | 0/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.024 | time: 0:04:52.0 | step: 12330 +epoch: 7 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:05:01.0 | step: 12340 +epoch: 7 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.033 | time: 0:05:10.1 | step: 12350 +epoch: 7 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:05:19.1 | step: 12360 +epoch: 7 | 40/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.011 | time: 0:05:28.1 | step: 12370 +epoch: 8 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.042 | time: 0:05:36.7 | step: 12380 +epoch: 8 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:05:45.7 | step: 12390 +epoch: 8 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.030 | time: 0:05:54.8 | step: 12400 +epoch: 8 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:06:03.8 | step: 12410 +epoch: 8 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:06:12.8 | step: 12420 +epoch: 9 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.018 | time: 0:06:21.4 | step: 12430 +epoch: 9 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:06:30.5 | step: 12440 +epoch: 9 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:06:39.5 | step: 12450 +epoch: 9 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:06:48.5 | step: 12460 +epoch: 9 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 0:06:57.1 | step: 12470 +epoch: 10 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 0:07:06.2 | step: 12480 +epoch: 10 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:07:15.2 | step: 12490 +epoch: 10 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:07:24.3 | step: 12500 +epoch: 10 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:07:33.3 | step: 12510 +epoch: 11 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.011 | time: 0:07:41.9 | step: 12520 +epoch: 11 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:07:50.9 | step: 12530 +epoch: 11 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:08:00.0 | step: 12540 +epoch: 11 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:08:09.0 | step: 12550 +epoch: 11 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:08:18.0 | step: 12560 +epoch: 12 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.028 | time: 0:08:26.7 | step: 12570 +epoch: 12 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:08:35.7 | step: 12580 +epoch: 12 | 25/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.024 | time: 0:08:44.8 | step: 12590 +epoch: 12 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:08:53.9 | step: 12600 +epoch: 12 | 45/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 0:09:02.9 | step: 12610 +epoch: 13 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.014 | time: 0:09:11.5 | step: 12620 +epoch: 13 | 18/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.013 | time: 0:09:20.6 | step: 12630 +epoch: 13 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.034 | time: 0:09:29.6 | step: 12640 +epoch: 13 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:09:38.7 | step: 12650 +epoch: 14 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.022 | time: 0:09:47.3 | step: 12660 +epoch: 14 | 11/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.010 | time: 0:09:56.3 | step: 12670 +epoch: 14 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:10:05.4 | step: 12680 +epoch: 14 | 31/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.037 | time: 0:10:14.4 | step: 12690 +epoch: 14 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:10:23.5 | step: 12700 +epoch: 15 | 4/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.034 | time: 0:10:32.0 | step: 12710 +epoch: 15 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 0:10:41.0 | step: 12720 +epoch: 15 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:10:50.0 | step: 12730 +epoch: 15 | 34/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 0:10:59.0 | step: 12740 +epoch: 15 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:11:08.0 | step: 12750 +epoch: 16 | 7/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.032 | time: 0:11:16.5 | step: 12760 +epoch: 16 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:11:25.5 | step: 12770 +epoch: 16 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:11:34.5 | step: 12780 +epoch: 16 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:11:43.5 | step: 12790 +epoch: 17 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.022 | time: 0:11:52.1 | step: 12800 +epoch: 17 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:12:01.0 | step: 12810 +epoch: 17 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.046 | time: 0:12:10.0 | step: 12820 +epoch: 17 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:12:19.0 | step: 12830 +epoch: 17 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:12:28.0 | step: 12840 +epoch: 18 | 3/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.051 | time: 0:12:36.6 | step: 12850 +epoch: 18 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.045 | time: 0:12:45.6 | step: 12860 +epoch: 18 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:12:54.5 | step: 12870 +epoch: 18 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.034 | time: 0:13:03.5 | step: 12880 +epoch: 18 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:13:12.5 | step: 12890 +epoch: 19 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.014 | time: 0:13:21.1 | step: 12900 +epoch: 19 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:13:30.1 | step: 12910 +epoch: 19 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:13:39.1 | step: 12920 +epoch: 19 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.004 | time: 0:13:48.1 | step: 12930 +epoch: 19 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.005 | time: 0:13:56.7 | step: 12940 +epoch: 20 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:14:05.8 | step: 12950 +epoch: 20 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:14:14.8 | step: 12960 +epoch: 20 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.033 | time: 0:14:23.8 | step: 12970 +epoch: 20 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:14:32.9 | step: 12980 +epoch: 21 | 2/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.022 | time: 0:14:41.5 | step: 12990 +epoch: 21 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:14:50.5 | step: 13000 +epoch: 21 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:14:59.5 | step: 13010 +epoch: 21 | 32/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.030 | time: 0:15:08.6 | step: 13020 +epoch: 21 | 42/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 0:15:17.7 | step: 13030 +epoch: 22 | 5/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.015 | time: 0:15:26.3 | step: 13040 +epoch: 22 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:15:35.4 | step: 13050 +epoch: 22 | 25/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.034 | time: 0:15:44.4 | step: 13060 +epoch: 22 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:15:53.5 | step: 13070 +epoch: 22 | 45/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.030 | time: 0:16:02.5 | step: 13080 +epoch: 23 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.020 | time: 0:16:11.2 | step: 13090 +epoch: 23 | 18/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.035 | time: 0:16:20.2 | step: 13100 +epoch: 23 | 28/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.017 | time: 0:16:29.3 | step: 13110 +epoch: 23 | 38/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.023 | time: 0:16:38.4 | step: 13120 +epoch: 24 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.007 | time: 0:16:47.0 | step: 13130 +epoch: 24 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.006 | time: 0:16:56.0 | step: 13140 +epoch: 24 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:17:05.1 | step: 13150 +epoch: 24 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.043 | time: 0:17:14.1 | step: 13160 +epoch: 24 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:17:23.1 | step: 13170 +epoch: 25 | 4/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.019 | time: 0:17:31.6 | step: 13180 +epoch: 25 | 14/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.021 | time: 0:17:40.6 | step: 13190 +epoch: 25 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:17:49.6 | step: 13200 +epoch: 25 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:17:58.6 | step: 13210 +epoch: 25 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.035 | time: 0:18:07.6 | step: 13220 +epoch: 26 | 7/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.009 | time: 0:18:16.1 | step: 13230 +epoch: 26 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:18:25.1 | step: 13240 +epoch: 26 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:18:34.1 | step: 13250 +epoch: 26 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.016 | time: 0:18:43.1 | step: 13260 +epoch: 27 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.015 | time: 0:18:51.7 | step: 13270 +epoch: 27 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.026 | time: 0:19:00.7 | step: 13280 +epoch: 27 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:19:09.7 | step: 13290 +epoch: 27 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.031 | time: 0:19:18.8 | step: 13300 +epoch: 27 | 40/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.015 | time: 0:19:27.8 | step: 13310 +epoch: 28 | 3/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.014 | time: 0:19:36.5 | step: 13320 +epoch: 28 | 13/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.031 | time: 0:19:45.6 | step: 13330 +epoch: 28 | 23/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.016 | time: 0:19:54.6 | step: 13340 +epoch: 28 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:20:03.7 | step: 13350 +epoch: 28 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.034 | time: 0:20:12.7 | step: 13360 +epoch: 29 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.046 | time: 0:20:21.3 | step: 13370 +epoch: 29 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.042 | time: 0:20:30.3 | step: 13380 +epoch: 29 | 26/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:20:39.3 | step: 13390 +epoch: 29 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.022 | time: 0:20:48.2 | step: 13400 +epoch: 29 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 0:20:56.8 | step: 13410 +epoch: 30 | 9/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:21:05.9 | step: 13420 +epoch: 30 | 19/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:21:14.9 | step: 13430 +epoch: 30 | 29/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 0:21:23.9 | step: 13440 +epoch: 30 | 39/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:21:33.0 | step: 13450 +epoch: 31 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.026 | time: 0:21:41.6 | step: 13460 +epoch: 31 | 12/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 0:21:50.6 | step: 13470 +epoch: 31 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.025 | time: 0:21:59.6 | step: 13480 +epoch: 31 | 32/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:22:08.7 | step: 13490 +epoch: 31 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:22:17.7 | step: 13500 +epoch: 32 | 5/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.013 | time: 0:22:26.3 | step: 13510 +epoch: 32 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 0:22:35.3 | step: 13520 +epoch: 32 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:22:44.3 | step: 13530 +epoch: 32 | 35/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:22:53.3 | step: 13540 +epoch: 32 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:23:02.3 | step: 13550 +epoch: 33 | 8/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.011 | time: 0:23:10.9 | step: 13560 +epoch: 33 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.018 | time: 0:23:19.9 | step: 13570 +epoch: 33 | 28/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:23:28.9 | step: 13580 +epoch: 33 | 38/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:23:37.9 | step: 13590 +epoch: 34 | 1/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.052 | time: 0:23:46.5 | step: 13600 +epoch: 34 | 11/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:23:55.5 | step: 13610 +epoch: 34 | 21/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.005 | time: 0:24:04.5 | step: 13620 +epoch: 34 | 31/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:24:13.5 | step: 13630 +epoch: 34 | 41/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:24:22.5 | step: 13640 +epoch: 35 | 4/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.020 | time: 0:24:31.1 | step: 13650 +epoch: 35 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.014 | time: 0:24:40.1 | step: 13660 +epoch: 35 | 24/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:24:49.1 | step: 13670 +epoch: 35 | 34/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.004 | time: 0:24:58.1 | step: 13680 +epoch: 35 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.028 | time: 0:25:07.1 | step: 13690 +epoch: 36 | 7/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.020 | time: 0:25:15.7 | step: 13700 +epoch: 36 | 17/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.020 | time: 0:25:24.7 | step: 13710 +epoch: 36 | 27/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 0:25:33.7 | step: 13720 +epoch: 36 | 37/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:25:42.7 | step: 13730 +epoch: 37 | 0/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.026 | time: 0:25:51.3 | step: 13740 +epoch: 37 | 10/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.024 | time: 0:26:00.3 | step: 13750 +epoch: 37 | 20/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.033 | time: 0:26:09.3 | step: 13760 +epoch: 37 | 30/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.023 | time: 0:26:18.3 | step: 13770 +epoch: 37 | 40/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.075 | time: 0:26:27.3 | step: 13780 +epoch: 38 | 3/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.032 | time: 0:26:35.9 | step: 13790 +epoch: 38 | 13/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.007 | time: 0:26:44.9 | step: 13800 +epoch: 38 | 23/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:26:53.9 | step: 13810 +epoch: 38 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.048 | time: 0:27:03.0 | step: 13820 +epoch: 38 | 43/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.012 | time: 0:27:12.0 | step: 13830 +epoch: 39 | 6/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.041 | time: 0:27:20.6 | step: 13840 +epoch: 39 | 16/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.029 | time: 0:27:29.7 | step: 13850 +epoch: 39 | 26/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.005 | time: 0:27:38.7 | step: 13860 +epoch: 39 | 36/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.019 | time: 0:27:47.8 | step: 13870 +epoch: 39 | 46/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.043 | time: 0:27:56.4 | step: 13880 +epoch: 40 | 9/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 0:28:05.6 | step: 13890 +epoch: 40 | 19/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.020 | time: 0:28:14.6 | step: 13900 +epoch: 40 | 29/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.006 | time: 0:28:23.7 | step: 13910 +epoch: 40 | 39/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.007 | time: 0:28:32.7 | step: 13920 +epoch: 41 | 2/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.041 | time: 0:28:41.4 | step: 13930 +epoch: 41 | 12/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.009 | time: 0:28:50.4 | step: 13940 +epoch: 41 | 22/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:28:59.5 | step: 13950 +epoch: 41 | 32/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.009 | time: 0:29:08.5 | step: 13960 +epoch: 41 | 42/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:29:17.5 | step: 13970 +epoch: 42 | 5/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.007 | time: 0:29:26.1 | step: 13980 +epoch: 42 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.015 | time: 0:29:35.2 | step: 13990 +epoch: 42 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.031 | time: 0:29:44.2 | step: 14000 +--- model size --- +model: 55,192,704 +======= start training ======= +epoch|batch_idx/num_batches|output_dir|batch/s|lr|time|step +epoch: 0 | 9/ 47 | logs/44k/diffusion | batch/s: 0.84 | lr: 0.0002 | loss: 0.013 | time: 0:00:12.5 | step: 14010 +epoch: 0 | 19/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.018 | time: 0:00:22.1 | step: 14020 +epoch: 0 | 29/ 47 | logs/44k/diffusion | batch/s: 0.99 | lr: 0.0002 | loss: 0.031 | time: 0:00:32.2 | step: 14030 +epoch: 0 | 39/ 47 | logs/44k/diffusion | batch/s: 0.98 | lr: 0.0002 | loss: 0.034 | time: 0:00:42.4 | step: 14040 +epoch: 1 | 2/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.030 | time: 0:00:51.9 | step: 14050 +epoch: 1 | 12/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.035 | time: 0:01:01.4 | step: 14060 +epoch: 1 | 22/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.031 | time: 0:01:10.8 | step: 14070 +epoch: 1 | 32/ 47 | logs/44k/diffusion | batch/s: 1.07 | lr: 0.0002 | loss: 0.023 | time: 0:01:20.1 | step: 14080 +epoch: 1 | 42/ 47 | logs/44k/diffusion | batch/s: 1.07 | lr: 0.0002 | loss: 0.019 | time: 0:01:29.5 | step: 14090 +epoch: 2 | 5/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:01:38.5 | step: 14100 +epoch: 2 | 15/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.018 | time: 0:01:48.0 | step: 14110 +epoch: 2 | 25/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.020 | time: 0:01:57.6 | step: 14120 +epoch: 2 | 35/ 47 | logs/44k/diffusion | batch/s: 1.03 | lr: 0.0002 | loss: 0.008 | time: 0:02:07.3 | step: 14130 +epoch: 2 | 45/ 47 | logs/44k/diffusion | batch/s: 1.03 | lr: 0.0002 | loss: 0.020 | time: 0:02:17.0 | step: 14140 +epoch: 3 | 8/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.016 | time: 0:02:26.1 | step: 14150 +epoch: 3 | 18/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.018 | time: 0:02:35.7 | step: 14160 +epoch: 3 | 28/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.003 | time: 0:02:45.2 | step: 14170 +epoch: 3 | 38/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.006 | time: 0:02:54.7 | step: 14180 +epoch: 4 | 1/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.013 | time: 0:03:03.7 | step: 14190 +epoch: 4 | 11/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.019 | time: 0:03:13.2 | step: 14200 +epoch: 4 | 21/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.017 | time: 0:03:22.8 | step: 14210 +epoch: 4 | 31/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.010 | time: 0:03:32.3 | step: 14220 +epoch: 4 | 41/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.017 | time: 0:03:41.8 | step: 14230 +epoch: 5 | 4/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.013 | time: 0:03:50.9 | step: 14240 +epoch: 5 | 14/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.009 | time: 0:04:00.5 | step: 14250 +epoch: 5 | 24/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.007 | time: 0:04:10.1 | step: 14260 +epoch: 5 | 34/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.012 | time: 0:04:19.7 | step: 14270 +epoch: 5 | 44/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.016 | time: 0:04:29.3 | step: 14280 +epoch: 6 | 7/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.013 | time: 0:04:38.4 | step: 14290 +epoch: 6 | 17/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.020 | time: 0:04:48.0 | step: 14300 +epoch: 6 | 27/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.027 | time: 0:04:57.6 | step: 14310 +epoch: 6 | 37/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.027 | time: 0:05:07.2 | step: 14320 +epoch: 7 | 0/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 0:05:16.3 | step: 14330 +epoch: 7 | 10/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.012 | time: 0:05:25.9 | step: 14340 +epoch: 7 | 20/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.019 | time: 0:05:35.5 | step: 14350 +epoch: 7 | 30/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.038 | time: 0:05:45.1 | step: 14360 +epoch: 7 | 40/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.017 | time: 0:05:54.7 | step: 14370 +epoch: 8 | 3/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.016 | time: 0:06:03.8 | step: 14380 +epoch: 8 | 13/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.017 | time: 0:06:13.4 | step: 14390 +epoch: 8 | 23/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.005 | time: 0:06:23.0 | step: 14400 +epoch: 8 | 33/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.014 | time: 0:06:32.5 | step: 14410 +epoch: 8 | 43/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.011 | time: 0:06:42.1 | step: 14420 +epoch: 9 | 6/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.006 | time: 0:06:51.2 | step: 14430 +epoch: 9 | 16/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.020 | time: 0:07:00.8 | step: 14440 +epoch: 9 | 26/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.008 | time: 0:07:10.4 | step: 14450 +epoch: 9 | 36/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.022 | time: 0:07:20.0 | step: 14460 +epoch: 9 | 46/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.006 | time: 0:07:29.1 | step: 14470 +epoch: 10 | 9/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.053 | time: 0:07:38.7 | step: 14480 +epoch: 10 | 19/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.015 | time: 0:07:48.3 | step: 14490 +epoch: 10 | 29/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.004 | time: 0:07:57.8 | step: 14500 +epoch: 10 | 39/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.017 | time: 0:08:07.4 | step: 14510 +epoch: 11 | 2/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.024 | time: 0:08:16.5 | step: 14520 +epoch: 11 | 12/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.030 | time: 0:08:26.1 | step: 14530 +epoch: 11 | 22/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.007 | time: 0:08:35.7 | step: 14540 +epoch: 11 | 32/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.016 | time: 0:08:45.3 | step: 14550 +epoch: 11 | 42/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.020 | time: 0:08:54.8 | step: 14560 +epoch: 12 | 5/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.021 | time: 0:09:03.9 | step: 14570 +epoch: 12 | 15/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.007 | time: 0:09:13.5 | step: 14580 +epoch: 12 | 25/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.009 | time: 0:09:23.1 | step: 14590 +epoch: 12 | 35/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.008 | time: 0:09:32.6 | step: 14600 +epoch: 12 | 45/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.022 | time: 0:09:42.2 | step: 14610 +epoch: 13 | 8/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.011 | time: 0:09:51.3 | step: 14620 +epoch: 13 | 18/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.024 | time: 0:10:00.9 | step: 14630 +epoch: 13 | 28/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.028 | time: 0:10:10.5 | step: 14640 +epoch: 13 | 38/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.022 | time: 0:10:20.0 | step: 14650 +epoch: 14 | 1/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.040 | time: 0:10:29.2 | step: 14660 +epoch: 14 | 11/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.033 | time: 0:10:38.7 | step: 14670 +epoch: 14 | 21/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.016 | time: 0:10:48.3 | step: 14680 +epoch: 14 | 31/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.024 | time: 0:10:57.9 | step: 14690 +epoch: 14 | 41/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.014 | time: 0:11:07.5 | step: 14700 +epoch: 15 | 4/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.038 | time: 0:11:16.6 | step: 14710 +epoch: 15 | 14/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.017 | time: 0:11:26.1 | step: 14720 +epoch: 15 | 24/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.023 | time: 0:11:35.7 | step: 14730 +epoch: 15 | 34/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.021 | time: 0:11:45.3 | step: 14740 +epoch: 15 | 44/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.011 | time: 0:11:54.9 | step: 14750 +epoch: 16 | 7/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.013 | time: 0:12:04.0 | step: 14760 +epoch: 16 | 17/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.018 | time: 0:12:13.5 | step: 14770 +epoch: 16 | 27/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.009 | time: 0:12:23.1 | step: 14780 +epoch: 16 | 37/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.013 | time: 0:12:32.7 | step: 14790 +epoch: 17 | 0/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.040 | time: 0:12:41.8 | step: 14800 +epoch: 17 | 10/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.020 | time: 0:12:51.4 | step: 14810 +epoch: 17 | 20/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.022 | time: 0:13:00.9 | step: 14820 +epoch: 17 | 30/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.013 | time: 0:13:10.5 | step: 14830 +epoch: 17 | 40/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.017 | time: 0:13:20.1 | step: 14840 +epoch: 18 | 3/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 0:13:29.2 | step: 14850 +epoch: 18 | 13/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.025 | time: 0:13:38.7 | step: 14860 +epoch: 18 | 23/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.032 | time: 0:13:48.3 | step: 14870 +epoch: 18 | 33/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.021 | time: 0:13:57.9 | step: 14880 +epoch: 18 | 43/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.028 | time: 0:14:07.4 | step: 14890 +epoch: 19 | 6/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.030 | time: 0:14:16.5 | step: 14900 +epoch: 19 | 16/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.003 | time: 0:14:26.1 | step: 14910 +epoch: 19 | 26/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.017 | time: 0:14:35.7 | step: 14920 +epoch: 19 | 36/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.024 | time: 0:14:45.2 | step: 14930 +epoch: 19 | 46/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.015 | time: 0:14:54.3 | step: 14940 +epoch: 20 | 9/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.012 | time: 0:15:04.0 | step: 14950 +epoch: 20 | 19/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.027 | time: 0:15:13.5 | step: 14960 +epoch: 20 | 29/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.021 | time: 0:15:23.1 | step: 14970 +epoch: 20 | 39/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.025 | time: 0:15:32.7 | step: 14980 +epoch: 21 | 2/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.038 | time: 0:15:41.8 | step: 14990 +epoch: 21 | 12/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.013 | time: 0:15:51.3 | step: 15000 +epoch: 21 | 22/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.015 | time: 0:16:00.9 | step: 15010 +epoch: 21 | 32/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.028 | time: 0:16:10.5 | step: 15020 +epoch: 21 | 42/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.021 | time: 0:16:20.0 | step: 15030 +epoch: 22 | 5/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.020 | time: 0:16:29.1 | step: 15040 +epoch: 22 | 15/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.013 | time: 0:16:38.7 | step: 15050 +epoch: 22 | 25/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.022 | time: 0:16:48.2 | step: 15060 +epoch: 22 | 35/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.005 | time: 0:16:57.8 | step: 15070 +epoch: 22 | 45/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.029 | time: 0:17:07.4 | step: 15080 +epoch: 23 | 8/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 0:17:16.5 | step: 15090 +epoch: 23 | 18/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.025 | time: 0:17:26.0 | step: 15100 +epoch: 23 | 28/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.010 | time: 0:17:35.6 | step: 15110 +epoch: 23 | 38/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.031 | time: 0:17:45.1 | step: 15120 +epoch: 24 | 1/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.024 | time: 0:17:54.2 | step: 15130 +epoch: 24 | 11/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.007 | time: 0:18:03.8 | step: 15140 +epoch: 24 | 21/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.014 | time: 0:18:13.3 | step: 15150 +epoch: 24 | 31/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.015 | time: 0:18:22.9 | step: 15160 +epoch: 24 | 41/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.009 | time: 0:18:32.4 | step: 15170 +epoch: 25 | 4/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.026 | time: 0:18:41.5 | step: 15180 +epoch: 25 | 14/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.016 | time: 0:18:51.1 | step: 15190 +epoch: 25 | 24/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.028 | time: 0:19:00.6 | step: 15200 +epoch: 25 | 34/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.008 | time: 0:19:10.2 | step: 15210 +epoch: 25 | 44/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.018 | time: 0:19:19.8 | step: 15220 +epoch: 26 | 7/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.015 | time: 0:19:28.8 | step: 15230 +epoch: 26 | 17/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.021 | time: 0:19:38.4 | step: 15240 +epoch: 26 | 27/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.007 | time: 0:19:48.0 | step: 15250 +epoch: 26 | 37/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.017 | time: 0:19:57.5 | step: 15260 +epoch: 27 | 0/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.042 | time: 0:20:06.6 | step: 15270 +epoch: 27 | 10/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.023 | time: 0:20:16.2 | step: 15280 +epoch: 27 | 20/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.022 | time: 0:20:25.7 | step: 15290 +epoch: 27 | 30/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.010 | time: 0:20:35.3 | step: 15300 +epoch: 27 | 40/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.008 | time: 0:20:44.9 | step: 15310 +epoch: 28 | 3/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 0:20:54.0 | step: 15320 +epoch: 28 | 13/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.039 | time: 0:21:03.5 | step: 15330 +epoch: 28 | 23/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.016 | time: 0:21:13.1 | step: 15340 +epoch: 28 | 33/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.035 | time: 0:21:22.7 | step: 15350 +epoch: 28 | 43/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.011 | time: 0:21:32.2 | step: 15360 +epoch: 29 | 6/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.016 | time: 0:21:41.3 | step: 15370 +epoch: 29 | 16/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.031 | time: 0:21:50.9 | step: 15380 +epoch: 29 | 26/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.018 | time: 0:22:00.5 | step: 15390 +epoch: 29 | 36/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.010 | time: 0:22:10.0 | step: 15400 +epoch: 29 | 46/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.008 | time: 0:22:19.1 | step: 15410 +epoch: 30 | 9/ 47 | logs/44k/diffusion | batch/s: 1.07 | lr: 0.0002 | loss: 0.039 | time: 0:22:28.8 | step: 15420 +epoch: 30 | 19/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.014 | time: 0:22:38.4 | step: 15430 +epoch: 30 | 29/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.006 | time: 0:22:47.9 | step: 15440 +epoch: 30 | 39/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.037 | time: 0:22:57.5 | step: 15450 +epoch: 31 | 2/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.006 | time: 0:23:06.6 | step: 15460 +epoch: 31 | 12/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.008 | time: 0:23:16.2 | step: 15470 +epoch: 31 | 22/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.018 | time: 0:23:25.8 | step: 15480 +epoch: 31 | 32/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.015 | time: 0:23:35.3 | step: 15490 +epoch: 31 | 42/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.013 | time: 0:23:44.9 | step: 15500 +epoch: 32 | 5/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 0:23:54.0 | step: 15510 +epoch: 32 | 15/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.032 | time: 0:24:03.6 | step: 15520 +epoch: 32 | 25/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.011 | time: 0:24:13.2 | step: 15530 +epoch: 32 | 35/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.008 | time: 0:24:22.7 | step: 15540 +epoch: 32 | 45/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.034 | time: 0:24:32.3 | step: 15550 +epoch: 33 | 8/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.016 | time: 0:24:41.4 | step: 15560 +epoch: 33 | 18/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.020 | time: 0:24:51.0 | step: 15570 +epoch: 33 | 28/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.036 | time: 0:25:00.6 | step: 15580 +epoch: 33 | 38/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.022 | time: 0:25:10.1 | step: 15590 +epoch: 34 | 1/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.005 | time: 0:25:19.3 | step: 15600 +epoch: 34 | 11/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.017 | time: 0:25:28.8 | step: 15610 +epoch: 34 | 21/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.011 | time: 0:25:38.4 | step: 15620 +epoch: 34 | 31/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.009 | time: 0:25:48.0 | step: 15630 +epoch: 34 | 41/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.032 | time: 0:25:57.6 | step: 15640 +epoch: 35 | 4/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.026 | time: 0:26:06.7 | step: 15650 +epoch: 35 | 14/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.012 | time: 0:26:16.3 | step: 15660 +epoch: 35 | 24/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.006 | time: 0:26:25.9 | step: 15670 +epoch: 35 | 34/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.008 | time: 0:26:35.4 | step: 15680 +epoch: 35 | 44/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.019 | time: 0:26:45.0 | step: 15690 +epoch: 36 | 7/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.039 | time: 0:26:54.1 | step: 15700 +epoch: 36 | 17/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.038 | time: 0:27:03.7 | step: 15710 +epoch: 36 | 27/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.011 | time: 0:27:13.3 | step: 15720 +epoch: 36 | 37/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.018 | time: 0:27:22.9 | step: 15730 +epoch: 37 | 0/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.007 | time: 0:27:32.0 | step: 15740 +epoch: 37 | 10/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.012 | time: 0:27:41.6 | step: 15750 +epoch: 37 | 20/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.028 | time: 0:27:51.2 | step: 15760 +epoch: 37 | 30/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.025 | time: 0:28:00.8 | step: 15770 +epoch: 37 | 40/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.008 | time: 0:28:10.4 | step: 15780 +epoch: 38 | 3/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.019 | time: 0:28:19.5 | step: 15790 +epoch: 38 | 13/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.019 | time: 0:28:29.1 | step: 15800 +epoch: 38 | 23/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.034 | time: 0:28:38.7 | step: 15810 +epoch: 38 | 33/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.018 | time: 0:28:48.2 | step: 15820 +epoch: 38 | 43/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.018 | time: 0:28:57.8 | step: 15830 +epoch: 39 | 6/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.022 | time: 0:29:06.9 | step: 15840 +epoch: 39 | 16/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.024 | time: 0:29:16.5 | step: 15850 +epoch: 39 | 26/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.018 | time: 0:29:26.1 | step: 15860 +epoch: 39 | 36/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.022 | time: 0:29:35.7 | step: 15870 +epoch: 39 | 46/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.013 | time: 0:29:44.8 | step: 15880 +epoch: 40 | 9/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.017 | time: 0:29:54.4 | step: 15890 +epoch: 40 | 19/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.009 | time: 0:30:04.0 | step: 15900 +epoch: 40 | 29/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.009 | time: 0:30:13.6 | step: 15910 +epoch: 40 | 39/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.027 | time: 0:30:23.2 | step: 15920 +epoch: 41 | 2/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.029 | time: 0:30:32.3 | step: 15930 +epoch: 41 | 12/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.023 | time: 0:30:41.9 | step: 15940 +epoch: 41 | 22/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.021 | time: 0:30:51.5 | step: 15950 +epoch: 41 | 32/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.014 | time: 0:31:01.1 | step: 15960 +epoch: 41 | 42/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.012 | time: 0:31:10.7 | step: 15970 +epoch: 42 | 5/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.021 | time: 0:31:19.8 | step: 15980 +epoch: 42 | 15/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.031 | time: 0:31:29.4 | step: 15990 +epoch: 42 | 25/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.020 | time: 0:31:39.0 | step: 16000 +epoch: 42 | 35/ 47 | logs/44k/diffusion | batch/s: 0.23 | lr: 0.0002 | loss: 0.008 | time: 0:32:21.7 | step: 16010 +epoch: 42 | 45/ 47 | logs/44k/diffusion | batch/s: 1.01 | lr: 0.0002 | loss: 0.010 | time: 0:32:31.6 | step: 16020 +epoch: 43 | 8/ 47 | logs/44k/diffusion | batch/s: 1.02 | lr: 0.0002 | loss: 0.020 | time: 0:32:41.4 | step: 16030 +epoch: 43 | 18/ 47 | logs/44k/diffusion | batch/s: 0.99 | lr: 0.0002 | loss: 0.024 | time: 0:32:51.5 | step: 16040 +epoch: 43 | 28/ 47 | logs/44k/diffusion | batch/s: 1.03 | lr: 0.0002 | loss: 0.027 | time: 0:33:01.2 | step: 16050 +epoch: 43 | 38/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.008 | time: 0:33:10.7 | step: 16060 +epoch: 44 | 1/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 0:33:19.6 | step: 16070 +epoch: 44 | 11/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.030 | time: 0:33:28.9 | step: 16080 +epoch: 44 | 21/ 47 | logs/44k/diffusion | batch/s: 1.07 | lr: 0.0002 | loss: 0.024 | time: 0:33:38.2 | step: 16090 +epoch: 44 | 31/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.032 | time: 0:33:47.7 | step: 16100 +epoch: 44 | 41/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.038 | time: 0:33:57.2 | step: 16110 +epoch: 45 | 4/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.012 | time: 0:34:06.4 | step: 16120 +epoch: 45 | 14/ 47 | logs/44k/diffusion | batch/s: 1.03 | lr: 0.0002 | loss: 0.033 | time: 0:34:16.1 | step: 16130 +epoch: 45 | 24/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.014 | time: 0:34:25.8 | step: 16140 +epoch: 45 | 34/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.022 | time: 0:34:35.4 | step: 16150 +epoch: 45 | 44/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.006 | time: 0:34:45.0 | step: 16160 +epoch: 46 | 7/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.037 | time: 0:34:54.1 | step: 16170 +epoch: 46 | 17/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.016 | time: 0:35:03.6 | step: 16180 +epoch: 46 | 27/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.014 | time: 0:35:13.1 | step: 16190 +epoch: 46 | 37/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.011 | time: 0:35:22.6 | step: 16200 +epoch: 47 | 0/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 0:35:31.7 | step: 16210 +epoch: 47 | 10/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.021 | time: 0:35:41.3 | step: 16220 +epoch: 47 | 20/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.018 | time: 0:35:50.8 | step: 16230 +epoch: 47 | 30/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.012 | time: 0:36:00.4 | step: 16240 +epoch: 47 | 40/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.012 | time: 0:36:10.0 | step: 16250 +epoch: 48 | 3/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.016 | time: 0:36:19.2 | step: 16260 +epoch: 48 | 13/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.026 | time: 0:36:28.8 | step: 16270 +epoch: 48 | 23/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.025 | time: 0:36:38.4 | step: 16280 +epoch: 48 | 33/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.021 | time: 0:36:48.0 | step: 16290 +epoch: 48 | 43/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.008 | time: 0:36:57.5 | step: 16300 +epoch: 49 | 6/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.023 | time: 0:37:06.6 | step: 16310 +epoch: 49 | 16/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.010 | time: 0:37:16.2 | step: 16320 +epoch: 49 | 26/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.013 | time: 0:37:25.7 | step: 16330 +epoch: 49 | 36/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.008 | time: 0:37:35.3 | step: 16340 +epoch: 49 | 46/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.006 | time: 0:37:44.3 | step: 16350 +epoch: 50 | 9/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.017 | time: 0:37:53.9 | step: 16360 +epoch: 50 | 19/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.004 | time: 0:38:03.4 | step: 16370 +epoch: 50 | 29/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.009 | time: 0:38:12.9 | step: 16380 +epoch: 50 | 39/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.005 | time: 0:38:22.5 | step: 16390 +epoch: 51 | 2/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.018 | time: 0:38:31.5 | step: 16400 +epoch: 51 | 12/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.016 | time: 0:38:41.1 | step: 16410 +epoch: 51 | 22/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.020 | time: 0:38:50.6 | step: 16420 +epoch: 51 | 32/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.007 | time: 0:39:00.2 | step: 16430 +epoch: 51 | 42/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.016 | time: 0:39:09.7 | step: 16440 +epoch: 52 | 5/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.013 | time: 0:39:18.8 | step: 16450 +epoch: 52 | 15/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.011 | time: 0:39:28.4 | step: 16460 +epoch: 52 | 25/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.037 | time: 0:39:37.9 | step: 16470 +epoch: 52 | 35/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.028 | time: 0:39:47.5 | step: 16480 +epoch: 52 | 45/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.043 | time: 0:39:57.0 | step: 16490 +epoch: 53 | 8/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.008 | time: 0:40:06.1 | step: 16500 +epoch: 53 | 18/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.026 | time: 0:40:15.7 | step: 16510 +epoch: 53 | 28/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.010 | time: 0:40:25.2 | step: 16520 +epoch: 53 | 38/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.038 | time: 0:40:34.8 | step: 16530 +epoch: 54 | 1/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.029 | time: 0:40:43.9 | step: 16540 +epoch: 54 | 11/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.020 | time: 0:40:53.5 | step: 16550 +epoch: 54 | 21/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.029 | time: 0:41:03.0 | step: 16560 +epoch: 54 | 31/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.015 | time: 0:41:12.6 | step: 16570 +epoch: 54 | 41/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.020 | time: 0:41:22.1 | step: 16580 +epoch: 55 | 4/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.008 | time: 0:41:31.2 | step: 16590 +epoch: 55 | 14/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.027 | time: 0:41:40.8 | step: 16600 +epoch: 55 | 24/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.007 | time: 0:41:50.4 | step: 16610 +epoch: 55 | 34/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.034 | time: 0:41:59.9 | step: 16620 +epoch: 55 | 44/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.032 | time: 0:42:09.5 | step: 16630 +epoch: 56 | 7/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.007 | time: 0:42:18.6 | step: 16640 +epoch: 56 | 17/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.011 | time: 0:42:28.1 | step: 16650 +epoch: 56 | 27/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.038 | time: 0:42:37.7 | step: 16660 +epoch: 56 | 37/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.011 | time: 0:42:47.3 | step: 16670 +epoch: 57 | 0/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.019 | time: 0:42:56.4 | step: 16680 +epoch: 57 | 10/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.017 | time: 0:43:05.9 | step: 16690 +epoch: 57 | 20/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.025 | time: 0:43:15.5 | step: 16700 +epoch: 57 | 30/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.030 | time: 0:43:25.1 | step: 16710 +epoch: 57 | 40/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.047 | time: 0:43:34.6 | step: 16720 +epoch: 58 | 3/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.021 | time: 0:43:43.7 | step: 16730 +epoch: 58 | 13/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.010 | time: 0:43:53.3 | step: 16740 +epoch: 58 | 23/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.010 | time: 0:44:02.8 | step: 16750 +epoch: 58 | 33/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.034 | time: 0:44:12.4 | step: 16760 +epoch: 58 | 43/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.010 | time: 0:44:22.0 | step: 16770 +epoch: 59 | 6/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.009 | time: 0:44:31.1 | step: 16780 +epoch: 59 | 16/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.017 | time: 0:44:40.7 | step: 16790 +epoch: 59 | 26/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.041 | time: 0:44:50.2 | step: 16800 +epoch: 59 | 36/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.018 | time: 0:44:59.8 | step: 16810 +epoch: 59 | 46/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.015 | time: 0:45:08.9 | step: 16820 +epoch: 60 | 9/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.010 | time: 0:45:18.5 | step: 16830 +epoch: 60 | 19/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.013 | time: 0:45:28.1 | step: 16840 +epoch: 60 | 29/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.009 | time: 0:45:37.7 | step: 16850 +epoch: 60 | 39/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.028 | time: 0:45:47.2 | step: 16860 +epoch: 61 | 2/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.027 | time: 0:45:56.4 | step: 16870 +epoch: 61 | 12/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.023 | time: 0:46:05.9 | step: 16880 +epoch: 61 | 22/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.040 | time: 0:46:15.5 | step: 16890 +epoch: 61 | 32/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.025 | time: 0:46:25.1 | step: 16900 +epoch: 61 | 42/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.021 | time: 0:46:34.6 | step: 16910 +epoch: 62 | 5/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.022 | time: 0:46:43.7 | step: 16920 +epoch: 62 | 15/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.006 | time: 0:46:53.3 | step: 16930 +epoch: 62 | 25/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.027 | time: 0:47:02.9 | step: 16940 +epoch: 62 | 35/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.013 | time: 0:47:12.5 | step: 16950 +epoch: 62 | 45/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.045 | time: 0:47:22.0 | step: 16960 +epoch: 63 | 8/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.011 | time: 0:47:31.1 | step: 16970 +epoch: 63 | 18/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.008 | time: 0:47:40.7 | step: 16980 +epoch: 63 | 28/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.041 | time: 0:47:50.3 | step: 16990 +epoch: 63 | 38/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.019 | time: 0:47:59.9 | step: 17000 +epoch: 64 | 1/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 0:48:09.0 | step: 17010 +epoch: 64 | 11/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.023 | time: 0:48:18.5 | step: 17020 +epoch: 64 | 21/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.022 | time: 0:48:28.1 | step: 17030 +epoch: 64 | 31/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.007 | time: 0:48:37.7 | step: 17040 +epoch: 64 | 41/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.037 | time: 0:48:47.2 | step: 17050 +epoch: 65 | 4/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.027 | time: 0:48:56.3 | step: 17060 +epoch: 65 | 14/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.018 | time: 0:49:05.9 | step: 17070 +epoch: 65 | 24/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.007 | time: 0:49:15.5 | step: 17080 +epoch: 65 | 34/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.009 | time: 0:49:25.0 | step: 17090 +epoch: 65 | 44/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.018 | time: 0:49:34.6 | step: 17100 +epoch: 66 | 7/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.011 | time: 0:49:43.7 | step: 17110 +epoch: 66 | 17/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.049 | time: 0:49:53.3 | step: 17120 +epoch: 66 | 27/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.031 | time: 0:50:02.8 | step: 17130 +epoch: 66 | 37/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.012 | time: 0:50:12.4 | step: 17140 +epoch: 67 | 0/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.021 | time: 0:50:21.4 | step: 17150 +epoch: 67 | 10/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.019 | time: 0:50:30.9 | step: 17160 +epoch: 67 | 20/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.025 | time: 0:50:40.5 | step: 17170 +epoch: 67 | 30/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.008 | time: 0:50:50.1 | step: 17180 +epoch: 67 | 40/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.036 | time: 0:50:59.7 | step: 17190 +epoch: 68 | 3/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.023 | time: 0:51:08.8 | step: 17200 +epoch: 68 | 13/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.023 | time: 0:51:18.4 | step: 17210 +epoch: 68 | 23/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.023 | time: 0:51:28.0 | step: 17220 +epoch: 68 | 33/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.043 | time: 0:51:37.6 | step: 17230 +epoch: 68 | 43/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.014 | time: 0:51:47.2 | step: 17240 +epoch: 69 | 6/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.036 | time: 0:51:56.3 | step: 17250 +epoch: 69 | 16/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.032 | time: 0:52:05.9 | step: 17260 +epoch: 69 | 26/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.010 | time: 0:52:15.5 | step: 17270 +epoch: 69 | 36/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.008 | time: 0:52:25.1 | step: 17280 +epoch: 69 | 46/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.028 | time: 0:52:34.1 | step: 17290 +epoch: 70 | 9/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.019 | time: 0:52:43.7 | step: 17300 +epoch: 70 | 19/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.052 | time: 0:52:53.3 | step: 17310 +epoch: 70 | 29/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.011 | time: 0:53:02.8 | step: 17320 +epoch: 70 | 39/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.043 | time: 0:53:12.3 | step: 17330 +epoch: 71 | 2/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.035 | time: 0:53:21.4 | step: 17340 +epoch: 71 | 12/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.032 | time: 0:53:30.9 | step: 17350 +epoch: 71 | 22/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.011 | time: 0:53:40.4 | step: 17360 +epoch: 71 | 32/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.007 | time: 0:53:50.0 | step: 17370 +epoch: 71 | 42/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.017 | time: 0:53:59.5 | step: 17380 +epoch: 72 | 5/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.014 | time: 0:54:08.6 | step: 17390 +epoch: 72 | 15/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.028 | time: 0:54:18.1 | step: 17400 +epoch: 72 | 25/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.020 | time: 0:54:27.6 | step: 17410 +epoch: 72 | 35/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.031 | time: 0:54:37.2 | step: 17420 +epoch: 72 | 45/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.016 | time: 0:54:46.7 | step: 17430 +epoch: 73 | 8/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.019 | time: 0:54:55.8 | step: 17440 +epoch: 73 | 18/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.012 | time: 0:55:05.3 | step: 17450 +epoch: 73 | 28/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.015 | time: 0:55:14.8 | step: 17460 +epoch: 73 | 38/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.008 | time: 0:55:24.3 | step: 17470 +epoch: 74 | 1/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.008 | time: 0:55:33.4 | step: 17480 +epoch: 74 | 11/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.017 | time: 0:55:43.0 | step: 17490 +epoch: 74 | 21/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.010 | time: 0:55:52.6 | step: 17500 +epoch: 74 | 31/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.015 | time: 0:56:02.2 | step: 17510 +epoch: 74 | 41/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.018 | time: 0:56:11.8 | step: 17520 +epoch: 75 | 4/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.040 | time: 0:56:20.9 | step: 17530 +epoch: 75 | 14/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.018 | time: 0:56:30.5 | step: 17540 +epoch: 75 | 24/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.016 | time: 0:56:40.0 | step: 17550 +epoch: 75 | 34/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.020 | time: 0:56:49.6 | step: 17560 +epoch: 75 | 44/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.012 | time: 0:56:59.1 | step: 17570 +epoch: 76 | 7/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.017 | time: 0:57:08.1 | step: 17580 +epoch: 76 | 17/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.013 | time: 0:57:17.6 | step: 17590 +epoch: 76 | 27/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.008 | time: 0:57:27.1 | step: 17600 +epoch: 76 | 37/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.047 | time: 0:57:36.6 | step: 17610 +epoch: 77 | 0/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.044 | time: 0:57:45.7 | step: 17620 +epoch: 77 | 10/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.041 | time: 0:57:55.2 | step: 17630 +epoch: 77 | 20/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.007 | time: 0:58:04.8 | step: 17640 +epoch: 77 | 30/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.035 | time: 0:58:14.3 | step: 17650 +epoch: 77 | 40/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.037 | time: 0:58:23.9 | step: 17660 +epoch: 78 | 3/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.016 | time: 0:58:33.0 | step: 17670 +epoch: 78 | 13/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.024 | time: 0:58:42.6 | step: 17680 +epoch: 78 | 23/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.018 | time: 0:58:52.2 | step: 17690 +epoch: 78 | 33/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.031 | time: 0:59:01.8 | step: 17700 +epoch: 78 | 43/ 47 | logs/44k/diffusion | batch/s: 1.04 | lr: 0.0002 | loss: 0.016 | time: 0:59:11.4 | step: 17710 +epoch: 79 | 6/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.007 | time: 0:59:20.5 | step: 17720 +epoch: 79 | 16/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.044 | time: 0:59:30.1 | step: 17730 +epoch: 79 | 26/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.007 | time: 0:59:39.6 | step: 17740 +epoch: 79 | 36/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.008 | time: 0:59:49.2 | step: 17750 +epoch: 79 | 46/ 47 | logs/44k/diffusion | batch/s: 1.06 | lr: 0.0002 | loss: 0.010 | time: 0:59:58.2 | step: 17760 +epoch: 80 | 9/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.014 | time: 1:00:07.8 | step: 17770 +epoch: 80 | 19/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.014 | time: 1:00:17.3 | step: 17780 +epoch: 80 | 29/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.017 | time: 1:00:26.8 | step: 17790 +epoch: 80 | 39/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.038 | time: 1:00:36.4 | step: 17800 +epoch: 81 | 2/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.016 | time: 1:00:45.4 | step: 17810 +epoch: 81 | 12/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.009 | time: 1:00:55.0 | step: 17820 +epoch: 81 | 22/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.013 | time: 1:01:04.5 | step: 17830 +epoch: 81 | 32/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.012 | time: 1:01:14.0 | step: 17840 +epoch: 81 | 42/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.009 | time: 1:01:23.6 | step: 17850 +epoch: 82 | 5/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.088 | time: 1:01:32.6 | step: 17860 +epoch: 82 | 15/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.020 | time: 1:01:42.2 | step: 17870 +epoch: 82 | 25/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.018 | time: 1:01:51.7 | step: 17880 +epoch: 82 | 35/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.008 | time: 1:02:01.3 | step: 17890 +epoch: 82 | 45/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.024 | time: 1:02:10.8 | step: 17900 +epoch: 83 | 8/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.020 | time: 1:02:19.8 | step: 17910 +epoch: 83 | 18/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.015 | time: 1:02:29.4 | step: 17920 +epoch: 83 | 28/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.024 | time: 1:02:38.9 | step: 17930 +epoch: 83 | 38/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.007 | time: 1:02:48.4 | step: 17940 +epoch: 84 | 1/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.032 | time: 1:02:57.5 | step: 17950 +epoch: 84 | 11/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.033 | time: 1:03:07.0 | step: 17960 +epoch: 84 | 21/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.030 | time: 1:03:16.5 | step: 17970 +epoch: 84 | 31/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.012 | time: 1:03:26.1 | step: 17980 +epoch: 84 | 41/ 47 | logs/44k/diffusion | batch/s: 1.05 | lr: 0.0002 | loss: 0.020 | time: 1:03:35.6 | step: 17990 +epoch: 85 | 4/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.015 | time: 1:03:44.7 | step: 18000 +--- model size --- +model: 55,192,704 +======= start training ======= +epoch|batch_idx/num_batches|output_dir|batch/s|lr|time|step +epoch: 0 | 9/ 47 | logs/44k/diffusion | batch/s: 0.67 | lr: 0.0002 | loss: 0.012 | time: 0:00:15.5 | step: 18010 +epoch: 0 | 19/ 47 | logs/44k/diffusion | batch/s: 1.25 | lr: 0.0002 | loss: 0.026 | time: 0:00:23.5 | step: 18020 +epoch: 0 | 29/ 47 | logs/44k/diffusion | batch/s: 1.23 | lr: 0.0002 | loss: 0.021 | time: 0:00:31.6 | step: 18030 +epoch: 0 | 39/ 47 | logs/44k/diffusion | batch/s: 1.23 | lr: 0.0002 | loss: 0.063 | time: 0:00:39.7 | step: 18040 +epoch: 1 | 2/ 47 | logs/44k/diffusion | batch/s: 1.26 | lr: 0.0002 | loss: 0.042 | time: 0:00:47.7 | step: 18050 +epoch: 1 | 12/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.008 | time: 0:00:56.1 | step: 18060 +epoch: 1 | 22/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.026 | time: 0:01:04.7 | step: 18070 +epoch: 1 | 32/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.015 | time: 0:01:13.3 | step: 18080 +epoch: 1 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.028 | time: 0:01:22.1 | step: 18090 +epoch: 2 | 5/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.010 | time: 0:01:30.6 | step: 18100 +epoch: 2 | 15/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.023 | time: 0:01:39.8 | step: 18110 +epoch: 2 | 25/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.012 | time: 0:01:48.9 | step: 18120 +epoch: 2 | 35/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 0:01:57.8 | step: 18130 +epoch: 2 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:02:06.6 | step: 18140 +epoch: 3 | 8/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.016 | time: 0:02:14.9 | step: 18150 +epoch: 3 | 18/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.011 | time: 0:02:23.6 | step: 18160 +epoch: 3 | 28/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.029 | time: 0:02:32.3 | step: 18170 +epoch: 3 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.024 | time: 0:02:41.1 | step: 18180 +epoch: 4 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.017 | time: 0:02:49.5 | step: 18190 +epoch: 4 | 11/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.037 | time: 0:02:58.4 | step: 18200 +epoch: 4 | 21/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 0:03:07.3 | step: 18210 +epoch: 4 | 31/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 0:03:16.3 | step: 18220 +epoch: 4 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 0:03:25.1 | step: 18230 +epoch: 5 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.024 | time: 0:03:33.6 | step: 18240 +epoch: 5 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:03:42.4 | step: 18250 +epoch: 5 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.020 | time: 0:03:51.3 | step: 18260 +epoch: 5 | 34/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:04:00.1 | step: 18270 +epoch: 5 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 0:04:09.0 | step: 18280 +epoch: 6 | 7/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.017 | time: 0:04:17.4 | step: 18290 +epoch: 6 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:04:26.2 | step: 18300 +epoch: 6 | 27/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.037 | time: 0:04:35.1 | step: 18310 +epoch: 6 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:04:44.0 | step: 18320 +epoch: 7 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.007 | time: 0:04:52.4 | step: 18330 +epoch: 7 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.020 | time: 0:05:01.3 | step: 18340 +epoch: 7 | 20/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.034 | time: 0:05:10.2 | step: 18350 +epoch: 7 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 0:05:19.0 | step: 18360 +epoch: 7 | 40/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:05:27.9 | step: 18370 +epoch: 8 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.011 | time: 0:05:36.3 | step: 18380 +epoch: 8 | 13/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.020 | time: 0:05:45.2 | step: 18390 +epoch: 8 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:05:54.1 | step: 18400 +epoch: 8 | 33/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.024 | time: 0:06:02.9 | step: 18410 +epoch: 8 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 0:06:11.8 | step: 18420 +epoch: 9 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.008 | time: 0:06:20.2 | step: 18430 +epoch: 9 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.031 | time: 0:06:29.1 | step: 18440 +epoch: 9 | 26/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.030 | time: 0:06:38.0 | step: 18450 +epoch: 9 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 0:06:46.9 | step: 18460 +epoch: 9 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 0:06:55.3 | step: 18470 +epoch: 10 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.014 | time: 0:07:04.2 | step: 18480 +epoch: 10 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.035 | time: 0:07:13.1 | step: 18490 +epoch: 10 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 0:07:22.0 | step: 18500 +epoch: 10 | 39/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.023 | time: 0:07:30.9 | step: 18510 +epoch: 11 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.023 | time: 0:07:39.4 | step: 18520 +epoch: 11 | 12/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.007 | time: 0:07:48.2 | step: 18530 +epoch: 11 | 22/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.023 | time: 0:07:57.1 | step: 18540 +epoch: 11 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.025 | time: 0:08:06.0 | step: 18550 +epoch: 11 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 0:08:14.9 | step: 18560 +epoch: 12 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.040 | time: 0:08:23.3 | step: 18570 +epoch: 12 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 0:08:32.2 | step: 18580 +epoch: 12 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.012 | time: 0:08:41.1 | step: 18590 +epoch: 12 | 35/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:08:50.0 | step: 18600 +epoch: 12 | 45/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.026 | time: 0:08:58.9 | step: 18610 +epoch: 13 | 8/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.017 | time: 0:09:07.4 | step: 18620 +epoch: 13 | 18/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 0:09:16.2 | step: 18630 +epoch: 13 | 28/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.053 | time: 0:09:25.1 | step: 18640 +epoch: 13 | 38/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 0:09:34.0 | step: 18650 +epoch: 14 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.024 | time: 0:09:42.5 | step: 18660 +epoch: 14 | 11/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.031 | time: 0:09:51.4 | step: 18670 +epoch: 14 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.036 | time: 0:10:00.3 | step: 18680 +epoch: 14 | 31/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.031 | time: 0:10:09.2 | step: 18690 +epoch: 14 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.025 | time: 0:10:18.0 | step: 18700 +epoch: 15 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.058 | time: 0:10:26.5 | step: 18710 +epoch: 15 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.006 | time: 0:10:35.4 | step: 18720 +epoch: 15 | 24/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.049 | time: 0:10:44.3 | step: 18730 +epoch: 15 | 34/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 0:10:53.2 | step: 18740 +epoch: 15 | 44/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.004 | time: 0:11:02.0 | step: 18750 +epoch: 16 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.021 | time: 0:11:10.5 | step: 18760 +epoch: 16 | 17/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 0:11:19.4 | step: 18770 +epoch: 16 | 27/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 0:11:28.3 | step: 18780 +epoch: 16 | 37/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 0:11:37.2 | step: 18790 +epoch: 17 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.010 | time: 0:11:45.6 | step: 18800 +epoch: 17 | 10/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 0:11:54.5 | step: 18810 +epoch: 17 | 20/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 0:12:03.4 | step: 18820 +epoch: 17 | 30/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.019 | time: 0:12:12.3 | step: 18830 +epoch: 17 | 40/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.037 | time: 0:12:21.2 | step: 18840 +epoch: 18 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.023 | time: 0:12:29.6 | step: 18850 +epoch: 18 | 13/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.029 | time: 0:12:38.5 | step: 18860 +epoch: 18 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:12:47.4 | step: 18870 +epoch: 18 | 33/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.008 | time: 0:12:56.3 | step: 18880 +epoch: 18 | 43/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 0:13:05.2 | step: 18890 +epoch: 19 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.031 | time: 0:13:13.6 | step: 18900 +epoch: 19 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:13:22.5 | step: 18910 +epoch: 19 | 26/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.007 | time: 0:13:31.4 | step: 18920 +epoch: 19 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 0:13:40.3 | step: 18930 +epoch: 19 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.056 | time: 0:13:48.7 | step: 18940 +epoch: 20 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.015 | time: 0:13:57.7 | step: 18950 +epoch: 20 | 19/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.048 | time: 0:14:06.6 | step: 18960 +epoch: 20 | 29/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 0:14:15.5 | step: 18970 +epoch: 20 | 39/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.034 | time: 0:14:24.4 | step: 18980 +epoch: 21 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.020 | time: 0:14:32.8 | step: 18990 +epoch: 21 | 12/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 0:14:41.7 | step: 19000 +epoch: 21 | 22/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 0:14:50.6 | step: 19010 +epoch: 21 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:14:59.4 | step: 19020 +epoch: 21 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:15:08.3 | step: 19030 +epoch: 22 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.015 | time: 0:15:16.7 | step: 19040 +epoch: 22 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.029 | time: 0:15:25.6 | step: 19050 +epoch: 22 | 25/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:15:34.5 | step: 19060 +epoch: 22 | 35/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.038 | time: 0:15:43.4 | step: 19070 +epoch: 22 | 45/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:15:52.2 | step: 19080 +epoch: 23 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.013 | time: 0:16:00.7 | step: 19090 +epoch: 23 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.035 | time: 0:16:09.6 | step: 19100 +epoch: 23 | 28/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 0:16:18.4 | step: 19110 +epoch: 23 | 38/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 0:16:27.3 | step: 19120 +epoch: 24 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.014 | time: 0:16:35.8 | step: 19130 +epoch: 24 | 11/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.043 | time: 0:16:44.6 | step: 19140 +epoch: 24 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:16:53.5 | step: 19150 +epoch: 24 | 31/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.035 | time: 0:17:02.4 | step: 19160 +epoch: 24 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.037 | time: 0:17:11.3 | step: 19170 +epoch: 25 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.016 | time: 0:17:19.7 | step: 19180 +epoch: 25 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 0:17:28.6 | step: 19190 +epoch: 25 | 24/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 0:17:37.5 | step: 19200 +epoch: 25 | 34/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.034 | time: 0:17:46.4 | step: 19210 +epoch: 25 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.017 | time: 0:17:55.2 | step: 19220 +epoch: 26 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.039 | time: 0:18:03.7 | step: 19230 +epoch: 26 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:18:12.6 | step: 19240 +epoch: 26 | 27/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:18:21.4 | step: 19250 +epoch: 26 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.020 | time: 0:18:30.3 | step: 19260 +epoch: 27 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.004 | time: 0:18:38.8 | step: 19270 +epoch: 27 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:18:47.6 | step: 19280 +epoch: 27 | 20/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.047 | time: 0:18:56.5 | step: 19290 +epoch: 27 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 0:19:05.4 | step: 19300 +epoch: 27 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 0:19:14.3 | step: 19310 +epoch: 28 | 3/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.035 | time: 0:19:22.7 | step: 19320 +epoch: 28 | 13/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 0:19:31.6 | step: 19330 +epoch: 28 | 23/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.004 | time: 0:19:40.5 | step: 19340 +epoch: 28 | 33/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 0:19:49.4 | step: 19350 +epoch: 28 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:19:58.2 | step: 19360 +epoch: 29 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.008 | time: 0:20:06.7 | step: 19370 +epoch: 29 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.031 | time: 0:20:15.6 | step: 19380 +epoch: 29 | 26/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 0:20:24.5 | step: 19390 +epoch: 29 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 0:20:33.3 | step: 19400 +epoch: 29 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:20:41.8 | step: 19410 +epoch: 30 | 9/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.026 | time: 0:20:50.8 | step: 19420 +epoch: 30 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.017 | time: 0:20:59.7 | step: 19430 +epoch: 30 | 29/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.006 | time: 0:21:08.6 | step: 19440 +epoch: 30 | 39/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 0:21:17.5 | step: 19450 +epoch: 31 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.029 | time: 0:21:25.9 | step: 19460 +epoch: 31 | 12/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.024 | time: 0:21:34.8 | step: 19470 +epoch: 31 | 22/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:21:43.7 | step: 19480 +epoch: 31 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:21:52.6 | step: 19490 +epoch: 31 | 42/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.013 | time: 0:22:01.5 | step: 19500 +epoch: 32 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.014 | time: 0:22:09.9 | step: 19510 +epoch: 32 | 15/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.019 | time: 0:22:18.8 | step: 19520 +epoch: 32 | 25/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.030 | time: 0:22:27.7 | step: 19530 +epoch: 32 | 35/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.023 | time: 0:22:36.6 | step: 19540 +epoch: 32 | 45/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.033 | time: 0:22:45.5 | step: 19550 +epoch: 33 | 8/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.017 | time: 0:22:53.9 | step: 19560 +epoch: 33 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 0:23:02.8 | step: 19570 +epoch: 33 | 28/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.031 | time: 0:23:11.7 | step: 19580 +epoch: 33 | 38/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.006 | time: 0:23:20.6 | step: 19590 +epoch: 34 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.018 | time: 0:23:29.0 | step: 19600 +epoch: 34 | 11/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.006 | time: 0:23:37.9 | step: 19610 +epoch: 34 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:23:46.8 | step: 19620 +epoch: 34 | 31/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.023 | time: 0:23:55.7 | step: 19630 +epoch: 34 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:24:04.6 | step: 19640 +epoch: 35 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.012 | time: 0:24:13.1 | step: 19650 +epoch: 35 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.008 | time: 0:24:21.9 | step: 19660 +epoch: 35 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 0:24:30.8 | step: 19670 +epoch: 35 | 34/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.031 | time: 0:24:39.7 | step: 19680 +epoch: 35 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 0:24:48.6 | step: 19690 +epoch: 36 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.016 | time: 0:24:57.1 | step: 19700 +epoch: 36 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 0:25:06.0 | step: 19710 +epoch: 36 | 27/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.013 | time: 0:25:14.9 | step: 19720 +epoch: 36 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:25:23.8 | step: 19730 +epoch: 37 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.009 | time: 0:25:32.2 | step: 19740 +epoch: 37 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.008 | time: 0:25:41.1 | step: 19750 +epoch: 37 | 20/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.014 | time: 0:25:50.0 | step: 19760 +epoch: 37 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 0:25:58.9 | step: 19770 +epoch: 37 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.029 | time: 0:26:07.8 | step: 19780 +epoch: 38 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.035 | time: 0:26:16.2 | step: 19790 +epoch: 38 | 13/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.006 | time: 0:26:25.1 | step: 19800 +epoch: 38 | 23/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 0:26:34.0 | step: 19810 +epoch: 38 | 33/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.012 | time: 0:26:42.9 | step: 19820 +epoch: 38 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:26:51.8 | step: 19830 +epoch: 39 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.009 | time: 0:27:00.2 | step: 19840 +epoch: 39 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 0:27:09.1 | step: 19850 +epoch: 39 | 26/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.014 | time: 0:27:18.0 | step: 19860 +epoch: 39 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 0:27:26.9 | step: 19870 +epoch: 39 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:27:35.4 | step: 19880 +epoch: 40 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.015 | time: 0:27:44.4 | step: 19890 +epoch: 40 | 19/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.026 | time: 0:27:53.3 | step: 19900 +epoch: 40 | 29/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 0:28:02.1 | step: 19910 +epoch: 40 | 39/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 0:28:11.0 | step: 19920 +epoch: 41 | 2/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.036 | time: 0:28:19.4 | step: 19930 +epoch: 41 | 12/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 0:28:28.3 | step: 19940 +epoch: 41 | 22/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 0:28:37.2 | step: 19950 +epoch: 41 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 0:28:46.1 | step: 19960 +epoch: 41 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 0:28:54.9 | step: 19970 +epoch: 42 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.026 | time: 0:29:03.4 | step: 19980 +epoch: 42 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.036 | time: 0:29:12.3 | step: 19990 +epoch: 42 | 25/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 0:29:21.2 | step: 20000 +epoch: 42 | 35/ 47 | logs/44k/diffusion | batch/s: 0.16 | lr: 0.0002 | loss: 0.008 | time: 0:30:24.1 | step: 20010 +epoch: 42 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.013 | time: 0:30:33.1 | step: 20020 +epoch: 43 | 8/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 0:30:42.0 | step: 20030 +epoch: 43 | 18/ 47 | logs/44k/diffusion | batch/s: 1.07 | lr: 0.0002 | loss: 0.011 | time: 0:30:51.3 | step: 20040 +epoch: 43 | 28/ 47 | logs/44k/diffusion | batch/s: 1.10 | lr: 0.0002 | loss: 0.009 | time: 0:31:00.4 | step: 20050 +epoch: 43 | 38/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:31:09.2 | step: 20060 +epoch: 44 | 1/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.031 | time: 0:31:17.6 | step: 20070 +epoch: 44 | 11/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.013 | time: 0:31:26.3 | step: 20080 +epoch: 44 | 21/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.020 | time: 0:31:35.0 | step: 20090 +epoch: 44 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:31:43.7 | step: 20100 +epoch: 44 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 0:31:52.6 | step: 20110 +epoch: 45 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.028 | time: 0:32:01.1 | step: 20120 +epoch: 45 | 14/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.037 | time: 0:32:10.1 | step: 20130 +epoch: 45 | 24/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 0:32:19.0 | step: 20140 +epoch: 45 | 34/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.026 | time: 0:32:27.9 | step: 20150 +epoch: 45 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 0:32:36.8 | step: 20160 +epoch: 46 | 7/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.033 | time: 0:32:45.3 | step: 20170 +epoch: 46 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:32:54.1 | step: 20180 +epoch: 46 | 27/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.044 | time: 0:33:02.9 | step: 20190 +epoch: 46 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 0:33:11.8 | step: 20200 +epoch: 47 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.039 | time: 0:33:20.2 | step: 20210 +epoch: 47 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.030 | time: 0:33:29.1 | step: 20220 +epoch: 47 | 20/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.028 | time: 0:33:38.0 | step: 20230 +epoch: 47 | 30/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.029 | time: 0:33:46.9 | step: 20240 +epoch: 47 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.006 | time: 0:33:55.8 | step: 20250 +epoch: 48 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.028 | time: 0:34:04.3 | step: 20260 +epoch: 48 | 13/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.028 | time: 0:34:13.2 | step: 20270 +epoch: 48 | 23/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.036 | time: 0:34:22.1 | step: 20280 +epoch: 48 | 33/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 0:34:31.0 | step: 20290 +epoch: 48 | 43/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.014 | time: 0:34:39.9 | step: 20300 +epoch: 49 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.015 | time: 0:34:48.4 | step: 20310 +epoch: 49 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:34:57.3 | step: 20320 +epoch: 49 | 26/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 0:35:06.2 | step: 20330 +epoch: 49 | 36/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.008 | time: 0:35:15.1 | step: 20340 +epoch: 49 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:35:23.5 | step: 20350 +epoch: 50 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.013 | time: 0:35:32.5 | step: 20360 +epoch: 50 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.024 | time: 0:35:41.4 | step: 20370 +epoch: 50 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.036 | time: 0:35:50.3 | step: 20380 +epoch: 50 | 39/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.004 | time: 0:35:59.2 | step: 20390 +epoch: 51 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.026 | time: 0:36:07.7 | step: 20400 +epoch: 51 | 12/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 0:36:16.6 | step: 20410 +epoch: 51 | 22/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.022 | time: 0:36:25.4 | step: 20420 +epoch: 51 | 32/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.023 | time: 0:36:34.3 | step: 20430 +epoch: 51 | 42/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.028 | time: 0:36:43.2 | step: 20440 +epoch: 52 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.003 | time: 0:36:51.7 | step: 20450 +epoch: 52 | 15/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.034 | time: 0:37:00.6 | step: 20460 +epoch: 52 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 0:37:09.5 | step: 20470 +epoch: 52 | 35/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.031 | time: 0:37:18.4 | step: 20480 +epoch: 52 | 45/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 0:37:27.3 | step: 20490 +epoch: 53 | 8/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.011 | time: 0:37:35.7 | step: 20500 +epoch: 53 | 18/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.027 | time: 0:37:44.7 | step: 20510 +epoch: 53 | 28/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 0:37:53.5 | step: 20520 +epoch: 53 | 38/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:38:02.4 | step: 20530 +epoch: 54 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.017 | time: 0:38:10.9 | step: 20540 +epoch: 54 | 11/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.027 | time: 0:38:19.8 | step: 20550 +epoch: 54 | 21/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.033 | time: 0:38:28.7 | step: 20560 +epoch: 54 | 31/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.025 | time: 0:38:37.6 | step: 20570 +epoch: 54 | 41/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.032 | time: 0:38:46.5 | step: 20580 +epoch: 55 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.011 | time: 0:38:55.0 | step: 20590 +epoch: 55 | 14/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 0:39:03.9 | step: 20600 +epoch: 55 | 24/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 0:39:12.8 | step: 20610 +epoch: 55 | 34/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.026 | time: 0:39:21.7 | step: 20620 +epoch: 55 | 44/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.036 | time: 0:39:30.6 | step: 20630 +epoch: 56 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.026 | time: 0:39:39.1 | step: 20640 +epoch: 56 | 17/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 0:39:48.0 | step: 20650 +epoch: 56 | 27/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.022 | time: 0:39:56.9 | step: 20660 +epoch: 56 | 37/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 0:40:05.8 | step: 20670 +epoch: 57 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.025 | time: 0:40:14.3 | step: 20680 +epoch: 57 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 0:40:23.2 | step: 20690 +epoch: 57 | 20/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.037 | time: 0:40:32.0 | step: 20700 +epoch: 57 | 30/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.030 | time: 0:40:41.0 | step: 20710 +epoch: 57 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.027 | time: 0:40:49.9 | step: 20720 +epoch: 58 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.038 | time: 0:40:58.3 | step: 20730 +epoch: 58 | 13/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.047 | time: 0:41:07.2 | step: 20740 +epoch: 58 | 23/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 0:41:16.1 | step: 20750 +epoch: 58 | 33/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.007 | time: 0:41:25.0 | step: 20760 +epoch: 58 | 43/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 0:41:33.9 | step: 20770 +epoch: 59 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.007 | time: 0:41:42.4 | step: 20780 +epoch: 59 | 16/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.023 | time: 0:41:51.3 | step: 20790 +epoch: 59 | 26/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.006 | time: 0:42:00.2 | step: 20800 +epoch: 59 | 36/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 0:42:09.1 | step: 20810 +epoch: 59 | 46/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.082 | time: 0:42:17.6 | step: 20820 +epoch: 60 | 9/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.016 | time: 0:42:26.6 | step: 20830 +epoch: 60 | 19/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.023 | time: 0:42:35.5 | step: 20840 +epoch: 60 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 0:42:44.4 | step: 20850 +epoch: 60 | 39/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 0:42:53.3 | step: 20860 +epoch: 61 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.004 | time: 0:43:01.8 | step: 20870 +epoch: 61 | 12/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 0:43:10.7 | step: 20880 +epoch: 61 | 22/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.039 | time: 0:43:19.5 | step: 20890 +epoch: 61 | 32/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.021 | time: 0:43:28.4 | step: 20900 +epoch: 61 | 42/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 0:43:37.3 | step: 20910 +epoch: 62 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.026 | time: 0:43:45.8 | step: 20920 +epoch: 62 | 15/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 0:43:54.7 | step: 20930 +epoch: 62 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.012 | time: 0:44:03.7 | step: 20940 +epoch: 62 | 35/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 0:44:12.6 | step: 20950 +epoch: 62 | 45/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 0:44:21.5 | step: 20960 +epoch: 63 | 8/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.024 | time: 0:44:29.9 | step: 20970 +epoch: 63 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 0:44:38.8 | step: 20980 +epoch: 63 | 28/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:44:47.6 | step: 20990 +epoch: 63 | 38/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:44:56.4 | step: 21000 +epoch: 64 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.032 | time: 0:45:04.8 | step: 21010 +epoch: 64 | 11/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 0:45:13.7 | step: 21020 +epoch: 64 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 0:45:22.6 | step: 21030 +epoch: 64 | 31/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.005 | time: 0:45:31.4 | step: 21040 +epoch: 64 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 0:45:40.2 | step: 21050 +epoch: 65 | 4/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.027 | time: 0:45:48.7 | step: 21060 +epoch: 65 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 0:45:57.5 | step: 21070 +epoch: 65 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:46:06.4 | step: 21080 +epoch: 65 | 34/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 0:46:15.3 | step: 21090 +epoch: 65 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.017 | time: 0:46:24.2 | step: 21100 +epoch: 66 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.007 | time: 0:46:32.6 | step: 21110 +epoch: 66 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.027 | time: 0:46:41.5 | step: 21120 +epoch: 66 | 27/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.019 | time: 0:46:50.4 | step: 21130 +epoch: 66 | 37/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 0:46:59.3 | step: 21140 +epoch: 67 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.015 | time: 0:47:07.8 | step: 21150 +epoch: 67 | 10/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.023 | time: 0:47:16.7 | step: 21160 +epoch: 67 | 20/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.013 | time: 0:47:25.6 | step: 21170 +epoch: 67 | 30/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 0:47:34.5 | step: 21180 +epoch: 67 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 0:47:43.4 | step: 21190 +epoch: 68 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.029 | time: 0:47:51.9 | step: 21200 +epoch: 68 | 13/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.007 | time: 0:48:00.8 | step: 21210 +epoch: 68 | 23/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.012 | time: 0:48:09.8 | step: 21220 +epoch: 68 | 33/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.033 | time: 0:48:18.7 | step: 21230 +epoch: 68 | 43/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.034 | time: 0:48:27.6 | step: 21240 +epoch: 69 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.018 | time: 0:48:36.1 | step: 21250 +epoch: 69 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 0:48:45.0 | step: 21260 +epoch: 69 | 26/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.046 | time: 0:48:53.9 | step: 21270 +epoch: 69 | 36/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 0:49:02.8 | step: 21280 +epoch: 69 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.031 | time: 0:49:11.2 | step: 21290 +epoch: 70 | 9/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.014 | time: 0:49:20.2 | step: 21300 +epoch: 70 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 0:49:29.1 | step: 21310 +epoch: 70 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.025 | time: 0:49:38.0 | step: 21320 +epoch: 70 | 39/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.020 | time: 0:49:46.9 | step: 21330 +epoch: 71 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.028 | time: 0:49:55.3 | step: 21340 +epoch: 71 | 12/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 0:50:04.2 | step: 21350 +epoch: 71 | 22/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.023 | time: 0:50:13.1 | step: 21360 +epoch: 71 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.034 | time: 0:50:22.0 | step: 21370 +epoch: 71 | 42/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 0:50:30.9 | step: 21380 +epoch: 72 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.012 | time: 0:50:39.4 | step: 21390 +epoch: 72 | 15/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.007 | time: 0:50:48.3 | step: 21400 +epoch: 72 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 0:50:57.2 | step: 21410 +epoch: 72 | 35/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.039 | time: 0:51:06.1 | step: 21420 +epoch: 72 | 45/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 0:51:15.0 | step: 21430 +epoch: 73 | 8/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.018 | time: 0:51:23.4 | step: 21440 +epoch: 73 | 18/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.040 | time: 0:51:32.3 | step: 21450 +epoch: 73 | 28/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.008 | time: 0:51:41.2 | step: 21460 +epoch: 73 | 38/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.021 | time: 0:51:50.2 | step: 21470 +epoch: 74 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.008 | time: 0:51:58.6 | step: 21480 +epoch: 74 | 11/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.032 | time: 0:52:07.6 | step: 21490 +epoch: 74 | 21/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.004 | time: 0:52:16.5 | step: 21500 +epoch: 74 | 31/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.035 | time: 0:52:25.4 | step: 21510 +epoch: 74 | 41/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.027 | time: 0:52:34.3 | step: 21520 +epoch: 75 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.017 | time: 0:52:42.8 | step: 21530 +epoch: 75 | 14/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 0:52:51.7 | step: 21540 +epoch: 75 | 24/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.035 | time: 0:53:00.6 | step: 21550 +epoch: 75 | 34/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.005 | time: 0:53:09.4 | step: 21560 +epoch: 75 | 44/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.033 | time: 0:53:18.3 | step: 21570 +epoch: 76 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.009 | time: 0:53:26.8 | step: 21580 +epoch: 76 | 17/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.014 | time: 0:53:35.7 | step: 21590 +epoch: 76 | 27/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:53:44.5 | step: 21600 +epoch: 76 | 37/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 0:53:53.4 | step: 21610 +epoch: 77 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.013 | time: 0:54:01.9 | step: 21620 +epoch: 77 | 10/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 0:54:10.8 | step: 21630 +epoch: 77 | 20/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 0:54:19.7 | step: 21640 +epoch: 77 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:54:28.5 | step: 21650 +epoch: 77 | 40/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:54:37.4 | step: 21660 +epoch: 78 | 3/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.042 | time: 0:54:45.8 | step: 21670 +epoch: 78 | 13/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 0:54:54.7 | step: 21680 +epoch: 78 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 0:55:03.6 | step: 21690 +epoch: 78 | 33/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.030 | time: 0:55:12.4 | step: 21700 +epoch: 78 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:55:21.3 | step: 21710 +epoch: 79 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.023 | time: 0:55:29.7 | step: 21720 +epoch: 79 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.024 | time: 0:55:38.6 | step: 21730 +epoch: 79 | 26/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.006 | time: 0:55:47.5 | step: 21740 +epoch: 79 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 0:55:56.3 | step: 21750 +epoch: 79 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:56:04.8 | step: 21760 +epoch: 80 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.018 | time: 0:56:13.7 | step: 21770 +epoch: 80 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.008 | time: 0:56:22.5 | step: 21780 +epoch: 80 | 29/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 0:56:31.4 | step: 21790 +epoch: 80 | 39/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 0:56:40.3 | step: 21800 +epoch: 81 | 2/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.008 | time: 0:56:48.7 | step: 21810 +epoch: 81 | 12/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 0:56:57.5 | step: 21820 +epoch: 81 | 22/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:57:06.4 | step: 21830 +epoch: 81 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.005 | time: 0:57:15.3 | step: 21840 +epoch: 81 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:57:24.1 | step: 21850 +epoch: 82 | 5/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.014 | time: 0:57:32.5 | step: 21860 +epoch: 82 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 0:57:41.4 | step: 21870 +epoch: 82 | 25/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 0:57:50.2 | step: 21880 +epoch: 82 | 35/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 0:57:59.1 | step: 21890 +epoch: 82 | 45/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.025 | time: 0:58:07.9 | step: 21900 +epoch: 83 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.013 | time: 0:58:16.4 | step: 21910 +epoch: 83 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 0:58:25.2 | step: 21920 +epoch: 83 | 28/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.037 | time: 0:58:34.1 | step: 21930 +epoch: 83 | 38/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 0:58:42.9 | step: 21940 +epoch: 84 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.013 | time: 0:58:51.4 | step: 21950 +epoch: 84 | 11/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 0:59:00.3 | step: 21960 +epoch: 84 | 21/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.007 | time: 0:59:09.2 | step: 21970 +epoch: 84 | 31/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.047 | time: 0:59:18.1 | step: 21980 +epoch: 84 | 41/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.012 | time: 0:59:26.9 | step: 21990 +epoch: 85 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.009 | time: 0:59:35.4 | step: 22000 +epoch: 85 | 14/ 47 | logs/44k/diffusion | batch/s: 0.53 | lr: 0.0002 | loss: 0.010 | time: 0:59:54.4 | step: 22010 +epoch: 85 | 24/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.014 | time: 1:00:03.3 | step: 22020 +epoch: 85 | 34/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.032 | time: 1:00:12.5 | step: 22030 +epoch: 85 | 44/ 47 | logs/44k/diffusion | batch/s: 1.08 | lr: 0.0002 | loss: 0.030 | time: 1:00:21.8 | step: 22040 +epoch: 86 | 7/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.004 | time: 1:00:30.3 | step: 22050 +epoch: 86 | 17/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 1:00:39.3 | step: 22060 +epoch: 86 | 27/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 1:00:48.1 | step: 22070 +epoch: 86 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 1:00:56.8 | step: 22080 +epoch: 87 | 0/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.014 | time: 1:01:05.2 | step: 22090 +epoch: 87 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 1:01:14.0 | step: 22100 +epoch: 87 | 20/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 1:01:22.8 | step: 22110 +epoch: 87 | 30/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 1:01:31.7 | step: 22120 +epoch: 87 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.008 | time: 1:01:40.7 | step: 22130 +epoch: 88 | 3/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.009 | time: 1:01:49.2 | step: 22140 +epoch: 88 | 13/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 1:01:58.1 | step: 22150 +epoch: 88 | 23/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 1:02:07.0 | step: 22160 +epoch: 88 | 33/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.037 | time: 1:02:15.9 | step: 22170 +epoch: 88 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 1:02:24.7 | step: 22180 +epoch: 89 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.011 | time: 1:02:33.1 | step: 22190 +epoch: 89 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.054 | time: 1:02:41.9 | step: 22200 +epoch: 89 | 26/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.039 | time: 1:02:50.8 | step: 22210 +epoch: 89 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.042 | time: 1:02:59.6 | step: 22220 +epoch: 89 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.025 | time: 1:03:08.1 | step: 22230 +epoch: 90 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.021 | time: 1:03:17.0 | step: 22240 +epoch: 90 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 1:03:25.9 | step: 22250 +epoch: 90 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.040 | time: 1:03:34.8 | step: 22260 +epoch: 90 | 39/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 1:03:43.7 | step: 22270 +epoch: 91 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.013 | time: 1:03:52.1 | step: 22280 +epoch: 91 | 12/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.019 | time: 1:04:01.0 | step: 22290 +epoch: 91 | 22/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 1:04:09.9 | step: 22300 +epoch: 91 | 32/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.007 | time: 1:04:18.8 | step: 22310 +epoch: 91 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 1:04:27.7 | step: 22320 +epoch: 92 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.022 | time: 1:04:36.2 | step: 22330 +epoch: 92 | 15/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 1:04:45.1 | step: 22340 +epoch: 92 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.014 | time: 1:04:54.0 | step: 22350 +epoch: 92 | 35/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.050 | time: 1:05:02.9 | step: 22360 +epoch: 92 | 45/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 1:05:11.8 | step: 22370 +epoch: 93 | 8/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.029 | time: 1:05:20.3 | step: 22380 +epoch: 93 | 18/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.106 | time: 1:05:29.2 | step: 22390 +epoch: 93 | 28/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.120 | time: 1:05:38.1 | step: 22400 +epoch: 93 | 38/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.087 | time: 1:05:47.0 | step: 22410 +epoch: 94 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.139 | time: 1:05:55.5 | step: 22420 +epoch: 94 | 11/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.107 | time: 1:06:04.4 | step: 22430 +epoch: 94 | 21/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.084 | time: 1:06:13.3 | step: 22440 +epoch: 94 | 31/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.041 | time: 1:06:22.2 | step: 22450 +epoch: 94 | 41/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.088 | time: 1:06:31.1 | step: 22460 +epoch: 95 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.047 | time: 1:06:39.6 | step: 22470 +epoch: 95 | 14/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.053 | time: 1:06:48.5 | step: 22480 +epoch: 95 | 24/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.042 | time: 1:06:57.4 | step: 22490 +epoch: 95 | 34/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.095 | time: 1:07:06.3 | step: 22500 +epoch: 95 | 44/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 1:07:15.2 | step: 22510 +epoch: 96 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.044 | time: 1:07:23.7 | step: 22520 +epoch: 96 | 17/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.027 | time: 1:07:32.6 | step: 22530 +epoch: 96 | 27/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.035 | time: 1:07:41.5 | step: 22540 +epoch: 96 | 37/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.037 | time: 1:07:50.4 | step: 22550 +epoch: 97 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.010 | time: 1:07:58.8 | step: 22560 +epoch: 97 | 10/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 1:08:07.7 | step: 22570 +epoch: 97 | 20/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.034 | time: 1:08:16.6 | step: 22580 +epoch: 97 | 30/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 1:08:25.5 | step: 22590 +epoch: 97 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.008 | time: 1:08:34.4 | step: 22600 +epoch: 98 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.018 | time: 1:08:42.9 | step: 22610 +epoch: 98 | 13/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.031 | time: 1:08:51.8 | step: 22620 +epoch: 98 | 23/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 1:09:00.7 | step: 22630 +epoch: 98 | 33/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 1:09:09.6 | step: 22640 +epoch: 98 | 43/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.006 | time: 1:09:18.5 | step: 22650 +epoch: 99 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.011 | time: 1:09:26.9 | step: 22660 +epoch: 99 | 16/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.013 | time: 1:09:35.8 | step: 22670 +epoch: 99 | 26/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 1:09:44.7 | step: 22680 +epoch: 99 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.030 | time: 1:09:53.6 | step: 22690 +epoch: 99 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 1:10:02.1 | step: 22700 +epoch: 100 | 9/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.029 | time: 1:10:11.1 | step: 22710 +epoch: 100 | 19/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.008 | time: 1:10:20.0 | step: 22720 +epoch: 100 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 1:10:28.9 | step: 22730 +epoch: 100 | 39/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 1:10:37.8 | step: 22740 +epoch: 101 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.013 | time: 1:10:46.3 | step: 22750 +epoch: 101 | 12/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.008 | time: 1:10:55.2 | step: 22760 +epoch: 101 | 22/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.024 | time: 1:11:04.1 | step: 22770 +epoch: 101 | 32/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 1:11:12.9 | step: 22780 +epoch: 101 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 1:11:21.8 | step: 22790 +epoch: 102 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.014 | time: 1:11:30.3 | step: 22800 +epoch: 102 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.025 | time: 1:11:39.2 | step: 22810 +epoch: 102 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.008 | time: 1:11:48.1 | step: 22820 +epoch: 102 | 35/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 1:11:57.0 | step: 22830 +epoch: 102 | 45/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 1:12:05.8 | step: 22840 +epoch: 103 | 8/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.013 | time: 1:12:14.3 | step: 22850 +epoch: 103 | 18/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 1:12:23.2 | step: 22860 +epoch: 103 | 28/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 1:12:32.1 | step: 22870 +epoch: 103 | 38/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 1:12:41.0 | step: 22880 +epoch: 104 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.005 | time: 1:12:49.4 | step: 22890 +epoch: 104 | 11/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.008 | time: 1:12:58.3 | step: 22900 +epoch: 104 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 1:13:07.2 | step: 22910 +epoch: 104 | 31/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.012 | time: 1:13:16.1 | step: 22920 +epoch: 104 | 41/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.019 | time: 1:13:25.0 | step: 22930 +epoch: 105 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.026 | time: 1:13:33.5 | step: 22940 +epoch: 105 | 14/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.013 | time: 1:13:42.4 | step: 22950 +epoch: 105 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 1:13:51.2 | step: 22960 +epoch: 105 | 34/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.014 | time: 1:14:00.1 | step: 22970 +epoch: 105 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 1:14:09.0 | step: 22980 +epoch: 106 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.032 | time: 1:14:17.5 | step: 22990 +epoch: 106 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 1:14:26.4 | step: 23000 +epoch: 106 | 27/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 1:14:35.3 | step: 23010 +epoch: 106 | 37/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 1:14:44.2 | step: 23020 +epoch: 107 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.020 | time: 1:14:52.7 | step: 23030 +epoch: 107 | 10/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.028 | time: 1:15:01.6 | step: 23040 +epoch: 107 | 20/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.012 | time: 1:15:10.5 | step: 23050 +epoch: 107 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.031 | time: 1:15:19.4 | step: 23060 +epoch: 107 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.005 | time: 1:15:28.2 | step: 23070 +epoch: 108 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.025 | time: 1:15:36.7 | step: 23080 +epoch: 108 | 13/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 1:15:45.6 | step: 23090 +epoch: 108 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.034 | time: 1:15:54.5 | step: 23100 +epoch: 108 | 33/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 1:16:03.4 | step: 23110 +epoch: 108 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 1:16:12.3 | step: 23120 +epoch: 109 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.013 | time: 1:16:20.7 | step: 23130 +epoch: 109 | 16/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.005 | time: 1:16:29.6 | step: 23140 +epoch: 109 | 26/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 1:16:38.5 | step: 23150 +epoch: 109 | 36/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.022 | time: 1:16:47.4 | step: 23160 +epoch: 109 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 1:16:55.9 | step: 23170 +epoch: 110 | 9/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.005 | time: 1:17:04.8 | step: 23180 +epoch: 110 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 1:17:13.7 | step: 23190 +epoch: 110 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.042 | time: 1:17:22.6 | step: 23200 +epoch: 110 | 39/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 1:17:31.5 | step: 23210 +epoch: 111 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.010 | time: 1:17:40.0 | step: 23220 +epoch: 111 | 12/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 1:17:48.9 | step: 23230 +epoch: 111 | 22/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.037 | time: 1:17:57.8 | step: 23240 +epoch: 111 | 32/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 1:18:06.7 | step: 23250 +epoch: 111 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 1:18:15.5 | step: 23260 +epoch: 112 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.020 | time: 1:18:24.0 | step: 23270 +epoch: 112 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 1:18:32.9 | step: 23280 +epoch: 112 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.027 | time: 1:18:41.8 | step: 23290 +epoch: 112 | 35/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 1:18:50.6 | step: 23300 +epoch: 112 | 45/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.013 | time: 1:18:59.5 | step: 23310 +epoch: 113 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.011 | time: 1:19:08.0 | step: 23320 +epoch: 113 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 1:19:16.9 | step: 23330 +epoch: 113 | 28/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 1:19:25.7 | step: 23340 +epoch: 113 | 38/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 1:19:34.6 | step: 23350 +epoch: 114 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.028 | time: 1:19:43.1 | step: 23360 +epoch: 114 | 11/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 1:19:52.0 | step: 23370 +epoch: 114 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.004 | time: 1:20:00.8 | step: 23380 +epoch: 114 | 31/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 1:20:09.7 | step: 23390 +epoch: 114 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 1:20:18.6 | step: 23400 +epoch: 115 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.010 | time: 1:20:27.0 | step: 23410 +epoch: 115 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.017 | time: 1:20:35.9 | step: 23420 +epoch: 115 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 1:20:44.8 | step: 23430 +epoch: 115 | 34/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.030 | time: 1:20:53.7 | step: 23440 +epoch: 115 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.020 | time: 1:21:02.5 | step: 23450 +epoch: 116 | 7/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.018 | time: 1:21:11.0 | step: 23460 +epoch: 116 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 1:21:19.8 | step: 23470 +epoch: 116 | 27/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.006 | time: 1:21:28.7 | step: 23480 +epoch: 116 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.029 | time: 1:21:37.6 | step: 23490 +epoch: 117 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.039 | time: 1:21:46.0 | step: 23500 +epoch: 117 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.035 | time: 1:21:54.9 | step: 23510 +epoch: 117 | 20/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.035 | time: 1:22:03.7 | step: 23520 +epoch: 117 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.048 | time: 1:22:12.6 | step: 23530 +epoch: 117 | 40/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 1:22:21.5 | step: 23540 +epoch: 118 | 3/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.018 | time: 1:22:29.9 | step: 23550 +epoch: 118 | 13/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 1:22:38.7 | step: 23560 +epoch: 118 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.042 | time: 1:22:47.6 | step: 23570 +epoch: 118 | 33/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 1:22:56.5 | step: 23580 +epoch: 118 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 1:23:05.3 | step: 23590 +epoch: 119 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.016 | time: 1:23:13.7 | step: 23600 +epoch: 119 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.020 | time: 1:23:22.6 | step: 23610 +epoch: 119 | 26/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 1:23:31.5 | step: 23620 +epoch: 119 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 1:23:40.3 | step: 23630 +epoch: 119 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 1:23:48.8 | step: 23640 +epoch: 120 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.027 | time: 1:23:57.7 | step: 23650 +epoch: 120 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 1:24:06.6 | step: 23660 +epoch: 120 | 29/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.031 | time: 1:24:15.5 | step: 23670 +epoch: 120 | 39/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 1:24:24.3 | step: 23680 +epoch: 121 | 2/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.024 | time: 1:24:32.8 | step: 23690 +epoch: 121 | 12/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.024 | time: 1:24:41.6 | step: 23700 +epoch: 121 | 22/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 1:24:50.5 | step: 23710 +epoch: 121 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.007 | time: 1:24:59.4 | step: 23720 +epoch: 121 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 1:25:08.3 | step: 23730 +epoch: 122 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.029 | time: 1:25:16.7 | step: 23740 +epoch: 122 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.034 | time: 1:25:25.6 | step: 23750 +epoch: 122 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.032 | time: 1:25:34.5 | step: 23760 +epoch: 122 | 35/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 1:25:43.4 | step: 23770 +epoch: 122 | 45/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.013 | time: 1:25:52.3 | step: 23780 +epoch: 123 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.017 | time: 1:26:00.7 | step: 23790 +epoch: 123 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.004 | time: 1:26:09.6 | step: 23800 +epoch: 123 | 28/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 1:26:18.5 | step: 23810 +epoch: 123 | 38/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.004 | time: 1:26:27.4 | step: 23820 +epoch: 124 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.012 | time: 1:26:35.8 | step: 23830 +epoch: 124 | 11/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.022 | time: 1:26:44.7 | step: 23840 +epoch: 124 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.005 | time: 1:26:53.6 | step: 23850 +epoch: 124 | 31/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.035 | time: 1:27:02.5 | step: 23860 +epoch: 124 | 41/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.029 | time: 1:27:11.4 | step: 23870 +epoch: 125 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.017 | time: 1:27:19.9 | step: 23880 +epoch: 125 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 1:27:28.7 | step: 23890 +epoch: 125 | 24/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 1:27:37.6 | step: 23900 +epoch: 125 | 34/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 1:27:46.5 | step: 23910 +epoch: 125 | 44/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 1:27:55.4 | step: 23920 +epoch: 126 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.015 | time: 1:28:03.9 | step: 23930 +epoch: 126 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 1:28:12.7 | step: 23940 +epoch: 126 | 27/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.017 | time: 1:28:21.5 | step: 23950 +epoch: 126 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.034 | time: 1:28:30.4 | step: 23960 +epoch: 127 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.040 | time: 1:28:38.8 | step: 23970 +epoch: 127 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.036 | time: 1:28:47.7 | step: 23980 +epoch: 127 | 20/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.042 | time: 1:28:56.6 | step: 23990 +epoch: 127 | 30/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.028 | time: 1:29:05.5 | step: 24000 +epoch: 127 | 40/ 47 | logs/44k/diffusion | batch/s: 0.52 | lr: 0.0002 | loss: 0.019 | time: 1:29:24.6 | step: 24010 +epoch: 128 | 3/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.029 | time: 1:29:33.2 | step: 24020 +epoch: 128 | 13/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.008 | time: 1:29:42.4 | step: 24030 +epoch: 128 | 23/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.020 | time: 1:29:51.5 | step: 24040 +epoch: 128 | 33/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.008 | time: 1:30:00.5 | step: 24050 +epoch: 128 | 43/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.025 | time: 1:30:09.4 | step: 24060 +epoch: 129 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.023 | time: 1:30:17.8 | step: 24070 +epoch: 129 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 1:30:26.6 | step: 24080 +epoch: 129 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 1:30:35.3 | step: 24090 +epoch: 129 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 1:30:44.1 | step: 24100 +epoch: 129 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.005 | time: 1:30:52.6 | step: 24110 +epoch: 130 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.010 | time: 1:31:01.5 | step: 24120 +epoch: 130 | 19/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.026 | time: 1:31:10.5 | step: 24130 +epoch: 130 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.021 | time: 1:31:19.4 | step: 24140 +epoch: 130 | 39/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 1:31:28.3 | step: 24150 +epoch: 131 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.015 | time: 1:31:36.8 | step: 24160 +epoch: 131 | 12/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.008 | time: 1:31:45.7 | step: 24170 +epoch: 131 | 22/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.041 | time: 1:31:54.5 | step: 24180 +epoch: 131 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 1:32:03.3 | step: 24190 +epoch: 131 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 1:32:12.2 | step: 24200 +epoch: 132 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.018 | time: 1:32:20.6 | step: 24210 +epoch: 132 | 15/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 1:32:29.5 | step: 24220 +epoch: 132 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 1:32:38.4 | step: 24230 +epoch: 132 | 35/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.022 | time: 1:32:47.4 | step: 24240 +epoch: 132 | 45/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 1:32:56.3 | step: 24250 +epoch: 133 | 8/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.019 | time: 1:33:04.8 | step: 24260 +epoch: 133 | 18/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 1:33:13.7 | step: 24270 +epoch: 133 | 28/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 1:33:22.5 | step: 24280 +epoch: 133 | 38/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.003 | time: 1:33:31.4 | step: 24290 +epoch: 134 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.007 | time: 1:33:39.8 | step: 24300 +epoch: 134 | 11/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 1:33:48.7 | step: 24310 +epoch: 134 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.025 | time: 1:33:57.5 | step: 24320 +epoch: 134 | 31/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 1:34:06.3 | step: 24330 +epoch: 134 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 1:34:15.2 | step: 24340 +epoch: 135 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.009 | time: 1:34:23.6 | step: 24350 +epoch: 135 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 1:34:32.5 | step: 24360 +epoch: 135 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 1:34:41.3 | step: 24370 +epoch: 135 | 34/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 1:34:50.2 | step: 24380 +epoch: 135 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.037 | time: 1:34:59.1 | step: 24390 +epoch: 136 | 7/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.023 | time: 1:35:07.5 | step: 24400 +epoch: 136 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.008 | time: 1:35:16.4 | step: 24410 +epoch: 136 | 27/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.031 | time: 1:35:25.2 | step: 24420 +epoch: 136 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 1:35:34.1 | step: 24430 +epoch: 137 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.008 | time: 1:35:42.5 | step: 24440 +epoch: 137 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 1:35:51.4 | step: 24450 +epoch: 137 | 20/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 1:36:00.2 | step: 24460 +epoch: 137 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 1:36:09.0 | step: 24470 +epoch: 137 | 40/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.031 | time: 1:36:17.9 | step: 24480 +epoch: 138 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.023 | time: 1:36:26.4 | step: 24490 +epoch: 138 | 13/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 1:36:35.3 | step: 24500 +epoch: 138 | 23/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.019 | time: 1:36:44.3 | step: 24510 +epoch: 138 | 33/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.012 | time: 1:36:53.2 | step: 24520 +epoch: 138 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 1:37:02.1 | step: 24530 +epoch: 139 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.025 | time: 1:37:10.5 | step: 24540 +epoch: 139 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 1:37:19.3 | step: 24550 +epoch: 139 | 26/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 1:37:28.1 | step: 24560 +epoch: 139 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.041 | time: 1:37:37.0 | step: 24570 +epoch: 139 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 1:37:45.4 | step: 24580 +epoch: 140 | 9/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.023 | time: 1:37:54.5 | step: 24590 +epoch: 140 | 19/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.019 | time: 1:38:03.3 | step: 24600 +epoch: 140 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.026 | time: 1:38:12.3 | step: 24610 +epoch: 140 | 39/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 1:38:21.2 | step: 24620 +epoch: 141 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.021 | time: 1:38:29.7 | step: 24630 +epoch: 141 | 12/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 1:38:38.6 | step: 24640 +epoch: 141 | 22/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.021 | time: 1:38:47.5 | step: 24650 +epoch: 141 | 32/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 1:38:56.4 | step: 24660 +epoch: 141 | 42/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 1:39:05.3 | step: 24670 +epoch: 142 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.008 | time: 1:39:13.8 | step: 24680 +epoch: 142 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.030 | time: 1:39:22.7 | step: 24690 +epoch: 142 | 25/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 1:39:31.5 | step: 24700 +epoch: 142 | 35/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 1:39:40.3 | step: 24710 +epoch: 142 | 45/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.036 | time: 1:39:49.2 | step: 24720 +epoch: 143 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.016 | time: 1:39:57.6 | step: 24730 +epoch: 143 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.029 | time: 1:40:06.5 | step: 24740 +epoch: 143 | 28/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.048 | time: 1:40:15.4 | step: 24750 +epoch: 143 | 38/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.032 | time: 1:40:24.4 | step: 24760 +epoch: 144 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.023 | time: 1:40:32.9 | step: 24770 +epoch: 144 | 11/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.031 | time: 1:40:41.8 | step: 24780 +epoch: 144 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 1:40:50.6 | step: 24790 +epoch: 144 | 31/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.030 | time: 1:40:59.5 | step: 24800 +epoch: 144 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.020 | time: 1:41:08.4 | step: 24810 +epoch: 145 | 4/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.021 | time: 1:41:16.8 | step: 24820 +epoch: 145 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.030 | time: 1:41:25.6 | step: 24830 +epoch: 145 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 1:41:34.5 | step: 24840 +epoch: 145 | 34/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.022 | time: 1:41:43.3 | step: 24850 +epoch: 145 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.029 | time: 1:41:52.1 | step: 24860 +epoch: 146 | 7/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.023 | time: 1:42:00.6 | step: 24870 +epoch: 146 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 1:42:09.4 | step: 24880 +epoch: 146 | 27/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 1:42:18.3 | step: 24890 +epoch: 146 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 1:42:27.2 | step: 24900 +epoch: 147 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.015 | time: 1:42:35.6 | step: 24910 +epoch: 147 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 1:42:44.5 | step: 24920 +epoch: 147 | 20/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.031 | time: 1:42:53.4 | step: 24930 +epoch: 147 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 1:43:02.2 | step: 24940 +epoch: 147 | 40/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 1:43:11.1 | step: 24950 +epoch: 148 | 3/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.032 | time: 1:43:19.5 | step: 24960 +epoch: 148 | 13/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.031 | time: 1:43:28.3 | step: 24970 +epoch: 148 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 1:43:37.2 | step: 24980 +epoch: 148 | 33/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.015 | time: 1:43:46.0 | step: 24990 +epoch: 148 | 43/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.025 | time: 1:43:54.9 | step: 25000 +epoch: 149 | 6/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.018 | time: 1:44:03.5 | step: 25010 +epoch: 149 | 16/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.025 | time: 1:44:12.4 | step: 25020 +epoch: 149 | 26/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.036 | time: 1:44:21.3 | step: 25030 +epoch: 149 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 1:44:30.2 | step: 25040 +epoch: 149 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.005 | time: 1:44:38.6 | step: 25050 +epoch: 150 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.029 | time: 1:44:47.6 | step: 25060 +epoch: 150 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.004 | time: 1:44:56.4 | step: 25070 +epoch: 150 | 29/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.025 | time: 1:45:05.2 | step: 25080 +epoch: 150 | 39/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.036 | time: 1:45:14.1 | step: 25090 +epoch: 151 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.027 | time: 1:45:22.6 | step: 25100 +epoch: 151 | 12/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.036 | time: 1:45:31.4 | step: 25110 +epoch: 151 | 22/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 1:45:40.3 | step: 25120 +epoch: 151 | 32/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 1:45:49.2 | step: 25130 +epoch: 151 | 42/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 1:45:58.2 | step: 25140 +epoch: 152 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.015 | time: 1:46:06.6 | step: 25150 +epoch: 152 | 15/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.039 | time: 1:46:15.6 | step: 25160 +epoch: 152 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 1:46:24.5 | step: 25170 +epoch: 152 | 35/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 1:46:33.4 | step: 25180 +epoch: 152 | 45/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.023 | time: 1:46:42.3 | step: 25190 +epoch: 153 | 8/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.031 | time: 1:46:50.8 | step: 25200 +epoch: 153 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.031 | time: 1:46:59.7 | step: 25210 +epoch: 153 | 28/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.018 | time: 1:47:08.6 | step: 25220 +epoch: 153 | 38/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 1:47:17.5 | step: 25230 +epoch: 154 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.020 | time: 1:47:25.9 | step: 25240 +epoch: 154 | 11/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 1:47:34.8 | step: 25250 +epoch: 154 | 21/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.015 | time: 1:47:43.7 | step: 25260 +epoch: 154 | 31/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 1:47:52.6 | step: 25270 +epoch: 154 | 41/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.026 | time: 1:48:01.5 | step: 25280 +epoch: 155 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.012 | time: 1:48:10.0 | step: 25290 +epoch: 155 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 1:48:18.8 | step: 25300 +epoch: 155 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.045 | time: 1:48:27.7 | step: 25310 +epoch: 155 | 34/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 1:48:36.6 | step: 25320 +epoch: 155 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 1:48:45.5 | step: 25330 +epoch: 156 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.023 | time: 1:48:53.9 | step: 25340 +epoch: 156 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 1:49:02.8 | step: 25350 +epoch: 156 | 27/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 1:49:11.7 | step: 25360 +epoch: 156 | 37/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.024 | time: 1:49:20.6 | step: 25370 +epoch: 157 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.017 | time: 1:49:29.1 | step: 25380 +epoch: 157 | 10/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 1:49:38.0 | step: 25390 +epoch: 157 | 20/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.008 | time: 1:49:46.9 | step: 25400 +epoch: 157 | 30/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 1:49:55.7 | step: 25410 +epoch: 157 | 40/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 1:50:04.6 | step: 25420 +epoch: 158 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.015 | time: 1:50:13.1 | step: 25430 +epoch: 158 | 13/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.023 | time: 1:50:22.0 | step: 25440 +epoch: 158 | 23/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 1:50:30.9 | step: 25450 +epoch: 158 | 33/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.017 | time: 1:50:39.8 | step: 25460 +epoch: 158 | 43/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.035 | time: 1:50:48.7 | step: 25470 +epoch: 159 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.009 | time: 1:50:57.1 | step: 25480 +epoch: 159 | 16/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.016 | time: 1:51:06.0 | step: 25490 +epoch: 159 | 26/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 1:51:14.9 | step: 25500 +epoch: 159 | 36/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.041 | time: 1:51:23.8 | step: 25510 +epoch: 159 | 46/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.003 | time: 1:51:32.3 | step: 25520 +epoch: 160 | 9/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.029 | time: 1:51:41.3 | step: 25530 +epoch: 160 | 19/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.024 | time: 1:51:50.2 | step: 25540 +epoch: 160 | 29/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 1:51:59.1 | step: 25550 +epoch: 160 | 39/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.008 | time: 1:52:08.1 | step: 25560 +epoch: 161 | 2/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.019 | time: 1:52:16.6 | step: 25570 +epoch: 161 | 12/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.007 | time: 1:52:25.5 | step: 25580 +epoch: 161 | 22/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 1:52:34.4 | step: 25590 +epoch: 161 | 32/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.025 | time: 1:52:43.3 | step: 25600 +epoch: 161 | 42/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.017 | time: 1:52:52.2 | step: 25610 +epoch: 162 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.010 | time: 1:53:00.7 | step: 25620 +epoch: 162 | 15/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.029 | time: 1:53:09.6 | step: 25630 +epoch: 162 | 25/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.021 | time: 1:53:18.6 | step: 25640 +epoch: 162 | 35/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.007 | time: 1:53:27.5 | step: 25650 +epoch: 162 | 45/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.029 | time: 1:53:36.4 | step: 25660 +epoch: 163 | 8/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.006 | time: 1:53:44.9 | step: 25670 +epoch: 163 | 18/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.019 | time: 1:53:53.8 | step: 25680 +epoch: 163 | 28/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.004 | time: 1:54:02.7 | step: 25690 +epoch: 163 | 38/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.023 | time: 1:54:11.6 | step: 25700 +epoch: 164 | 1/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.032 | time: 1:54:20.1 | step: 25710 +epoch: 164 | 11/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 1:54:29.0 | step: 25720 +epoch: 164 | 21/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 1:54:37.9 | step: 25730 +epoch: 164 | 31/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.011 | time: 1:54:46.8 | step: 25740 +epoch: 164 | 41/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 1:54:55.7 | step: 25750 +epoch: 165 | 4/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.019 | time: 1:55:04.1 | step: 25760 +epoch: 165 | 14/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 1:55:13.0 | step: 25770 +epoch: 165 | 24/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.026 | time: 1:55:21.9 | step: 25780 +epoch: 165 | 34/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.019 | time: 1:55:30.8 | step: 25790 +epoch: 165 | 44/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.028 | time: 1:55:39.7 | step: 25800 +epoch: 166 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.015 | time: 1:55:48.2 | step: 25810 +epoch: 166 | 17/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 1:55:57.1 | step: 25820 +epoch: 166 | 27/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.010 | time: 1:56:06.0 | step: 25830 +epoch: 166 | 37/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.009 | time: 1:56:14.9 | step: 25840 +epoch: 167 | 0/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.035 | time: 1:56:23.3 | step: 25850 +epoch: 167 | 10/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 1:56:32.2 | step: 25860 +epoch: 167 | 20/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.022 | time: 1:56:41.1 | step: 25870 +epoch: 167 | 30/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.022 | time: 1:56:50.0 | step: 25880 +epoch: 167 | 40/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.024 | time: 1:56:58.9 | step: 25890 +epoch: 168 | 3/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.012 | time: 1:57:07.4 | step: 25900 +epoch: 168 | 13/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.020 | time: 1:57:16.3 | step: 25910 +epoch: 168 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.032 | time: 1:57:25.2 | step: 25920 +epoch: 168 | 33/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.031 | time: 1:57:34.1 | step: 25930 +epoch: 168 | 43/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 1:57:42.9 | step: 25940 +epoch: 169 | 6/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.010 | time: 1:57:51.4 | step: 25950 +epoch: 169 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 1:58:00.3 | step: 25960 +epoch: 169 | 26/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.037 | time: 1:58:09.2 | step: 25970 +epoch: 169 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.026 | time: 1:58:18.1 | step: 25980 +epoch: 169 | 46/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.004 | time: 1:58:26.5 | step: 25990 +epoch: 170 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.008 | time: 1:58:35.5 | step: 26000 +--- model size --- +model: 55,192,704 +======= start training ======= +epoch|batch_idx/num_batches|output_dir|batch/s|lr|time|step +epoch: 0 | 9/ 47 | logs/44k/diffusion | batch/s: 0.65 | lr: 0.0002 | loss: 0.032 | time: 0:00:16.0 | step: 26010 +epoch: 0 | 19/ 47 | logs/44k/diffusion | batch/s: 1.22 | lr: 0.0002 | loss: 0.058 | time: 0:00:24.2 | step: 26020 +epoch: 0 | 29/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.030 | time: 0:00:32.5 | step: 26030 +epoch: 0 | 39/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.015 | time: 0:00:40.8 | step: 26040 +epoch: 1 | 2/ 47 | logs/44k/diffusion | batch/s: 1.23 | lr: 0.0002 | loss: 0.011 | time: 0:00:48.9 | step: 26050 +epoch: 1 | 12/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.013 | time: 0:00:57.4 | step: 26060 +epoch: 1 | 22/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.011 | time: 0:01:06.0 | step: 26070 +epoch: 1 | 32/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.021 | time: 0:01:14.7 | step: 26080 +epoch: 1 | 42/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.024 | time: 0:01:23.4 | step: 26090 +epoch: 2 | 5/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.015 | time: 0:01:31.8 | step: 26100 +epoch: 2 | 15/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.011 | time: 0:01:40.8 | step: 26110 +epoch: 2 | 25/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 0:01:49.8 | step: 26120 +epoch: 2 | 35/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.047 | time: 0:01:58.6 | step: 26130 +epoch: 2 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.005 | time: 0:02:07.3 | step: 26140 +epoch: 3 | 8/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.020 | time: 0:02:15.6 | step: 26150 +epoch: 3 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:02:24.4 | step: 26160 +epoch: 3 | 28/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.011 | time: 0:02:33.1 | step: 26170 +epoch: 3 | 38/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.021 | time: 0:02:41.8 | step: 26180 +epoch: 4 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.015 | time: 0:02:50.1 | step: 26190 +epoch: 4 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:02:58.9 | step: 26200 +epoch: 4 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.029 | time: 0:03:07.7 | step: 26210 +epoch: 4 | 31/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:03:16.6 | step: 26220 +epoch: 4 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 0:03:25.3 | step: 26230 +epoch: 5 | 4/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.024 | time: 0:03:33.7 | step: 26240 +epoch: 5 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:03:42.5 | step: 26250 +epoch: 5 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:03:51.3 | step: 26260 +epoch: 5 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:04:00.0 | step: 26270 +epoch: 5 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:04:08.8 | step: 26280 +epoch: 6 | 7/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.005 | time: 0:04:17.2 | step: 26290 +epoch: 6 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:04:26.0 | step: 26300 +epoch: 6 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:04:34.7 | step: 26310 +epoch: 6 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 0:04:43.5 | step: 26320 +epoch: 7 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.019 | time: 0:04:51.9 | step: 26330 +epoch: 7 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:05:00.6 | step: 26340 +epoch: 7 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 0:05:09.4 | step: 26350 +epoch: 7 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:05:18.2 | step: 26360 +epoch: 7 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:05:27.0 | step: 26370 +epoch: 8 | 3/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.011 | time: 0:05:35.3 | step: 26380 +epoch: 8 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 0:05:44.1 | step: 26390 +epoch: 8 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:05:52.9 | step: 26400 +epoch: 8 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:06:01.6 | step: 26410 +epoch: 8 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:06:10.4 | step: 26420 +epoch: 9 | 6/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.024 | time: 0:06:18.8 | step: 26430 +epoch: 9 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.040 | time: 0:06:27.5 | step: 26440 +epoch: 9 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:06:36.3 | step: 26450 +epoch: 9 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.049 | time: 0:06:45.1 | step: 26460 +epoch: 9 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.009 | time: 0:06:53.5 | step: 26470 +epoch: 10 | 9/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.016 | time: 0:07:02.3 | step: 26480 +epoch: 10 | 19/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 0:07:11.1 | step: 26490 +epoch: 10 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 0:07:19.9 | step: 26500 +epoch: 10 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 0:07:28.7 | step: 26510 +epoch: 11 | 2/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.010 | time: 0:07:37.0 | step: 26520 +epoch: 11 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.024 | time: 0:07:45.8 | step: 26530 +epoch: 11 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:07:54.6 | step: 26540 +epoch: 11 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:08:03.4 | step: 26550 +epoch: 11 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 0:08:12.1 | step: 26560 +epoch: 12 | 5/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.006 | time: 0:08:20.5 | step: 26570 +epoch: 12 | 15/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:08:29.2 | step: 26580 +epoch: 12 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.004 | time: 0:08:38.0 | step: 26590 +epoch: 12 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:08:46.8 | step: 26600 +epoch: 12 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:08:55.6 | step: 26610 +epoch: 13 | 8/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.045 | time: 0:09:03.9 | step: 26620 +epoch: 13 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.028 | time: 0:09:12.7 | step: 26630 +epoch: 13 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 0:09:21.5 | step: 26640 +epoch: 13 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.028 | time: 0:09:30.3 | step: 26650 +epoch: 14 | 1/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.040 | time: 0:09:38.6 | step: 26660 +epoch: 14 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.003 | time: 0:09:47.4 | step: 26670 +epoch: 14 | 21/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.030 | time: 0:09:56.2 | step: 26680 +epoch: 14 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 0:10:05.0 | step: 26690 +epoch: 14 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:10:13.7 | step: 26700 +epoch: 15 | 4/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.009 | time: 0:10:22.1 | step: 26710 +epoch: 15 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:10:30.9 | step: 26720 +epoch: 15 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.028 | time: 0:10:39.7 | step: 26730 +epoch: 15 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 0:10:48.5 | step: 26740 +epoch: 15 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.044 | time: 0:10:57.3 | step: 26750 +epoch: 16 | 7/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.022 | time: 0:11:05.6 | step: 26760 +epoch: 16 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.025 | time: 0:11:14.4 | step: 26770 +epoch: 16 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 0:11:23.2 | step: 26780 +epoch: 16 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.041 | time: 0:11:32.0 | step: 26790 +epoch: 17 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.007 | time: 0:11:40.4 | step: 26800 +epoch: 17 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:11:49.2 | step: 26810 +epoch: 17 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:11:57.9 | step: 26820 +epoch: 17 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 0:12:06.7 | step: 26830 +epoch: 17 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:12:15.5 | step: 26840 +epoch: 18 | 3/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.041 | time: 0:12:23.9 | step: 26850 +epoch: 18 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:12:32.7 | step: 26860 +epoch: 18 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 0:12:41.5 | step: 26870 +epoch: 18 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.048 | time: 0:12:50.2 | step: 26880 +epoch: 18 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.040 | time: 0:12:59.0 | step: 26890 +epoch: 19 | 6/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.043 | time: 0:13:07.4 | step: 26900 +epoch: 19 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 0:13:16.1 | step: 26910 +epoch: 19 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.028 | time: 0:13:24.9 | step: 26920 +epoch: 19 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:13:33.7 | step: 26930 +epoch: 19 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.009 | time: 0:13:42.1 | step: 26940 +epoch: 20 | 9/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.030 | time: 0:13:51.0 | step: 26950 +epoch: 20 | 19/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 0:13:59.7 | step: 26960 +epoch: 20 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 0:14:08.5 | step: 26970 +epoch: 20 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:14:17.3 | step: 26980 +epoch: 21 | 2/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.010 | time: 0:14:25.7 | step: 26990 +epoch: 21 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:14:34.5 | step: 27000 +epoch: 21 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.042 | time: 0:14:43.3 | step: 27010 +epoch: 21 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:14:52.1 | step: 27020 +epoch: 21 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:15:00.9 | step: 27030 +epoch: 22 | 5/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.030 | time: 0:15:09.2 | step: 27040 +epoch: 22 | 15/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 0:15:18.0 | step: 27050 +epoch: 22 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 0:15:26.8 | step: 27060 +epoch: 22 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.036 | time: 0:15:35.6 | step: 27070 +epoch: 22 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:15:44.4 | step: 27080 +epoch: 23 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.018 | time: 0:15:52.8 | step: 27090 +epoch: 23 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:16:01.6 | step: 27100 +epoch: 23 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 0:16:10.4 | step: 27110 +epoch: 23 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:16:19.2 | step: 27120 +epoch: 24 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.028 | time: 0:16:27.6 | step: 27130 +epoch: 24 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:16:36.3 | step: 27140 +epoch: 24 | 21/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:16:45.1 | step: 27150 +epoch: 24 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.004 | time: 0:16:53.9 | step: 27160 +epoch: 24 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:17:02.7 | step: 27170 +epoch: 25 | 4/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.032 | time: 0:17:11.0 | step: 27180 +epoch: 25 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 0:17:19.8 | step: 27190 +epoch: 25 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:17:28.6 | step: 27200 +epoch: 25 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:17:37.4 | step: 27210 +epoch: 25 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 0:17:46.2 | step: 27220 +epoch: 26 | 7/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.011 | time: 0:17:54.5 | step: 27230 +epoch: 26 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.033 | time: 0:18:03.3 | step: 27240 +epoch: 26 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.026 | time: 0:18:12.1 | step: 27250 +epoch: 26 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:18:20.9 | step: 27260 +epoch: 27 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.016 | time: 0:18:29.2 | step: 27270 +epoch: 27 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:18:38.0 | step: 27280 +epoch: 27 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:18:46.8 | step: 27290 +epoch: 27 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.025 | time: 0:18:55.6 | step: 27300 +epoch: 27 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:19:04.4 | step: 27310 +epoch: 28 | 3/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.029 | time: 0:19:12.8 | step: 27320 +epoch: 28 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.032 | time: 0:19:21.5 | step: 27330 +epoch: 28 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:19:30.3 | step: 27340 +epoch: 28 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.035 | time: 0:19:39.1 | step: 27350 +epoch: 28 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:19:47.9 | step: 27360 +epoch: 29 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.011 | time: 0:19:56.3 | step: 27370 +epoch: 29 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.031 | time: 0:20:05.1 | step: 27380 +epoch: 29 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.026 | time: 0:20:13.9 | step: 27390 +epoch: 29 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:20:22.7 | step: 27400 +epoch: 29 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.005 | time: 0:20:31.1 | step: 27410 +epoch: 30 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.015 | time: 0:20:40.0 | step: 27420 +epoch: 30 | 19/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 0:20:48.8 | step: 27430 +epoch: 30 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:20:57.6 | step: 27440 +epoch: 30 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:21:06.4 | step: 27450 +epoch: 31 | 2/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.017 | time: 0:21:14.8 | step: 27460 +epoch: 31 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.031 | time: 0:21:23.5 | step: 27470 +epoch: 31 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:21:32.3 | step: 27480 +epoch: 31 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.057 | time: 0:21:41.1 | step: 27490 +epoch: 31 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 0:21:49.9 | step: 27500 +epoch: 32 | 5/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.034 | time: 0:21:58.2 | step: 27510 +epoch: 32 | 15/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:22:07.0 | step: 27520 +epoch: 32 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 0:22:15.8 | step: 27530 +epoch: 32 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.026 | time: 0:22:24.6 | step: 27540 +epoch: 32 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:22:33.3 | step: 27550 +epoch: 33 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.031 | time: 0:22:41.7 | step: 27560 +epoch: 33 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.033 | time: 0:22:50.5 | step: 27570 +epoch: 33 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:22:59.2 | step: 27580 +epoch: 33 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.025 | time: 0:23:08.0 | step: 27590 +epoch: 34 | 1/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.023 | time: 0:23:16.4 | step: 27600 +epoch: 34 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 0:23:25.2 | step: 27610 +epoch: 34 | 21/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.030 | time: 0:23:34.0 | step: 27620 +epoch: 34 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:23:42.7 | step: 27630 +epoch: 34 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:23:51.5 | step: 27640 +epoch: 35 | 4/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.031 | time: 0:23:59.9 | step: 27650 +epoch: 35 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.040 | time: 0:24:08.6 | step: 27660 +epoch: 35 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.037 | time: 0:24:17.4 | step: 27670 +epoch: 35 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:24:26.2 | step: 27680 +epoch: 35 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:24:35.0 | step: 27690 +epoch: 36 | 7/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.007 | time: 0:24:43.3 | step: 27700 +epoch: 36 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.004 | time: 0:24:52.1 | step: 27710 +epoch: 36 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.050 | time: 0:25:00.9 | step: 27720 +epoch: 36 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:25:09.7 | step: 27730 +epoch: 37 | 0/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.011 | time: 0:25:18.0 | step: 27740 +epoch: 37 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.025 | time: 0:25:26.8 | step: 27750 +epoch: 37 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:25:35.6 | step: 27760 +epoch: 37 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 0:25:44.4 | step: 27770 +epoch: 37 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:25:53.2 | step: 27780 +epoch: 38 | 3/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.010 | time: 0:26:01.6 | step: 27790 +epoch: 38 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:26:10.4 | step: 27800 +epoch: 38 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 0:26:19.2 | step: 27810 +epoch: 38 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:26:28.0 | step: 27820 +epoch: 38 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:26:36.8 | step: 27830 +epoch: 39 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.031 | time: 0:26:45.2 | step: 27840 +epoch: 39 | 16/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.021 | time: 0:26:54.0 | step: 27850 +epoch: 39 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:27:02.8 | step: 27860 +epoch: 39 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.024 | time: 0:27:11.6 | step: 27870 +epoch: 39 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.006 | time: 0:27:20.0 | step: 27880 +epoch: 40 | 9/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.006 | time: 0:27:28.8 | step: 27890 +epoch: 40 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 0:27:37.7 | step: 27900 +epoch: 40 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.040 | time: 0:27:46.4 | step: 27910 +epoch: 40 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 0:27:55.2 | step: 27920 +epoch: 41 | 2/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.008 | time: 0:28:03.6 | step: 27930 +epoch: 41 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:28:12.4 | step: 27940 +epoch: 41 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 0:28:21.2 | step: 27950 +epoch: 41 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:28:29.9 | step: 27960 +epoch: 41 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:28:38.7 | step: 27970 +epoch: 42 | 5/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.016 | time: 0:28:47.1 | step: 27980 +epoch: 42 | 15/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.030 | time: 0:28:55.9 | step: 27990 +epoch: 42 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 0:29:04.7 | step: 28000 +epoch: 42 | 35/ 47 | logs/44k/diffusion | batch/s: 0.09 | lr: 0.0002 | loss: 0.025 | time: 0:30:52.8 | step: 28010 +epoch: 42 | 45/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.010 | time: 0:31:01.9 | step: 28020 +epoch: 43 | 8/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 0:31:10.6 | step: 28030 +epoch: 43 | 18/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.009 | time: 0:31:19.6 | step: 28040 +epoch: 43 | 28/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.011 | time: 0:31:28.5 | step: 28050 +epoch: 43 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.005 | time: 0:31:37.2 | step: 28060 +epoch: 44 | 1/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.023 | time: 0:31:45.5 | step: 28070 +epoch: 44 | 11/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.030 | time: 0:31:54.2 | step: 28080 +epoch: 44 | 21/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.042 | time: 0:32:02.9 | step: 28090 +epoch: 44 | 31/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.020 | time: 0:32:11.6 | step: 28100 +epoch: 44 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 0:32:20.4 | step: 28110 +epoch: 45 | 4/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.021 | time: 0:32:28.8 | step: 28120 +epoch: 45 | 14/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 0:32:37.7 | step: 28130 +epoch: 45 | 24/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.016 | time: 0:32:46.6 | step: 28140 +epoch: 45 | 34/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:32:55.4 | step: 28150 +epoch: 45 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:33:04.2 | step: 28160 +epoch: 46 | 7/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.019 | time: 0:33:12.6 | step: 28170 +epoch: 46 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:33:21.3 | step: 28180 +epoch: 46 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:33:30.1 | step: 28190 +epoch: 46 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 0:33:38.9 | step: 28200 +epoch: 47 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.021 | time: 0:33:47.2 | step: 28210 +epoch: 47 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 0:33:56.0 | step: 28220 +epoch: 47 | 20/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 0:34:04.8 | step: 28230 +epoch: 47 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.046 | time: 0:34:13.6 | step: 28240 +epoch: 47 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:34:22.4 | step: 28250 +epoch: 48 | 3/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.028 | time: 0:34:30.8 | step: 28260 +epoch: 48 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.024 | time: 0:34:39.6 | step: 28270 +epoch: 48 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.030 | time: 0:34:48.4 | step: 28280 +epoch: 48 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.031 | time: 0:34:57.2 | step: 28290 +epoch: 48 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:35:05.9 | step: 28300 +epoch: 49 | 6/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.016 | time: 0:35:14.3 | step: 28310 +epoch: 49 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:35:23.1 | step: 28320 +epoch: 49 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:35:31.8 | step: 28330 +epoch: 49 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:35:40.6 | step: 28340 +epoch: 49 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.004 | time: 0:35:49.0 | step: 28350 +epoch: 50 | 9/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.021 | time: 0:35:57.9 | step: 28360 +epoch: 50 | 19/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:36:06.6 | step: 28370 +epoch: 50 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:36:15.4 | step: 28380 +epoch: 50 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.005 | time: 0:36:24.2 | step: 28390 +epoch: 51 | 2/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.020 | time: 0:36:32.6 | step: 28400 +epoch: 51 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 0:36:41.3 | step: 28410 +epoch: 51 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:36:50.1 | step: 28420 +epoch: 51 | 32/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 0:36:58.9 | step: 28430 +epoch: 51 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 0:37:07.7 | step: 28440 +epoch: 52 | 5/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.014 | time: 0:37:16.1 | step: 28450 +epoch: 52 | 15/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.033 | time: 0:37:24.9 | step: 28460 +epoch: 52 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 0:37:33.7 | step: 28470 +epoch: 52 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:37:42.4 | step: 28480 +epoch: 52 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.033 | time: 0:37:51.2 | step: 28490 +epoch: 53 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.012 | time: 0:37:59.6 | step: 28500 +epoch: 53 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:38:08.4 | step: 28510 +epoch: 53 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:38:17.1 | step: 28520 +epoch: 53 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 0:38:25.9 | step: 28530 +epoch: 54 | 1/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.036 | time: 0:38:34.3 | step: 28540 +epoch: 54 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 0:38:43.1 | step: 28550 +epoch: 54 | 21/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:38:51.9 | step: 28560 +epoch: 54 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:39:00.6 | step: 28570 +epoch: 54 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.024 | time: 0:39:09.4 | step: 28580 +epoch: 55 | 4/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.008 | time: 0:39:17.8 | step: 28590 +epoch: 55 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.026 | time: 0:39:26.6 | step: 28600 +epoch: 55 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:39:35.3 | step: 28610 +epoch: 55 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:39:44.1 | step: 28620 +epoch: 55 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:39:52.9 | step: 28630 +epoch: 56 | 7/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.007 | time: 0:40:01.3 | step: 28640 +epoch: 56 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:40:10.0 | step: 28650 +epoch: 56 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:40:18.8 | step: 28660 +epoch: 56 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:40:27.6 | step: 28670 +epoch: 57 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.019 | time: 0:40:36.0 | step: 28680 +epoch: 57 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.030 | time: 0:40:44.8 | step: 28690 +epoch: 57 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:40:53.5 | step: 28700 +epoch: 57 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:41:02.3 | step: 28710 +epoch: 57 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:41:11.1 | step: 28720 +epoch: 58 | 3/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.010 | time: 0:41:19.5 | step: 28730 +epoch: 58 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:41:28.2 | step: 28740 +epoch: 58 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 0:41:37.0 | step: 28750 +epoch: 58 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.033 | time: 0:41:45.8 | step: 28760 +epoch: 58 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.036 | time: 0:41:54.6 | step: 28770 +epoch: 59 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.035 | time: 0:42:03.0 | step: 28780 +epoch: 59 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 0:42:11.7 | step: 28790 +epoch: 59 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 0:42:20.5 | step: 28800 +epoch: 59 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:42:29.3 | step: 28810 +epoch: 59 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.011 | time: 0:42:37.7 | step: 28820 +epoch: 60 | 9/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.015 | time: 0:42:46.5 | step: 28830 +epoch: 60 | 19/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:42:55.3 | step: 28840 +epoch: 60 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 0:43:04.1 | step: 28850 +epoch: 60 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:43:12.9 | step: 28860 +epoch: 61 | 2/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.011 | time: 0:43:21.3 | step: 28870 +epoch: 61 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:43:30.0 | step: 28880 +epoch: 61 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 0:43:38.8 | step: 28890 +epoch: 61 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.043 | time: 0:43:47.6 | step: 28900 +epoch: 61 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:43:56.4 | step: 28910 +epoch: 62 | 5/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.008 | time: 0:44:04.7 | step: 28920 +epoch: 62 | 15/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.024 | time: 0:44:13.5 | step: 28930 +epoch: 62 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:44:22.3 | step: 28940 +epoch: 62 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:44:31.1 | step: 28950 +epoch: 62 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.033 | time: 0:44:39.9 | step: 28960 +epoch: 63 | 8/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.011 | time: 0:44:48.2 | step: 28970 +epoch: 63 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:44:57.0 | step: 28980 +epoch: 63 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 0:45:05.8 | step: 28990 +epoch: 63 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:45:14.6 | step: 29000 +epoch: 64 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.017 | time: 0:45:22.9 | step: 29010 +epoch: 64 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:45:31.7 | step: 29020 +epoch: 64 | 21/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.034 | time: 0:45:40.5 | step: 29030 +epoch: 64 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 0:45:49.3 | step: 29040 +epoch: 64 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:45:58.0 | step: 29050 +epoch: 65 | 4/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.020 | time: 0:46:06.4 | step: 29060 +epoch: 65 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 0:46:15.2 | step: 29070 +epoch: 65 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.025 | time: 0:46:24.0 | step: 29080 +epoch: 65 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 0:46:32.8 | step: 29090 +epoch: 65 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:46:41.5 | step: 29100 +epoch: 66 | 7/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.012 | time: 0:46:49.9 | step: 29110 +epoch: 66 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:46:58.7 | step: 29120 +epoch: 66 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:47:07.5 | step: 29130 +epoch: 66 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:47:16.2 | step: 29140 +epoch: 67 | 0/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.015 | time: 0:47:24.6 | step: 29150 +epoch: 67 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:47:33.4 | step: 29160 +epoch: 67 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 0:47:42.1 | step: 29170 +epoch: 67 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:47:50.9 | step: 29180 +epoch: 67 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 0:47:59.7 | step: 29190 +epoch: 68 | 3/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.019 | time: 0:48:08.1 | step: 29200 +epoch: 68 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.041 | time: 0:48:16.8 | step: 29210 +epoch: 68 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.025 | time: 0:48:25.6 | step: 29220 +epoch: 68 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:48:34.4 | step: 29230 +epoch: 68 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:48:43.2 | step: 29240 +epoch: 69 | 6/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.014 | time: 0:48:51.5 | step: 29250 +epoch: 69 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:49:00.3 | step: 29260 +epoch: 69 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.024 | time: 0:49:09.1 | step: 29270 +epoch: 69 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:49:17.9 | step: 29280 +epoch: 69 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.033 | time: 0:49:26.3 | step: 29290 +epoch: 70 | 9/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.011 | time: 0:49:35.1 | step: 29300 +epoch: 70 | 19/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:49:43.9 | step: 29310 +epoch: 70 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.045 | time: 0:49:52.7 | step: 29320 +epoch: 70 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:50:01.5 | step: 29330 +epoch: 71 | 2/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.017 | time: 0:50:09.8 | step: 29340 +epoch: 71 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:50:18.6 | step: 29350 +epoch: 71 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 0:50:27.4 | step: 29360 +epoch: 71 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:50:36.2 | step: 29370 +epoch: 71 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:50:44.9 | step: 29380 +epoch: 72 | 5/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.017 | time: 0:50:53.3 | step: 29390 +epoch: 72 | 15/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:51:02.1 | step: 29400 +epoch: 72 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.028 | time: 0:51:10.8 | step: 29410 +epoch: 72 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 0:51:19.6 | step: 29420 +epoch: 72 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 0:51:28.4 | step: 29430 +epoch: 73 | 8/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.016 | time: 0:51:36.8 | step: 29440 +epoch: 73 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 0:51:45.6 | step: 29450 +epoch: 73 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.045 | time: 0:51:54.3 | step: 29460 +epoch: 73 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 0:52:03.1 | step: 29470 +epoch: 74 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.015 | time: 0:52:11.5 | step: 29480 +epoch: 74 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:52:20.2 | step: 29490 +epoch: 74 | 21/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.025 | time: 0:52:29.0 | step: 29500 +epoch: 74 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:52:37.8 | step: 29510 +epoch: 74 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:52:46.6 | step: 29520 +epoch: 75 | 4/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.041 | time: 0:52:54.9 | step: 29530 +epoch: 75 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.034 | time: 0:53:03.7 | step: 29540 +epoch: 75 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:53:12.5 | step: 29550 +epoch: 75 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.026 | time: 0:53:21.3 | step: 29560 +epoch: 75 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:53:30.1 | step: 29570 +epoch: 76 | 7/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.019 | time: 0:53:38.4 | step: 29580 +epoch: 76 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 0:53:47.2 | step: 29590 +epoch: 76 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:53:56.0 | step: 29600 +epoch: 76 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 0:54:04.7 | step: 29610 +epoch: 77 | 0/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.022 | time: 0:54:13.1 | step: 29620 +epoch: 77 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 0:54:21.9 | step: 29630 +epoch: 77 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.030 | time: 0:54:30.6 | step: 29640 +epoch: 77 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:54:39.4 | step: 29650 +epoch: 77 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.046 | time: 0:54:48.2 | step: 29660 +epoch: 78 | 3/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.012 | time: 0:54:56.5 | step: 29670 +epoch: 78 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.039 | time: 0:55:05.3 | step: 29680 +epoch: 78 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.025 | time: 0:55:14.1 | step: 29690 +epoch: 78 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 0:55:22.9 | step: 29700 +epoch: 78 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:55:31.6 | step: 29710 +epoch: 79 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.011 | time: 0:55:40.0 | step: 29720 +epoch: 79 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:55:48.8 | step: 29730 +epoch: 79 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:55:57.6 | step: 29740 +epoch: 79 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 0:56:06.4 | step: 29750 +epoch: 79 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.007 | time: 0:56:14.7 | step: 29760 +epoch: 80 | 9/ 47 | logs/44k/diffusion | batch/s: 1.16 | lr: 0.0002 | loss: 0.029 | time: 0:56:23.7 | step: 29770 +epoch: 80 | 19/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 0:56:32.4 | step: 29780 +epoch: 80 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 0:56:41.2 | step: 29790 +epoch: 80 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:56:50.0 | step: 29800 +epoch: 81 | 2/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.027 | time: 0:56:58.3 | step: 29810 +epoch: 81 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 0:57:07.1 | step: 29820 +epoch: 81 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:57:15.9 | step: 29830 +epoch: 81 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:57:24.7 | step: 29840 +epoch: 81 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 0:57:33.5 | step: 29850 +epoch: 82 | 5/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.022 | time: 0:57:41.8 | step: 29860 +epoch: 82 | 15/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 0:57:50.6 | step: 29870 +epoch: 82 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.044 | time: 0:57:59.4 | step: 29880 +epoch: 82 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 0:58:08.2 | step: 29890 +epoch: 82 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:58:17.0 | step: 29900 +epoch: 83 | 8/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.025 | time: 0:58:25.3 | step: 29910 +epoch: 83 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 0:58:34.1 | step: 29920 +epoch: 83 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 0:58:42.8 | step: 29930 +epoch: 83 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.042 | time: 0:58:51.6 | step: 29940 +epoch: 84 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.050 | time: 0:59:00.0 | step: 29950 +epoch: 84 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.035 | time: 0:59:08.8 | step: 29960 +epoch: 84 | 21/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:59:17.6 | step: 29970 +epoch: 84 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 0:59:26.3 | step: 29980 +epoch: 84 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 0:59:35.1 | step: 29990 +epoch: 85 | 4/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.019 | time: 0:59:43.5 | step: 30000 +epoch: 85 | 14/ 47 | logs/44k/diffusion | batch/s: 0.11 | lr: 0.0002 | loss: 0.009 | time: 1:01:15.2 | step: 30010 +epoch: 85 | 24/ 47 | logs/44k/diffusion | batch/s: 1.12 | lr: 0.0002 | loss: 0.020 | time: 1:01:24.1 | step: 30020 +epoch: 85 | 34/ 47 | logs/44k/diffusion | batch/s: 1.09 | lr: 0.0002 | loss: 0.042 | time: 1:01:33.3 | step: 30030 +epoch: 85 | 44/ 47 | logs/44k/diffusion | batch/s: 1.11 | lr: 0.0002 | loss: 0.027 | time: 1:01:42.4 | step: 30040 +epoch: 86 | 7/ 47 | logs/44k/diffusion | batch/s: 1.18 | lr: 0.0002 | loss: 0.008 | time: 1:01:50.8 | step: 30050 +epoch: 86 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 1:01:59.5 | step: 30060 +epoch: 86 | 27/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.017 | time: 1:02:08.2 | step: 30070 +epoch: 86 | 37/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.023 | time: 1:02:16.9 | step: 30080 +epoch: 87 | 0/ 47 | logs/44k/diffusion | batch/s: 1.21 | lr: 0.0002 | loss: 0.024 | time: 1:02:25.2 | step: 30090 +epoch: 87 | 10/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.013 | time: 1:02:33.9 | step: 30100 +epoch: 87 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 1:02:42.7 | step: 30110 +epoch: 87 | 30/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 1:02:51.6 | step: 30120 +epoch: 87 | 40/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 1:03:00.4 | step: 30130 +epoch: 88 | 3/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.012 | time: 1:03:08.8 | step: 30140 +epoch: 88 | 13/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.025 | time: 1:03:17.7 | step: 30150 +epoch: 88 | 23/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.009 | time: 1:03:26.5 | step: 30160 +epoch: 88 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 1:03:35.2 | step: 30170 +epoch: 88 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 1:03:44.0 | step: 30180 +epoch: 89 | 6/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.013 | time: 1:03:52.4 | step: 30190 +epoch: 89 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 1:04:01.1 | step: 30200 +epoch: 89 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 1:04:09.9 | step: 30210 +epoch: 89 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 1:04:18.7 | step: 30220 +epoch: 89 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.019 | time: 1:04:27.1 | step: 30230 +epoch: 90 | 9/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.011 | time: 1:04:35.9 | step: 30240 +epoch: 90 | 19/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.028 | time: 1:04:44.7 | step: 30250 +epoch: 90 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 1:04:53.5 | step: 30260 +epoch: 90 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 1:05:02.3 | step: 30270 +epoch: 91 | 2/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.011 | time: 1:05:10.7 | step: 30280 +epoch: 91 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.021 | time: 1:05:19.4 | step: 30290 +epoch: 91 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 1:05:28.2 | step: 30300 +epoch: 91 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 1:05:37.0 | step: 30310 +epoch: 91 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 1:05:45.8 | step: 30320 +epoch: 92 | 5/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.009 | time: 1:05:54.1 | step: 30330 +epoch: 92 | 15/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 1:06:02.9 | step: 30340 +epoch: 92 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 1:06:11.7 | step: 30350 +epoch: 92 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.020 | time: 1:06:20.5 | step: 30360 +epoch: 92 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 1:06:29.2 | step: 30370 +epoch: 93 | 8/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.031 | time: 1:06:37.6 | step: 30380 +epoch: 93 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.026 | time: 1:06:46.4 | step: 30390 +epoch: 93 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.033 | time: 1:06:55.1 | step: 30400 +epoch: 93 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 1:07:03.9 | step: 30410 +epoch: 94 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.037 | time: 1:07:12.3 | step: 30420 +epoch: 94 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 1:07:21.1 | step: 30430 +epoch: 94 | 21/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 1:07:29.8 | step: 30440 +epoch: 94 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 1:07:38.6 | step: 30450 +epoch: 94 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 1:07:47.4 | step: 30460 +epoch: 95 | 4/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.013 | time: 1:07:55.8 | step: 30470 +epoch: 95 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.025 | time: 1:08:04.5 | step: 30480 +epoch: 95 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 1:08:13.3 | step: 30490 +epoch: 95 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.032 | time: 1:08:22.1 | step: 30500 +epoch: 95 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 1:08:30.9 | step: 30510 +epoch: 96 | 7/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.015 | time: 1:08:39.2 | step: 30520 +epoch: 96 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.030 | time: 1:08:48.0 | step: 30530 +epoch: 96 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 1:08:56.8 | step: 30540 +epoch: 96 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 1:09:05.6 | step: 30550 +epoch: 97 | 0/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.014 | time: 1:09:13.9 | step: 30560 +epoch: 97 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 1:09:22.7 | step: 30570 +epoch: 97 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 1:09:31.5 | step: 30580 +epoch: 97 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 1:09:40.3 | step: 30590 +epoch: 97 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.026 | time: 1:09:49.1 | step: 30600 +epoch: 98 | 3/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.027 | time: 1:09:57.5 | step: 30610 +epoch: 98 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 1:10:06.2 | step: 30620 +epoch: 98 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 1:10:15.1 | step: 30630 +epoch: 98 | 33/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 1:10:23.8 | step: 30640 +epoch: 98 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 1:10:32.6 | step: 30650 +epoch: 99 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.023 | time: 1:10:41.0 | step: 30660 +epoch: 99 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 1:10:49.8 | step: 30670 +epoch: 99 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 1:10:58.6 | step: 30680 +epoch: 99 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.035 | time: 1:11:07.4 | step: 30690 +epoch: 99 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.014 | time: 1:11:15.7 | step: 30700 +epoch: 100 | 9/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.033 | time: 1:11:24.6 | step: 30710 +epoch: 100 | 19/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 1:11:33.4 | step: 30720 +epoch: 100 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.030 | time: 1:11:42.2 | step: 30730 +epoch: 100 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 1:11:51.0 | step: 30740 +epoch: 101 | 2/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.031 | time: 1:11:59.3 | step: 30750 +epoch: 101 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.005 | time: 1:12:08.1 | step: 30760 +epoch: 101 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 1:12:16.9 | step: 30770 +epoch: 101 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 1:12:25.7 | step: 30780 +epoch: 101 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 1:12:34.5 | step: 30790 +epoch: 102 | 5/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.014 | time: 1:12:42.9 | step: 30800 +epoch: 102 | 15/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.018 | time: 1:12:51.7 | step: 30810 +epoch: 102 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 1:13:00.5 | step: 30820 +epoch: 102 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.028 | time: 1:13:09.3 | step: 30830 +epoch: 102 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 1:13:18.1 | step: 30840 +epoch: 103 | 8/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.029 | time: 1:13:26.4 | step: 30850 +epoch: 103 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 1:13:35.2 | step: 30860 +epoch: 103 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 1:13:44.0 | step: 30870 +epoch: 103 | 38/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.010 | time: 1:13:52.8 | step: 30880 +epoch: 104 | 1/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.029 | time: 1:14:01.2 | step: 30890 +epoch: 104 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.028 | time: 1:14:10.0 | step: 30900 +epoch: 104 | 21/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 1:14:18.8 | step: 30910 +epoch: 104 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.024 | time: 1:14:27.6 | step: 30920 +epoch: 104 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.030 | time: 1:14:36.4 | step: 30930 +epoch: 105 | 4/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.012 | time: 1:14:44.8 | step: 30940 +epoch: 105 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 1:14:53.6 | step: 30950 +epoch: 105 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.028 | time: 1:15:02.4 | step: 30960 +epoch: 105 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.040 | time: 1:15:11.1 | step: 30970 +epoch: 105 | 44/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.019 | time: 1:15:20.0 | step: 30980 +epoch: 106 | 7/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.025 | time: 1:15:28.3 | step: 30990 +epoch: 106 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 1:15:37.1 | step: 31000 +epoch: 106 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 1:15:45.9 | step: 31010 +epoch: 106 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 1:15:54.7 | step: 31020 +epoch: 107 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.034 | time: 1:16:03.1 | step: 31030 +epoch: 107 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 1:16:11.8 | step: 31040 +epoch: 107 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 1:16:20.6 | step: 31050 +epoch: 107 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.033 | time: 1:16:29.4 | step: 31060 +epoch: 107 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 1:16:38.2 | step: 31070 +epoch: 108 | 3/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.013 | time: 1:16:46.6 | step: 31080 +epoch: 108 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 1:16:55.4 | step: 31090 +epoch: 108 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 1:17:04.2 | step: 31100 +epoch: 108 | 33/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.012 | time: 1:17:13.0 | step: 31110 +epoch: 108 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 1:17:21.8 | step: 31120 +epoch: 109 | 6/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.015 | time: 1:17:30.2 | step: 31130 +epoch: 109 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.038 | time: 1:17:38.9 | step: 31140 +epoch: 109 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 1:17:47.7 | step: 31150 +epoch: 109 | 36/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 1:17:56.5 | step: 31160 +epoch: 109 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.074 | time: 1:18:04.9 | step: 31170 +epoch: 110 | 9/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.049 | time: 1:18:13.8 | step: 31180 +epoch: 110 | 19/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 1:18:22.6 | step: 31190 +epoch: 110 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 1:18:31.4 | step: 31200 +epoch: 110 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.026 | time: 1:18:40.2 | step: 31210 +epoch: 111 | 2/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.006 | time: 1:18:48.5 | step: 31220 +epoch: 111 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 1:18:57.3 | step: 31230 +epoch: 111 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.037 | time: 1:19:06.1 | step: 31240 +epoch: 111 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 1:19:14.9 | step: 31250 +epoch: 111 | 42/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.013 | time: 1:19:23.7 | step: 31260 +epoch: 112 | 5/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.010 | time: 1:19:32.1 | step: 31270 +epoch: 112 | 15/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 1:19:40.9 | step: 31280 +epoch: 112 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.037 | time: 1:19:49.7 | step: 31290 +epoch: 112 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 1:19:58.5 | step: 31300 +epoch: 112 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.036 | time: 1:20:07.3 | step: 31310 +epoch: 113 | 8/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.010 | time: 1:20:15.6 | step: 31320 +epoch: 113 | 18/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.006 | time: 1:20:24.5 | step: 31330 +epoch: 113 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.036 | time: 1:20:33.2 | step: 31340 +epoch: 113 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.033 | time: 1:20:42.0 | step: 31350 +epoch: 114 | 1/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.021 | time: 1:20:50.4 | step: 31360 +epoch: 114 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.030 | time: 1:20:59.2 | step: 31370 +epoch: 114 | 21/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 1:21:08.0 | step: 31380 +epoch: 114 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.038 | time: 1:21:16.8 | step: 31390 +epoch: 114 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.012 | time: 1:21:25.6 | step: 31400 +epoch: 115 | 4/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.013 | time: 1:21:34.0 | step: 31410 +epoch: 115 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.016 | time: 1:21:42.8 | step: 31420 +epoch: 115 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 1:21:51.6 | step: 31430 +epoch: 115 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.022 | time: 1:22:00.4 | step: 31440 +epoch: 115 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.005 | time: 1:22:09.2 | step: 31450 +epoch: 116 | 7/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.004 | time: 1:22:17.5 | step: 31460 +epoch: 116 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 1:22:26.3 | step: 31470 +epoch: 116 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 1:22:35.1 | step: 31480 +epoch: 116 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 1:22:43.9 | step: 31490 +epoch: 117 | 0/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.014 | time: 1:22:52.3 | step: 31500 +epoch: 117 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.011 | time: 1:23:01.1 | step: 31510 +epoch: 117 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 1:23:09.9 | step: 31520 +epoch: 117 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.031 | time: 1:23:18.7 | step: 31530 +epoch: 117 | 40/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 1:23:27.5 | step: 31540 +epoch: 118 | 3/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.011 | time: 1:23:35.9 | step: 31550 +epoch: 118 | 13/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 1:23:44.7 | step: 31560 +epoch: 118 | 23/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 1:23:53.5 | step: 31570 +epoch: 118 | 33/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.014 | time: 1:24:02.3 | step: 31580 +epoch: 118 | 43/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.004 | time: 1:24:11.1 | step: 31590 +epoch: 119 | 6/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.010 | time: 1:24:19.5 | step: 31600 +epoch: 119 | 16/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.008 | time: 1:24:28.3 | step: 31610 +epoch: 119 | 26/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.009 | time: 1:24:37.0 | step: 31620 +epoch: 119 | 36/ 47 | logs/44k/diffusion | batch/s: 1.13 | lr: 0.0002 | loss: 0.036 | time: 1:24:45.8 | step: 31630 +epoch: 119 | 46/ 47 | logs/44k/diffusion | batch/s: 1.15 | lr: 0.0002 | loss: 0.013 | time: 1:24:54.2 | step: 31640 +epoch: 120 | 9/ 47 | logs/44k/diffusion | batch/s: 1.17 | lr: 0.0002 | loss: 0.025 | time: 1:25:03.1 | step: 31650 +epoch: 120 | 19/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.040 | time: 1:25:11.9 | step: 31660 +epoch: 120 | 29/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.019 | time: 1:25:20.7 | step: 31670 +epoch: 120 | 39/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.015 | time: 1:25:29.4 | step: 31680 +epoch: 121 | 2/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.041 | time: 1:25:37.8 | step: 31690 +epoch: 121 | 12/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.026 | time: 1:25:46.6 | step: 31700 +epoch: 121 | 22/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 1:25:55.4 | step: 31710 +epoch: 121 | 32/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 1:26:04.1 | step: 31720 +epoch: 121 | 42/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.031 | time: 1:26:12.9 | step: 31730 +epoch: 122 | 5/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.052 | time: 1:26:21.3 | step: 31740 +epoch: 122 | 15/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 1:26:30.1 | step: 31750 +epoch: 122 | 25/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 1:26:38.9 | step: 31760 +epoch: 122 | 35/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.013 | time: 1:26:47.6 | step: 31770 +epoch: 122 | 45/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.032 | time: 1:26:56.4 | step: 31780 +epoch: 123 | 8/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.016 | time: 1:27:04.8 | step: 31790 +epoch: 123 | 18/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.025 | time: 1:27:13.6 | step: 31800 +epoch: 123 | 28/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.023 | time: 1:27:22.4 | step: 31810 +epoch: 123 | 38/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.005 | time: 1:27:31.1 | step: 31820 +epoch: 124 | 1/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.006 | time: 1:27:39.5 | step: 31830 +epoch: 124 | 11/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.029 | time: 1:27:48.3 | step: 31840 +epoch: 124 | 21/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.037 | time: 1:27:57.0 | step: 31850 +epoch: 124 | 31/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 1:28:05.8 | step: 31860 +epoch: 124 | 41/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 1:28:14.6 | step: 31870 +epoch: 125 | 4/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.004 | time: 1:28:23.0 | step: 31880 +epoch: 125 | 14/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.018 | time: 1:28:31.7 | step: 31890 +epoch: 125 | 24/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.027 | time: 1:28:40.5 | step: 31900 +epoch: 125 | 34/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.045 | time: 1:28:49.3 | step: 31910 +epoch: 125 | 44/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.007 | time: 1:28:58.1 | step: 31920 +epoch: 126 | 7/ 47 | logs/44k/diffusion | batch/s: 1.19 | lr: 0.0002 | loss: 0.021 | time: 1:29:06.4 | step: 31930 +epoch: 126 | 17/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.010 | time: 1:29:15.2 | step: 31940 +epoch: 126 | 27/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.014 | time: 1:29:24.0 | step: 31950 +epoch: 126 | 37/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.056 | time: 1:29:32.8 | step: 31960 +epoch: 127 | 0/ 47 | logs/44k/diffusion | batch/s: 1.20 | lr: 0.0002 | loss: 0.024 | time: 1:29:41.1 | step: 31970 +epoch: 127 | 10/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.006 | time: 1:29:49.9 | step: 31980 +epoch: 127 | 20/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.017 | time: 1:29:58.7 | step: 31990 +epoch: 127 | 30/ 47 | logs/44k/diffusion | batch/s: 1.14 | lr: 0.0002 | loss: 0.024 | time: 1:30:07.5 | step: 32000