From 08f39ff2969eb8b5588683b5c030ca6a28093cec Mon Sep 17 00:00:00 2001 From: Ashish Kumar Singh Date: Tue, 9 Jul 2024 01:15:07 +0530 Subject: [PATCH] fix: rendered to unrendered cells --- example notebooks/simple diffusion flax.ipynb | 5123 +---------------- 1 file changed, 1 insertion(+), 5122 deletions(-) diff --git a/example notebooks/simple diffusion flax.ipynb b/example notebooks/simple diffusion flax.ipynb index c40ddbb..dcfe9a5 100644 --- a/example notebooks/simple diffusion flax.ipynb +++ b/example notebooks/simple diffusion flax.ipynb @@ -1487,5132 +1487,11 @@ "execution_count": 14, "metadata": {}, "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "Epoch 1/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 1: 600step [00:51, 11.69step/s, loss=0.0594] \n", - "WARNING:absl:SaveArgs.aggregate is deprecated, please use custom TypeHandler (https://orbax.readthedocs.io/en/latest/custom_handlers.html#typehandler) or contact Orbax team to migrate before August 1st, 2024.\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 0\n", - "\n", - "\tEpoch 1 completed. Avg Loss: 0.09080573171377182, Time: 51.33s, Best Loss: 0.09080573171377182\n", - "\n", - "Epoch 2/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 2: 600step [00:27, 21.58step/s, loss=0.0239] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 1\n", - "\n", - "\tEpoch 2 completed. Avg Loss: 0.04645586386322975, Time: 27.81s, Best Loss: 0.04645586386322975\n", - "\n", - "Epoch 3/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 3: 600step [00:27, 21.73step/s, loss=0.0563] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 2\n", - "\n", - "\tEpoch 3 completed. Avg Loss: 0.042779020965099335, Time: 27.62s, Best Loss: 0.042779020965099335\n", - "\n", - "Epoch 4/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 4: 600step [00:27, 22.06step/s, loss=0.0189] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 3\n", - "\n", - "\tEpoch 4 completed. Avg Loss: 0.040192410349845886, Time: 27.20s, Best Loss: 0.040192410349845886\n", - "\n", - "Epoch 5/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 5: 600step [00:26, 22.81step/s, loss=0.0186] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 4\n", - "\n", - "\tEpoch 5 completed. Avg Loss: 0.03994264826178551, Time: 26.30s, Best Loss: 0.03994264826178551\n", - "\n", - "Epoch 6/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 6: 600step [00:26, 22.43step/s, loss=0.0245] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 5\n", - "\n", - "\tEpoch 6 completed. Avg Loss: 0.03801179677248001, Time: 26.76s, Best Loss: 0.03801179677248001\n", - "\n", - "Epoch 7/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 7: 600step [00:26, 22.46step/s, loss=0.0216] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 6\n", - "\n", - "\tEpoch 7 completed. Avg Loss: 0.03678169101476669, Time: 26.71s, Best Loss: 0.03678169101476669\n", - "\n", - "Epoch 8/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 8: 600step [00:26, 22.29step/s, loss=0.0740] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 7\n", - "\n", - "\tEpoch 8 completed. Avg Loss: 0.036518700420856476, Time: 26.92s, Best Loss: 0.036518700420856476\n", - "\n", - "Epoch 9/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 9: 600step [00:26, 22.34step/s, loss=0.0503] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 8\n", - "\n", - "\tEpoch 9 completed. Avg Loss: 0.03589194267988205, Time: 26.85s, Best Loss: 0.03589194267988205\n", - "\n", - "Epoch 10/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 10: 600step [00:27, 21.78step/s, loss=0.0533] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 10 completed. Avg Loss: 0.03621599078178406, Time: 27.54s, Best Loss: 0.03589194267988205\n", - "\n", - "Epoch 11/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 11: 600step [00:26, 22.60step/s, loss=0.0402] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 10\n", - "\n", - "\tEpoch 11 completed. Avg Loss: 0.03573783487081528, Time: 26.55s, Best Loss: 0.03573783487081528\n", - "\n", - "Epoch 12/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 12: 600step [00:26, 22.64step/s, loss=0.0367] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 11\n", - "\n", - "\tEpoch 12 completed. Avg Loss: 0.034702200442552567, Time: 26.51s, Best Loss: 0.034702200442552567\n", - "\n", - "Epoch 13/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 13: 600step [00:26, 22.48step/s, loss=0.0246] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 12\n", - "\n", - "\tEpoch 13 completed. Avg Loss: 0.03454558551311493, Time: 26.70s, Best Loss: 0.03454558551311493\n", - "\n", - "Epoch 14/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 14: 600step [00:27, 22.10step/s, loss=0.0354] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 14 completed. Avg Loss: 0.035031046718358994, Time: 27.15s, Best Loss: 0.03454558551311493\n", - "\n", - "Epoch 15/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 15: 600step [00:27, 21.99step/s, loss=0.0424] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 15 completed. Avg Loss: 0.035461414605379105, Time: 27.29s, Best Loss: 0.03454558551311493\n", - "\n", - "Epoch 16/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 16: 600step [00:27, 22.03step/s, loss=0.0337] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 15\n", - "\n", - "\tEpoch 16 completed. Avg Loss: 0.03424842655658722, Time: 27.23s, Best Loss: 0.03424842655658722\n", - "\n", - "Epoch 17/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 17: 600step [00:26, 22.91step/s, loss=0.0222] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 16\n", - "\n", - "\tEpoch 17 completed. Avg Loss: 0.033752940595149994, Time: 26.19s, Best Loss: 0.033752940595149994\n", - "\n", - "Epoch 18/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 18: 600step [00:26, 22.51step/s, loss=0.0538] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 18 completed. Avg Loss: 0.03469432145357132, Time: 26.66s, Best Loss: 0.033752940595149994\n", - "\n", - "Epoch 19/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 19: 600step [00:27, 22.12step/s, loss=0.0197] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 19 completed. Avg Loss: 0.034264132380485535, Time: 27.13s, Best Loss: 0.033752940595149994\n", - "\n", - "Epoch 20/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 20: 600step [00:27, 21.63step/s, loss=0.0118] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 19\n", - "\n", - "\tEpoch 20 completed. Avg Loss: 0.03256053477525711, Time: 27.74s, Best Loss: 0.03256053477525711\n", - "\n", - "Epoch 21/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 21: 600step [00:27, 22.14step/s, loss=0.0198] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 21 completed. Avg Loss: 0.033350907266139984, Time: 27.10s, Best Loss: 0.03256053477525711\n", - "\n", - "Epoch 22/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 22: 600step [00:26, 22.47step/s, loss=0.0218] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 22 completed. Avg Loss: 0.034185633063316345, Time: 26.70s, Best Loss: 0.03256053477525711\n", - "\n", - "Epoch 23/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 23: 600step [00:27, 21.68step/s, loss=0.0411] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 23 completed. Avg Loss: 0.034173738211393356, Time: 27.67s, Best Loss: 0.03256053477525711\n", - "\n", - "Epoch 24/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 24: 600step [00:27, 21.53step/s, loss=0.0406] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 24 completed. Avg Loss: 0.03313639014959335, Time: 27.87s, Best Loss: 0.03256053477525711\n", - "\n", - "Epoch 25/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 25: 600step [00:18, 31.92step/s, loss=0.0241] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 25 completed. Avg Loss: 0.03290305286645889, Time: 18.80s, Best Loss: 0.03256053477525711\n", - "\n", - "Epoch 26/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 26: 600step [00:21, 27.95step/s, loss=0.0206] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 26 completed. Avg Loss: 0.03345366567373276, Time: 21.47s, Best Loss: 0.03256053477525711\n", - "\n", - "Epoch 27/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 27: 600step [00:25, 23.49step/s, loss=0.0299] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 27 completed. Avg Loss: 0.032624438405036926, Time: 25.54s, Best Loss: 0.03256053477525711\n", - "\n", - "Epoch 28/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 28: 600step [00:23, 25.11step/s, loss=0.0473] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 27\n", - "\n", - "\tEpoch 28 completed. Avg Loss: 0.03211237117648125, Time: 23.90s, Best Loss: 0.03211237117648125\n", - "\n", - "Epoch 29/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 29: 600step [00:22, 26.20step/s, loss=0.0322] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 29 completed. Avg Loss: 0.03273330256342888, Time: 22.90s, Best Loss: 0.03211237117648125\n", - "\n", - "Epoch 30/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 30: 600step [00:25, 23.53step/s, loss=0.0371] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 29\n", - "\n", - "\tEpoch 30 completed. Avg Loss: 0.03202373906970024, Time: 25.50s, Best Loss: 0.03202373906970024\n", - "\n", - "Epoch 31/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 31: 600step [00:24, 24.64step/s, loss=0.0211] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 31 completed. Avg Loss: 0.03251713141798973, Time: 24.35s, Best Loss: 0.03202373906970024\n", - "\n", - "Epoch 32/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 32: 600step [00:22, 26.33step/s, loss=0.0689] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 32 completed. Avg Loss: 0.0334281325340271, Time: 22.79s, Best Loss: 0.03202373906970024\n", - "\n", - "Epoch 33/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 33: 600step [00:22, 26.28step/s, loss=0.0466] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 33 completed. Avg Loss: 0.03295937180519104, Time: 22.83s, Best Loss: 0.03202373906970024\n", - "\n", - "Epoch 34/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 34: 600step [00:27, 21.63step/s, loss=0.0171] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 34 completed. Avg Loss: 0.032456181943416595, Time: 27.75s, Best Loss: 0.03202373906970024\n", - "\n", - "Epoch 35/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 35: 600step [00:25, 23.58step/s, loss=0.0297] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 35 completed. Avg Loss: 0.03269660845398903, Time: 25.45s, Best Loss: 0.03202373906970024\n", - "\n", - "Epoch 36/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 36: 600step [00:24, 24.04step/s, loss=0.0572] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 36 completed. Avg Loss: 0.03425575792789459, Time: 24.96s, Best Loss: 0.03202373906970024\n", - "\n", - "Epoch 37/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 37: 600step [00:26, 22.62step/s, loss=0.0235] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 37 completed. Avg Loss: 0.03270065784454346, Time: 26.52s, Best Loss: 0.03202373906970024\n", - "\n", - "Epoch 38/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 38: 600step [00:24, 24.04step/s, loss=0.0510] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 38 completed. Avg Loss: 0.032990530133247375, Time: 24.96s, Best Loss: 0.03202373906970024\n", - "\n", - "Epoch 39/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 39: 600step [00:22, 26.41step/s, loss=0.0302] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 38\n", - "\n", - "\tEpoch 39 completed. Avg Loss: 0.03196239843964577, Time: 22.72s, Best Loss: 0.03196239843964577\n", - "\n", - "Epoch 40/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 40: 600step [00:23, 25.78step/s, loss=0.0395] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 40 completed. Avg Loss: 0.03205239772796631, Time: 23.27s, Best Loss: 0.03196239843964577\n", - "\n", - "Epoch 41/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 41: 600step [00:23, 25.37step/s, loss=0.0491] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 41 completed. Avg Loss: 0.033081263303756714, Time: 23.66s, Best Loss: 0.03196239843964577\n", - "\n", - "Epoch 42/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 42: 600step [00:22, 26.68step/s, loss=0.0184] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 42 completed. Avg Loss: 0.03300606831908226, Time: 22.49s, Best Loss: 0.03196239843964577\n", - "\n", - "Epoch 43/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 43: 600step [00:22, 26.73step/s, loss=0.0232] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 43 completed. Avg Loss: 0.03200429305434227, Time: 22.45s, Best Loss: 0.03196239843964577\n", - "\n", - "Epoch 44/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 44: 600step [00:21, 27.29step/s, loss=0.0268] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 44 completed. Avg Loss: 0.033106084913015366, Time: 21.98s, Best Loss: 0.03196239843964577\n", - "\n", - "Epoch 45/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 45: 600step [00:22, 27.24step/s, loss=0.0168] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 45 completed. Avg Loss: 0.03220209851861, Time: 22.03s, Best Loss: 0.03196239843964577\n", - "\n", - "Epoch 46/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 46: 600step [00:22, 26.78step/s, loss=0.0212] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 46 completed. Avg Loss: 0.032359909266233444, Time: 22.41s, Best Loss: 0.03196239843964577\n", - "\n", - "Epoch 47/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 47: 600step [00:22, 27.27step/s, loss=0.0318] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 47 completed. Avg Loss: 0.03270978108048439, Time: 22.01s, Best Loss: 0.03196239843964577\n", - "\n", - "Epoch 48/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 48: 600step [00:22, 27.03step/s, loss=0.0259] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 48 completed. Avg Loss: 0.032479140907526016, Time: 22.20s, Best Loss: 0.03196239843964577\n", - "\n", - "Epoch 49/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 49: 600step [00:21, 27.34step/s, loss=0.0499] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 49 completed. Avg Loss: 0.03310719132423401, Time: 21.95s, Best Loss: 0.03196239843964577\n", - "\n", - "Epoch 50/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 50: 600step [00:21, 27.54step/s, loss=0.0396] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 49\n", - "\n", - "\tEpoch 50 completed. Avg Loss: 0.031949710100889206, Time: 21.78s, Best Loss: 0.031949710100889206\n", - "\n", - "Epoch 51/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 51: 600step [00:24, 24.89step/s, loss=0.0132] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 51 completed. Avg Loss: 0.0325763039290905, Time: 24.11s, Best Loss: 0.031949710100889206\n", - "\n", - "Epoch 52/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 52: 600step [00:23, 25.14step/s, loss=0.0392] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 52 completed. Avg Loss: 0.03241783753037453, Time: 23.86s, Best Loss: 0.031949710100889206\n", - "\n", - "Epoch 53/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 53: 600step [00:26, 22.95step/s, loss=0.0231] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 52\n", - "\n", - "\tEpoch 53 completed. Avg Loss: 0.03191205859184265, Time: 26.15s, Best Loss: 0.03191205859184265\n", - "\n", - "Epoch 54/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 54: 600step [00:26, 22.95step/s, loss=0.0502] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 54 completed. Avg Loss: 0.032294221222400665, Time: 26.14s, Best Loss: 0.03191205859184265\n", - "\n", - "Epoch 55/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 55: 600step [00:22, 26.48step/s, loss=0.0344] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 54\n", - "\n", - "\tEpoch 55 completed. Avg Loss: 0.03169962763786316, Time: 22.66s, Best Loss: 0.03169962763786316\n", - "\n", - "Epoch 56/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 56: 600step [00:22, 27.05step/s, loss=0.0232] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 56 completed. Avg Loss: 0.03263591229915619, Time: 22.18s, Best Loss: 0.03169962763786316\n", - "\n", - "Epoch 57/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 57: 600step [00:22, 26.93step/s, loss=0.0401] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 57 completed. Avg Loss: 0.031775712966918945, Time: 22.28s, Best Loss: 0.03169962763786316\n", - "\n", - "Epoch 58/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 58: 600step [00:22, 27.26step/s, loss=0.0376] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 58 completed. Avg Loss: 0.03211182728409767, Time: 22.01s, Best Loss: 0.03169962763786316\n", - "\n", - "Epoch 59/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 59: 600step [00:22, 27.23step/s, loss=0.0265] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 59 completed. Avg Loss: 0.03240136802196503, Time: 22.03s, Best Loss: 0.03169962763786316\n", - "\n", - "Epoch 60/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 60: 600step [00:24, 24.07step/s, loss=0.0421] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 59\n", - "\n", - "\tEpoch 60 completed. Avg Loss: 0.031421538442373276, Time: 24.93s, Best Loss: 0.031421538442373276\n", - "\n", - "Epoch 61/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 61: 600step [00:23, 25.69step/s, loss=0.0281] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 61 completed. Avg Loss: 0.031802840530872345, Time: 23.36s, Best Loss: 0.031421538442373276\n", - "\n", - "Epoch 62/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 62: 600step [00:22, 26.60step/s, loss=0.0312] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 62 completed. Avg Loss: 0.03187322989106178, Time: 22.56s, Best Loss: 0.031421538442373276\n", - "\n", - "Epoch 63/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 63: 600step [00:23, 26.02step/s, loss=0.0141] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 63 completed. Avg Loss: 0.03185668960213661, Time: 23.06s, Best Loss: 0.031421538442373276\n", - "\n", - "Epoch 64/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 64: 600step [00:23, 25.18step/s, loss=0.0558] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 63\n", - "\n", - "\tEpoch 64 completed. Avg Loss: 0.031077852472662926, Time: 23.83s, Best Loss: 0.031077852472662926\n", - "\n", - "Epoch 65/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 65: 600step [00:23, 25.11step/s, loss=0.0207] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 65 completed. Avg Loss: 0.031984418630599976, Time: 23.89s, Best Loss: 0.031077852472662926\n", - "\n", - "Epoch 66/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 66: 600step [00:22, 26.59step/s, loss=0.0520] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 66 completed. Avg Loss: 0.03188655897974968, Time: 22.57s, Best Loss: 0.031077852472662926\n", - "\n", - "Epoch 67/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 67: 600step [00:23, 25.07step/s, loss=0.0205] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 67 completed. Avg Loss: 0.03299045190215111, Time: 23.94s, Best Loss: 0.031077852472662926\n", - "\n", - "Epoch 68/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 68: 600step [00:23, 25.12step/s, loss=0.0330] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 68 completed. Avg Loss: 0.03133696690201759, Time: 23.89s, Best Loss: 0.031077852472662926\n", - "\n", - "Epoch 69/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 69: 600step [00:23, 25.99step/s, loss=0.0631] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 68\n", - "\n", - "\tEpoch 69 completed. Avg Loss: 0.03065236657857895, Time: 23.09s, Best Loss: 0.03065236657857895\n", - "\n", - "Epoch 70/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 70: 600step [00:23, 25.69step/s, loss=0.0546] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 70 completed. Avg Loss: 0.03172782063484192, Time: 23.36s, Best Loss: 0.03065236657857895\n", - "\n", - "Epoch 71/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 71: 600step [00:23, 25.97step/s, loss=0.0438] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 71 completed. Avg Loss: 0.031718868762254715, Time: 23.11s, Best Loss: 0.03065236657857895\n", - "\n", - "Epoch 72/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 72: 600step [00:23, 25.07step/s, loss=0.0269] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 72 completed. Avg Loss: 0.03231620788574219, Time: 23.94s, Best Loss: 0.03065236657857895\n", - "\n", - "Epoch 73/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 73: 600step [00:23, 25.47step/s, loss=0.0182] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 73 completed. Avg Loss: 0.03190268576145172, Time: 23.56s, Best Loss: 0.03065236657857895\n", - "\n", - "Epoch 74/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 74: 600step [00:27, 22.11step/s, loss=0.0326] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 74 completed. Avg Loss: 0.03146028146147728, Time: 27.15s, Best Loss: 0.03065236657857895\n", - "\n", - "Epoch 75/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 75: 600step [00:25, 23.58step/s, loss=0.0228] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 75 completed. Avg Loss: 0.0313989520072937, Time: 25.45s, Best Loss: 0.03065236657857895\n", - "\n", - "Epoch 76/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 76: 600step [00:23, 25.88step/s, loss=0.0330] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 75\n", - "\n", - "\tEpoch 76 completed. Avg Loss: 0.030625171959400177, Time: 23.19s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 77/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 77: 600step [00:25, 23.69step/s, loss=0.0253] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 77 completed. Avg Loss: 0.03182491660118103, Time: 25.33s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 78/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 78: 600step [00:22, 26.10step/s, loss=0.0276] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 78 completed. Avg Loss: 0.031595341861248016, Time: 22.99s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 79/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 79: 600step [00:23, 25.78step/s, loss=0.0195] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 79 completed. Avg Loss: 0.031896837055683136, Time: 23.27s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 80/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 80: 600step [00:22, 26.57step/s, loss=0.0212] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 80 completed. Avg Loss: 0.031346891075372696, Time: 22.58s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 81/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 81: 600step [00:22, 27.17step/s, loss=0.0330] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 81 completed. Avg Loss: 0.03143094852566719, Time: 22.09s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 82/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 82: 600step [00:26, 22.94step/s, loss=0.0407] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 82 completed. Avg Loss: 0.030973270535469055, Time: 26.16s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 83/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 83: 600step [00:24, 24.84step/s, loss=0.0462] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 83 completed. Avg Loss: 0.0317712239921093, Time: 24.16s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 84/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 84: 600step [00:21, 28.47step/s, loss=0.0114] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 84 completed. Avg Loss: 0.03178401663899422, Time: 21.07s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 85/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 85: 600step [00:21, 28.07step/s, loss=0.0182] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 85 completed. Avg Loss: 0.03204609453678131, Time: 21.38s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 86/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 86: 600step [00:21, 28.54step/s, loss=0.0382] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 86 completed. Avg Loss: 0.03121379390358925, Time: 21.03s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 87/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 87: 600step [00:20, 28.65step/s, loss=0.0246] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 87 completed. Avg Loss: 0.03142351284623146, Time: 20.94s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 88/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 88: 600step [00:21, 28.47step/s, loss=0.0239] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 88 completed. Avg Loss: 0.03096529096364975, Time: 21.07s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 89/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 89: 600step [00:21, 28.33step/s, loss=0.0214] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 89 completed. Avg Loss: 0.031511031091213226, Time: 21.18s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 90/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 90: 600step [00:21, 28.21step/s, loss=0.0280] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 90 completed. Avg Loss: 0.03126688674092293, Time: 21.27s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 91/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 91: 600step [00:20, 28.58step/s, loss=0.0231] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 91 completed. Avg Loss: 0.03170185536146164, Time: 21.00s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 92/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 92: 600step [00:21, 28.55step/s, loss=0.0358] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 92 completed. Avg Loss: 0.030834142118692398, Time: 21.01s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 93/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 93: 600step [00:21, 28.38step/s, loss=0.0330] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 93 completed. Avg Loss: 0.031204644590616226, Time: 21.14s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 94/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 94: 600step [00:21, 27.96step/s, loss=0.0366] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 94 completed. Avg Loss: 0.031423285603523254, Time: 21.46s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 95/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 95: 600step [00:21, 28.16step/s, loss=0.0221] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 95 completed. Avg Loss: 0.03122376836836338, Time: 21.31s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 96/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 96: 600step [00:21, 28.39step/s, loss=0.0323] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 96 completed. Avg Loss: 0.03140410780906677, Time: 21.14s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 97/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 97: 600step [00:21, 28.26step/s, loss=0.0471] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 97 completed. Avg Loss: 0.03193888068199158, Time: 21.23s, Best Loss: 0.030625171959400177\n", - "\n", - "Epoch 98/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 98: 600step [00:21, 28.33step/s, loss=0.0331] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 97\n", - "\n", - "\tEpoch 98 completed. Avg Loss: 0.030622398480772972, Time: 21.18s, Best Loss: 0.030622398480772972\n", - "\n", - "Epoch 99/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 99: 600step [00:21, 27.97step/s, loss=0.0350] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 98\n", - "\n", - "\tEpoch 99 completed. Avg Loss: 0.0298920925706625, Time: 21.46s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 100/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 100: 600step [00:21, 27.45step/s, loss=0.0137] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 100 completed. Avg Loss: 0.030855681747198105, Time: 21.86s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 101/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 101: 600step [00:25, 23.18step/s, loss=0.0363] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 101 completed. Avg Loss: 0.03179168701171875, Time: 25.89s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 102/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 102: 600step [00:22, 26.83step/s, loss=0.0485] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 102 completed. Avg Loss: 0.03130820021033287, Time: 22.36s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 103/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 103: 600step [00:21, 27.65step/s, loss=0.0311] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 103 completed. Avg Loss: 0.03206488490104675, Time: 21.70s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 104/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 104: 600step [00:21, 27.72step/s, loss=0.0236] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 104 completed. Avg Loss: 0.031366076320409775, Time: 21.64s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 105/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 105: 600step [00:22, 26.34step/s, loss=0.0372] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 105 completed. Avg Loss: 0.031081004068255424, Time: 22.78s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 106/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 106: 600step [00:23, 25.59step/s, loss=0.0324] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 106 completed. Avg Loss: 0.03168484568595886, Time: 23.45s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 107/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 107: 600step [00:22, 26.54step/s, loss=0.0422] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 107 completed. Avg Loss: 0.03104880452156067, Time: 22.61s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 108/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 108: 600step [00:25, 23.83step/s, loss=0.0156] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 108 completed. Avg Loss: 0.03202491253614426, Time: 25.18s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 109/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 109: 600step [00:22, 27.04step/s, loss=0.0446] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 109 completed. Avg Loss: 0.032374314963817596, Time: 22.19s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 110/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 110: 600step [00:23, 25.12step/s, loss=0.0241] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 110 completed. Avg Loss: 0.03126741200685501, Time: 23.89s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 111/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 111: 600step [00:23, 25.31step/s, loss=0.0331] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 111 completed. Avg Loss: 0.030626872554421425, Time: 23.71s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 112/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 112: 600step [00:22, 26.43step/s, loss=0.0266] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 112 completed. Avg Loss: 0.031008537858724594, Time: 22.70s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 113/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 113: 600step [00:23, 25.16step/s, loss=0.0268] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 113 completed. Avg Loss: 0.030490227043628693, Time: 23.85s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 114/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 114: 600step [00:26, 23.02step/s, loss=0.0302] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 114 completed. Avg Loss: 0.03127073496580124, Time: 26.07s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 115/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 115: 600step [00:23, 25.61step/s, loss=0.0160] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 115 completed. Avg Loss: 0.030524272471666336, Time: 23.43s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 116/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 116: 600step [00:23, 25.82step/s, loss=0.0361] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 116 completed. Avg Loss: 0.031035978347063065, Time: 23.24s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 117/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 117: 600step [00:23, 25.70step/s, loss=0.0146] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 117 completed. Avg Loss: 0.03169717639684677, Time: 23.34s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 118/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 118: 600step [00:22, 26.99step/s, loss=0.0289] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 118 completed. Avg Loss: 0.030680254101753235, Time: 22.23s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 119/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 119: 600step [00:22, 26.85step/s, loss=0.0117] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 119 completed. Avg Loss: 0.03039366565644741, Time: 22.35s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 120/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 120: 600step [00:22, 26.09step/s, loss=0.0395] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 120 completed. Avg Loss: 0.031135018914937973, Time: 23.00s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 121/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 121: 600step [00:22, 26.41step/s, loss=0.0379] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 121 completed. Avg Loss: 0.03172043338418007, Time: 22.72s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 122/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 122: 600step [00:22, 26.42step/s, loss=0.0304] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 122 completed. Avg Loss: 0.03116608038544655, Time: 22.71s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 123/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 123: 600step [00:22, 26.42step/s, loss=0.0393] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 123 completed. Avg Loss: 0.031194454059004784, Time: 22.71s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 124/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 124: 600step [00:22, 26.27step/s, loss=0.0276] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 124 completed. Avg Loss: 0.030779557302594185, Time: 22.84s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 125/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 125: 600step [00:22, 27.07step/s, loss=0.0471] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 125 completed. Avg Loss: 0.03019583597779274, Time: 22.17s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 126/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 126: 600step [00:22, 26.74step/s, loss=0.0226] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 126 completed. Avg Loss: 0.03080889955163002, Time: 22.44s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 127/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 127: 600step [00:22, 26.49step/s, loss=0.0386] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 127 completed. Avg Loss: 0.030673792585730553, Time: 22.65s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 128/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 128: 600step [00:26, 22.33step/s, loss=0.0492] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 128 completed. Avg Loss: 0.031561076641082764, Time: 26.87s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 129/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 129: 600step [00:24, 24.31step/s, loss=0.0140] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 129 completed. Avg Loss: 0.031432755291461945, Time: 24.68s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 130/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 130: 600step [00:22, 26.40step/s, loss=0.0161] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 130 completed. Avg Loss: 0.03164326399564743, Time: 22.73s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 131/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 131: 600step [00:22, 26.14step/s, loss=0.0170] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 131 completed. Avg Loss: 0.03005044162273407, Time: 22.96s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 132/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 132: 600step [00:22, 26.31step/s, loss=0.0295] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 132 completed. Avg Loss: 0.030689632520079613, Time: 22.81s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 133/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 133: 600step [00:23, 25.72step/s, loss=0.0208] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 133 completed. Avg Loss: 0.03157074376940727, Time: 23.33s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 134/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 134: 600step [00:23, 25.85step/s, loss=0.0482] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 134 completed. Avg Loss: 0.03071059286594391, Time: 23.22s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 135/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 135: 600step [00:23, 25.49step/s, loss=0.0154] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 135 completed. Avg Loss: 0.03057778999209404, Time: 23.54s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 136/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 136: 600step [00:23, 26.01step/s, loss=0.0476] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 136 completed. Avg Loss: 0.030958708375692368, Time: 23.07s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 137/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 137: 600step [00:23, 25.76step/s, loss=0.0563] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 137 completed. Avg Loss: 0.030941111966967583, Time: 23.30s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 138/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 138: 600step [00:23, 25.47step/s, loss=0.0581] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 138 completed. Avg Loss: 0.03045061230659485, Time: 23.56s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 139/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 139: 600step [00:23, 26.08step/s, loss=0.0249] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 139 completed. Avg Loss: 0.030742166563868523, Time: 23.00s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 140/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 140: 600step [00:23, 25.93step/s, loss=0.0356] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 140 completed. Avg Loss: 0.03120078146457672, Time: 23.14s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 141/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 141: 600step [00:22, 26.26step/s, loss=0.0278] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 141 completed. Avg Loss: 0.031024526804685593, Time: 22.85s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 142/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 142: 600step [00:23, 25.97step/s, loss=0.0132] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 142 completed. Avg Loss: 0.031216904520988464, Time: 23.11s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 143/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 143: 600step [00:23, 25.85step/s, loss=0.0237] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 143 completed. Avg Loss: 0.03126555308699608, Time: 23.21s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 144/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 144: 600step [00:23, 25.69step/s, loss=0.0269] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 144 completed. Avg Loss: 0.030669977888464928, Time: 23.35s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 145/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 145: 600step [00:23, 25.55step/s, loss=0.0283] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 145 completed. Avg Loss: 0.030286889523267746, Time: 23.48s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 146/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 146: 600step [00:25, 23.39step/s, loss=0.0252] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 146 completed. Avg Loss: 0.03138629347085953, Time: 25.66s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 147/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 147: 600step [00:23, 25.41step/s, loss=0.0232] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 147 completed. Avg Loss: 0.03070307895541191, Time: 23.62s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 148/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 148: 600step [00:22, 26.76step/s, loss=0.0402] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 148 completed. Avg Loss: 0.03043060004711151, Time: 22.43s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 149/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 149: 600step [00:25, 23.93step/s, loss=0.0373] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 149 completed. Avg Loss: 0.0307303499430418, Time: 25.07s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 150/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 150: 600step [00:23, 25.63step/s, loss=0.0289] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 150 completed. Avg Loss: 0.030935684219002724, Time: 23.41s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 151/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 151: 600step [00:22, 26.20step/s, loss=0.0307] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 151 completed. Avg Loss: 0.03086274117231369, Time: 22.90s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 152/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 152: 600step [00:24, 24.58step/s, loss=0.0146] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 152 completed. Avg Loss: 0.0310970451682806, Time: 24.42s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 153/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 153: 600step [00:27, 22.13step/s, loss=0.0177] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 153 completed. Avg Loss: 0.030520562082529068, Time: 27.11s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 154/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 154: 600step [00:25, 23.39step/s, loss=0.0216] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 154 completed. Avg Loss: 0.030300742015242577, Time: 25.65s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 155/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 155: 600step [00:22, 26.96step/s, loss=0.0367] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 155 completed. Avg Loss: 0.030584856867790222, Time: 22.26s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 156/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 156: 600step [00:22, 26.31step/s, loss=0.0227] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 156 completed. Avg Loss: 0.030916517600417137, Time: 22.81s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 157/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 157: 600step [00:23, 25.72step/s, loss=0.0245] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 157 completed. Avg Loss: 0.030586332082748413, Time: 23.33s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 158/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 158: 600step [00:23, 25.97step/s, loss=0.0191] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 158 completed. Avg Loss: 0.031091608107089996, Time: 23.10s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 159/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 159: 600step [00:24, 24.99step/s, loss=0.0317] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 159 completed. Avg Loss: 0.03185242414474487, Time: 24.01s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 160/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 160: 600step [00:22, 26.24step/s, loss=0.0340] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 160 completed. Avg Loss: 0.030392343178391457, Time: 22.87s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 161/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 161: 600step [00:23, 25.83step/s, loss=0.0286] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 161 completed. Avg Loss: 0.0304632019251585, Time: 23.23s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 162/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 162: 600step [00:25, 23.75step/s, loss=0.0140] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 162 completed. Avg Loss: 0.03184927627444267, Time: 25.27s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 163/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 163: 600step [00:24, 24.10step/s, loss=0.0482] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 163 completed. Avg Loss: 0.030112819746136665, Time: 24.90s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 164/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 164: 600step [00:26, 23.02step/s, loss=0.0367] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 164 completed. Avg Loss: 0.03130125626921654, Time: 26.06s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 165/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 165: 600step [00:25, 23.71step/s, loss=0.0228] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 165 completed. Avg Loss: 0.03048659861087799, Time: 25.31s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 166/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 166: 600step [00:25, 23.94step/s, loss=0.0170] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 166 completed. Avg Loss: 0.030602067708969116, Time: 25.07s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 167/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 167: 600step [00:24, 24.73step/s, loss=0.0467] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 167 completed. Avg Loss: 0.030904268845915794, Time: 24.26s, Best Loss: 0.0298920925706625\n", - "\n", - "Epoch 168/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 168: 600step [00:26, 22.66step/s, loss=0.0392] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 167\n", - "\n", - "\tEpoch 168 completed. Avg Loss: 0.029834823682904243, Time: 26.48s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 169/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 169: 600step [00:25, 23.66step/s, loss=0.0174] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 169 completed. Avg Loss: 0.03110351599752903, Time: 25.36s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 170/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 170: 600step [00:23, 25.40step/s, loss=0.0253] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 170 completed. Avg Loss: 0.031386617571115494, Time: 23.63s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 171/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 171: 600step [00:26, 22.98step/s, loss=0.0361] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 171 completed. Avg Loss: 0.030754121020436287, Time: 26.11s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 172/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 172: 600step [00:27, 21.95step/s, loss=0.0404] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 172 completed. Avg Loss: 0.030754534527659416, Time: 27.34s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 173/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 173: 600step [00:25, 23.15step/s, loss=0.0240] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 173 completed. Avg Loss: 0.03044099733233452, Time: 25.92s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 174/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 174: 600step [00:28, 21.06step/s, loss=0.0243] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 174 completed. Avg Loss: 0.031532712280750275, Time: 28.50s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 175/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 175: 600step [00:25, 23.98step/s, loss=0.0387] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 175 completed. Avg Loss: 0.030652254819869995, Time: 25.03s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 176/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 176: 600step [00:24, 24.04step/s, loss=0.0272] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 176 completed. Avg Loss: 0.029988424852490425, Time: 24.96s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 177/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 177: 600step [00:24, 24.60step/s, loss=0.0379] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 177 completed. Avg Loss: 0.030592622235417366, Time: 24.40s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 178/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 178: 600step [00:25, 23.78step/s, loss=0.0438] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 178 completed. Avg Loss: 0.030984899029135704, Time: 25.23s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 179/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 179: 600step [00:25, 23.41step/s, loss=0.0469] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 179 completed. Avg Loss: 0.029900571331381798, Time: 25.63s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 180/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 180: 600step [00:25, 23.69step/s, loss=0.0168] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 180 completed. Avg Loss: 0.030912701040506363, Time: 25.33s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 181/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 181: 600step [00:26, 22.91step/s, loss=0.0251] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 181 completed. Avg Loss: 0.03021235018968582, Time: 26.20s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 182/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 182: 600step [00:27, 21.80step/s, loss=0.0286] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 182 completed. Avg Loss: 0.030836468562483788, Time: 27.52s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 183/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 183: 600step [00:25, 23.50step/s, loss=0.0452] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 183 completed. Avg Loss: 0.031009651720523834, Time: 25.54s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 184/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 184: 600step [00:22, 26.90step/s, loss=0.0409] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 184 completed. Avg Loss: 0.030340110883116722, Time: 22.31s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 185/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 185: 600step [00:24, 24.00step/s, loss=0.0237] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 185 completed. Avg Loss: 0.030099017545580864, Time: 25.00s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 186/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 186: 600step [00:25, 23.92step/s, loss=0.0345] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 186 completed. Avg Loss: 0.030865279957652092, Time: 25.09s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 187/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 187: 600step [00:22, 26.22step/s, loss=0.0336] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 187 completed. Avg Loss: 0.03092220425605774, Time: 22.88s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 188/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 188: 600step [00:22, 27.27step/s, loss=0.0389] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 188 completed. Avg Loss: 0.030810778960585594, Time: 22.01s, Best Loss: 0.029834823682904243\n", - "\n", - "Epoch 189/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 189: 600step [00:19, 30.28step/s, loss=0.0355] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Saving model at epoch 188\n", - "\n", - "\tEpoch 189 completed. Avg Loss: 0.02911863848567009, Time: 19.82s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 190/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 190: 600step [00:19, 30.03step/s, loss=0.0549] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 190 completed. Avg Loss: 0.031167929992079735, Time: 19.98s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 191/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 191: 600step [00:20, 29.81step/s, loss=0.0253] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 191 completed. Avg Loss: 0.030371375381946564, Time: 20.13s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 192/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 192: 600step [00:20, 29.23step/s, loss=0.0347] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 192 completed. Avg Loss: 0.03068062663078308, Time: 20.53s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 193/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 193: 600step [00:20, 28.99step/s, loss=0.0416] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 193 completed. Avg Loss: 0.030108770355582237, Time: 20.70s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 194/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 194: 600step [00:20, 28.96step/s, loss=0.0178] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 194 completed. Avg Loss: 0.030193457379937172, Time: 20.72s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 195/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 195: 600step [00:20, 29.86step/s, loss=0.0293] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 195 completed. Avg Loss: 0.03137557953596115, Time: 20.10s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 196/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 196: 600step [00:21, 27.79step/s, loss=0.0274] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 196 completed. Avg Loss: 0.030947834253311157, Time: 21.59s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 197/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 197: 600step [00:20, 29.48step/s, loss=0.0274] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 197 completed. Avg Loss: 0.031006354838609695, Time: 20.35s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 198/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 198: 600step [00:20, 29.10step/s, loss=0.0138] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 198 completed. Avg Loss: 0.031136009842157364, Time: 20.62s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 199/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 199: 600step [00:21, 28.12step/s, loss=0.0359] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 199 completed. Avg Loss: 0.030296465381979942, Time: 21.34s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 200/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 200: 600step [00:20, 29.85step/s, loss=0.0443] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 200 completed. Avg Loss: 0.030657414346933365, Time: 20.10s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 201/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 201: 600step [00:20, 28.76step/s, loss=0.0229] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 201 completed. Avg Loss: 0.03059197962284088, Time: 20.86s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 202/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 202: 600step [00:20, 28.78step/s, loss=0.0175] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 202 completed. Avg Loss: 0.030891722068190575, Time: 20.85s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 203/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 203: 600step [00:20, 29.47step/s, loss=0.0454] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 203 completed. Avg Loss: 0.030515819787979126, Time: 20.36s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 204/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 204: 600step [00:20, 29.51step/s, loss=0.0491] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 204 completed. Avg Loss: 0.03112410381436348, Time: 20.34s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 205/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 205: 600step [00:20, 28.82step/s, loss=0.0167] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 205 completed. Avg Loss: 0.031512875109910965, Time: 20.82s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 206/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 206: 600step [00:20, 29.32step/s, loss=0.0279] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 206 completed. Avg Loss: 0.029946276918053627, Time: 20.47s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 207/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 207: 600step [00:20, 28.64step/s, loss=0.0235] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 207 completed. Avg Loss: 0.029766127467155457, Time: 20.95s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 208/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 208: 600step [00:20, 29.07step/s, loss=0.0206] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 208 completed. Avg Loss: 0.030870771035552025, Time: 20.64s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 209/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 209: 600step [00:20, 29.93step/s, loss=0.0502] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 209 completed. Avg Loss: 0.03100993111729622, Time: 20.05s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 210/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 210: 600step [00:20, 29.88step/s, loss=0.0215] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 210 completed. Avg Loss: 0.03065209835767746, Time: 20.08s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 211/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 211: 600step [00:21, 28.51step/s, loss=0.0383] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 211 completed. Avg Loss: 0.031462348997592926, Time: 21.05s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 212/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 212: 600step [00:21, 28.31step/s, loss=0.0377] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 212 completed. Avg Loss: 0.029879948124289513, Time: 21.20s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 213/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 213: 600step [00:21, 28.25step/s, loss=0.0291] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 213 completed. Avg Loss: 0.03128215670585632, Time: 21.24s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 214/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 214: 600step [00:21, 28.21step/s, loss=0.0177] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 214 completed. Avg Loss: 0.03068498894572258, Time: 21.27s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 215/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 215: 600step [00:21, 28.07step/s, loss=0.0154] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 215 completed. Avg Loss: 0.030377749353647232, Time: 21.38s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 216/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 216: 600step [00:21, 28.45step/s, loss=0.0387] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 216 completed. Avg Loss: 0.030554519966244698, Time: 21.09s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 217/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 217: 600step [00:21, 27.92step/s, loss=0.0195] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 217 completed. Avg Loss: 0.029797246679663658, Time: 21.49s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 218/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 218: 600step [00:21, 28.50step/s, loss=0.0367] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 218 completed. Avg Loss: 0.029915928840637207, Time: 21.06s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 219/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 219: 600step [00:19, 30.38step/s, loss=0.0350] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 219 completed. Avg Loss: 0.03033987432718277, Time: 19.75s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 220/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 220: 600step [00:20, 28.64step/s, loss=0.0602] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 220 completed. Avg Loss: 0.030266499146819115, Time: 20.95s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 221/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 221: 600step [00:20, 28.93step/s, loss=0.0303] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 221 completed. Avg Loss: 0.03022736683487892, Time: 20.74s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 222/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 222: 600step [00:20, 28.71step/s, loss=0.0281] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 222 completed. Avg Loss: 0.031702592968940735, Time: 20.90s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 223/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 223: 600step [00:21, 28.46step/s, loss=0.0138] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 223 completed. Avg Loss: 0.030798694118857384, Time: 21.08s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 224/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 224: 600step [00:20, 29.95step/s, loss=0.0582] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 224 completed. Avg Loss: 0.03008972480893135, Time: 20.03s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 225/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 225: 600step [00:20, 29.44step/s, loss=0.0370] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 225 completed. Avg Loss: 0.029286356642842293, Time: 20.38s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 226/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 226: 600step [00:20, 29.35step/s, loss=0.0269] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 226 completed. Avg Loss: 0.03143226355314255, Time: 20.44s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 227/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 227: 600step [00:20, 29.35step/s, loss=0.0173] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 227 completed. Avg Loss: 0.031141705811023712, Time: 20.45s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 228/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 228: 600step [00:20, 29.24step/s, loss=0.0245] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 228 completed. Avg Loss: 0.030557889491319656, Time: 20.52s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 229/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 229: 600step [00:20, 29.63step/s, loss=0.0288] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 229 completed. Avg Loss: 0.02997661754488945, Time: 20.25s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 230/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 230: 600step [00:21, 27.93step/s, loss=0.0154] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 230 completed. Avg Loss: 0.030890755355358124, Time: 21.48s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 231/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 231: 600step [00:21, 28.02step/s, loss=0.0221] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 231 completed. Avg Loss: 0.029879407957196236, Time: 21.41s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 232/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 232: 600step [00:20, 29.00step/s, loss=0.0302] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 232 completed. Avg Loss: 0.031005728989839554, Time: 20.69s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 233/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 233: 600step [00:20, 28.77step/s, loss=0.0239] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 233 completed. Avg Loss: 0.030774911865592003, Time: 20.85s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 234/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 234: 600step [00:20, 29.54step/s, loss=0.0151] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 234 completed. Avg Loss: 0.029269268736243248, Time: 20.31s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 235/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 235: 600step [00:20, 29.18step/s, loss=0.0296] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 235 completed. Avg Loss: 0.030035896226763725, Time: 20.56s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 236/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 236: 600step [00:20, 29.17step/s, loss=0.0147] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 236 completed. Avg Loss: 0.030141755938529968, Time: 20.57s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 237/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 237: 600step [00:20, 28.97step/s, loss=0.0403] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 237 completed. Avg Loss: 0.03023518994450569, Time: 20.71s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 238/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 238: 600step [00:20, 29.03step/s, loss=0.0431] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 238 completed. Avg Loss: 0.029967201873660088, Time: 20.67s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 239/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 239: 600step [00:20, 29.77step/s, loss=0.0297] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 239 completed. Avg Loss: 0.03024066798388958, Time: 20.15s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 240/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 240: 600step [00:20, 28.97step/s, loss=0.0308] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 240 completed. Avg Loss: 0.029853347688913345, Time: 20.71s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 241/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 241: 600step [00:20, 28.92step/s, loss=0.0225] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 241 completed. Avg Loss: 0.029862258583307266, Time: 20.75s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 242/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 242: 600step [00:21, 28.07step/s, loss=0.0456] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 242 completed. Avg Loss: 0.030556395649909973, Time: 21.38s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 243/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 243: 600step [00:21, 28.35step/s, loss=0.0220] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 243 completed. Avg Loss: 0.031456153839826584, Time: 21.17s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 244/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 244: 600step [00:20, 28.64step/s, loss=0.0269] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 244 completed. Avg Loss: 0.029869651421904564, Time: 20.95s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 245/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 245: 600step [00:20, 29.57step/s, loss=0.0352] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 245 completed. Avg Loss: 0.030350862070918083, Time: 20.29s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 246/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 246: 600step [00:20, 29.44step/s, loss=0.0639] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 246 completed. Avg Loss: 0.0302216075360775, Time: 20.38s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 247/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 247: 600step [00:20, 29.86step/s, loss=0.0327] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 247 completed. Avg Loss: 0.029878510162234306, Time: 20.10s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 248/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 248: 600step [00:20, 29.62step/s, loss=0.0334] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 248 completed. Avg Loss: 0.03063737414777279, Time: 20.26s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 249/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 249: 600step [00:20, 29.84step/s, loss=0.0346] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 249 completed. Avg Loss: 0.030474552884697914, Time: 20.11s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 250/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 250: 600step [00:20, 28.66step/s, loss=0.0253] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 250 completed. Avg Loss: 0.030552174896001816, Time: 20.94s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 251/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 251: 600step [00:19, 30.28step/s, loss=0.0221] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 251 completed. Avg Loss: 0.02930343523621559, Time: 19.82s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 252/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 252: 600step [00:20, 28.75step/s, loss=0.0402] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 252 completed. Avg Loss: 0.029680443927645683, Time: 20.87s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 253/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 253: 600step [00:20, 28.62step/s, loss=0.0140] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 253 completed. Avg Loss: 0.030639704316854477, Time: 20.97s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 254/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 254: 600step [00:20, 29.12step/s, loss=0.0363] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 254 completed. Avg Loss: 0.029463477432727814, Time: 20.60s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 255/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 255: 600step [00:20, 29.22step/s, loss=0.0191] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 255 completed. Avg Loss: 0.03154565021395683, Time: 20.53s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 256/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 256: 600step [00:21, 27.80step/s, loss=0.0394] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 256 completed. Avg Loss: 0.02973053604364395, Time: 21.58s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 257/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 257: 600step [00:20, 29.81step/s, loss=0.0243] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 257 completed. Avg Loss: 0.030894488096237183, Time: 20.13s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 258/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 258: 600step [00:20, 29.26step/s, loss=0.0312] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 258 completed. Avg Loss: 0.03097139485180378, Time: 20.51s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 259/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 259: 600step [00:20, 28.79step/s, loss=0.0589] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 259 completed. Avg Loss: 0.029975291341543198, Time: 20.84s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 260/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 260: 600step [00:20, 29.79step/s, loss=0.0248] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 260 completed. Avg Loss: 0.03074849396944046, Time: 20.14s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 261/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 261: 600step [00:20, 29.40step/s, loss=0.0368] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 261 completed. Avg Loss: 0.03127008676528931, Time: 20.41s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 262/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 262: 600step [00:20, 28.85step/s, loss=0.0454] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 262 completed. Avg Loss: 0.030147749930620193, Time: 20.80s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 263/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 263: 600step [00:20, 29.61step/s, loss=0.0247] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 263 completed. Avg Loss: 0.030923856422305107, Time: 20.26s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 264/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 264: 600step [00:20, 29.70step/s, loss=0.0466] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 264 completed. Avg Loss: 0.030110353603959084, Time: 20.20s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 265/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 265: 600step [00:20, 28.70step/s, loss=0.0189] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 265 completed. Avg Loss: 0.030306534841656685, Time: 20.91s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 266/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 266: 600step [00:21, 28.26step/s, loss=0.0191] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 266 completed. Avg Loss: 0.02932608872652054, Time: 21.24s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 267/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 267: 600step [00:20, 28.90step/s, loss=0.0459] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 267 completed. Avg Loss: 0.030413834378123283, Time: 20.77s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 268/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 268: 600step [00:20, 28.95step/s, loss=0.0102] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 268 completed. Avg Loss: 0.029550213366746902, Time: 20.73s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 269/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 269: 600step [00:20, 29.31step/s, loss=0.0158] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 269 completed. Avg Loss: 0.030407404527068138, Time: 20.47s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 270/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 270: 600step [00:20, 28.70step/s, loss=0.0359] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 270 completed. Avg Loss: 0.02956535294651985, Time: 20.91s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 271/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 271: 600step [00:20, 28.73step/s, loss=0.0159] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 271 completed. Avg Loss: 0.02983720600605011, Time: 20.88s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 272/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 272: 600step [00:20, 29.15step/s, loss=0.0231] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 272 completed. Avg Loss: 0.030363643541932106, Time: 20.58s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 273/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 273: 600step [00:21, 28.34step/s, loss=0.0296] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 273 completed. Avg Loss: 0.030253378674387932, Time: 21.17s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 274/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 274: 600step [00:20, 29.46step/s, loss=0.0121] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 274 completed. Avg Loss: 0.030917268246412277, Time: 20.37s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 275/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 275: 600step [00:20, 29.32step/s, loss=0.0518] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 275 completed. Avg Loss: 0.030820336192846298, Time: 20.46s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 276/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 276: 600step [00:20, 29.73step/s, loss=0.0183] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 276 completed. Avg Loss: 0.031120145693421364, Time: 20.18s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 277/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 277: 600step [00:20, 28.88step/s, loss=0.0338] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 277 completed. Avg Loss: 0.030239492654800415, Time: 20.78s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 278/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 278: 600step [00:20, 29.24step/s, loss=0.0222] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 278 completed. Avg Loss: 0.031044285744428635, Time: 20.52s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 279/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 279: 600step [00:20, 29.75step/s, loss=0.0470] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 279 completed. Avg Loss: 0.030430959537625313, Time: 20.17s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 280/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 280: 600step [00:21, 27.89step/s, loss=0.0263] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 280 completed. Avg Loss: 0.030406493693590164, Time: 21.52s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 281/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 281: 600step [00:20, 28.78step/s, loss=0.0704] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 281 completed. Avg Loss: 0.030351663008332253, Time: 20.85s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 282/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 282: 600step [00:19, 30.44step/s, loss=0.0385] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 282 completed. Avg Loss: 0.030156703665852547, Time: 19.71s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 283/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 283: 600step [00:20, 29.18step/s, loss=0.0740] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 283 completed. Avg Loss: 0.02955285646021366, Time: 20.56s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 284/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 284: 600step [00:20, 28.87step/s, loss=0.0382] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 284 completed. Avg Loss: 0.0296962708234787, Time: 20.78s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 285/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 285: 600step [00:21, 28.47step/s, loss=0.0317] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 285 completed. Avg Loss: 0.03034166991710663, Time: 21.08s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 286/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 286: 600step [00:21, 28.08step/s, loss=0.0231] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 286 completed. Avg Loss: 0.029358938336372375, Time: 21.37s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 287/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 287: 600step [00:21, 28.09step/s, loss=0.0349] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 287 completed. Avg Loss: 0.03014751896262169, Time: 21.36s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 288/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 288: 600step [00:20, 29.49step/s, loss=0.0142] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 288 completed. Avg Loss: 0.029915982857346535, Time: 20.35s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 289/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 289: 600step [00:20, 29.99step/s, loss=0.0335] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 289 completed. Avg Loss: 0.02998582273721695, Time: 20.01s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 290/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 290: 600step [00:20, 28.97step/s, loss=0.0297] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 290 completed. Avg Loss: 0.029476497322320938, Time: 20.71s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 291/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 291: 600step [00:21, 28.27step/s, loss=0.0260] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 291 completed. Avg Loss: 0.030181851238012314, Time: 21.23s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 292/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 292: 600step [00:21, 28.18step/s, loss=0.0260] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 292 completed. Avg Loss: 0.030212005600333214, Time: 21.29s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 293/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 293: 600step [00:20, 29.79step/s, loss=0.0129] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 293 completed. Avg Loss: 0.03067186288535595, Time: 20.14s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 294/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 294: 600step [00:20, 29.47step/s, loss=0.0101] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 294 completed. Avg Loss: 0.02944846637547016, Time: 20.36s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 295/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 295: 600step [00:20, 28.69step/s, loss=0.0264] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 295 completed. Avg Loss: 0.030761005356907845, Time: 20.92s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 296/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 296: 600step [00:20, 28.84step/s, loss=0.0317] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 296 completed. Avg Loss: 0.03056473284959793, Time: 20.81s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 297/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 297: 600step [00:20, 29.19step/s, loss=0.0288] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 297 completed. Avg Loss: 0.030081303790211678, Time: 20.55s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 298/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 298: 600step [00:20, 29.03step/s, loss=0.0319] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 298 completed. Avg Loss: 0.030031388625502586, Time: 20.67s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 299/500\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\t\tEpoch 299: 600step [00:21, 28.27step/s, loss=0.0135] \n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "\tEpoch 299 completed. Avg Loss: 0.02981877140700817, Time: 21.23s, Best Loss: 0.02911863848567009\n", - "\n", - "Epoch 300/500\n" - ] - }, { "name": "stderr", "output_type": "stream", "text": [ - "\t\tEpoch 300: 59%|███████████████████▎ | 300/511 [00:08<00:06, 34.21step/s, loss=0.0200]" + "\t\tEpoch 323: 39%|████████████▉ | 200/511 [00:04<00:06, 48.78step/s, loss=0.0191]" ] } ],