diff --git "a/inference.ipynb" "b/inference.ipynb"
new file mode 100644--- /dev/null
+++ "b/inference.ipynb"
@@ -0,0 +1 @@
+{"nbformat":4,"nbformat_minor":0,"metadata":{"accelerator":"GPU","colab":{"name":"hhhh.ipynb","provenance":[],"collapsed_sections":[]},"kernelspec":{"display_name":"Python 3","name":"python3"}},"cells":[{"cell_type":"code","metadata":{"id":"8qEqdj8u0gdN","colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"status":"ok","timestamp":1659796105720,"user_tz":-180,"elapsed":12,"user":{"displayName":"Ivan Ivanov","userId":"14212634423080719601"}},"outputId":"178ab62d-db65-4cd2-c1b2-fa8a0ce9491c"},"source":["!nvidia-smi -L\n","import psutil\n","print(psutil.virtual_memory())\n","\n","lemodel = 'slon'\n","leartist = 'unknown'\n","legenre = 'unknown'\n","leeventlog = False"],"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["GPU 0: Tesla T4 (UUID: GPU-1d6551b6-262e-815d-1255-6b5128ef486c)\n","svmem(total=13617745920, available=12766134272, percent=6.3, used=600608768, free=10925678592, active=975699968, inactive=1472458752, buffers=115712000, cached=1975746560, shared=1241088, slab=136245248)\n"]}]},
{"cell_type":"code","metadata":{"id":"ZPdMgaH_BPGN","colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"status":"ok","timestamp":1659796129619,"user_tz":-180,"elapsed":23904,"user":{"displayName":"Ivan Ivanov","userId":"14212634423080719601"}},"outputId":"e6033314-c5e3-4631-d475-0559c6a086a5"},"source":["from google.colab import drive\n","drive.mount('/content/gdrive')"],"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["Mounted at /content/gdrive\n"]}]},
{"cell_type":"markdown","metadata":{"id":"UXXsstiqTSxI"},"source":["🔮 Setup 🔮"]},
{"cell_type":"code","metadata":{"id":"e1jVq3CbTSxI","colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"status":"ok","timestamp":1659796210286,"user_tz":-180,"elapsed":80676,"user":{"displayName":"Ivan Ivanov","userId":"14212634423080719601"}},"outputId":"48a15649-5605-47bf-b624-24e83ba0f636"},"source":[
"!pip install git+https://github.com/openai/jukebox.git\n",
"!git clone https://github.com/openai/jukebox.git\n",
"!pip install av==8.1.0\n",
"!pip install tensorboardX \n",
"import importlib.util\n",
"import os\n",
"import shutil\n",
"\n",
"lemodelpath = '/content/gdrive/MyDrive/juke/' + lemodel + '_prior/checkpoint_latest.pth.tar'\n",
"leaudio_files_dir = '/content/gdrive/MyDrive/' + lemodel\n",
"lepriorname = lemodel + '_prior'\n",
"\n",
"print(lemodelpath,leaudio_files_dir,lepriorname,os.path.isfile(lemodelpath))\n",
"\n",
"# lepriorname is spliced into hparams.py as a variable name, so reject anything that is not an identifier.\n",
"assert lepriorname.isidentifier(), repr(lepriorname) + ' is not a valid Python identifier'\n",
"\n",
"# Locate the pip-installed package instead of hard-coding the interpreter's site-packages path.\n",
"# The hparams.py check skips the freshly cloned ./jukebox repo root, which is not the package itself.\n",
"importlib.invalidate_caches()\n",
"lespec = importlib.util.find_spec('jukebox')\n",
"lecandidates = list(lespec.submodule_search_locations or []) if lespec else []\n",
"lepkgdirs = [d for d in lecandidates if os.path.isfile(os.path.join(d, 'hparams.py'))]\n",
"assert lepkgdirs, 'installed jukebox package not found'\n",
"lepkgdir = lepkgdirs[0]\n",
"\n",
"\n",
"def lepatch(path, edit):\n",
"    \"\"\"Rewrite `path` as edit(pristine_text).\n",
"\n",
"    The first call saves the untouched file as path + '.orig'; every call\n",
"    patches from that copy, so re-running this cell never stacks patches and\n",
"    always reflects the current lemodel / leartist / legenre / leeventlog.\n",
"    \"\"\"\n",
"    backup = path + '.orig'\n",
"    if not os.path.isfile(backup):\n",
"        shutil.copyfile(path, backup)\n",
"    with open(backup, 'rt') as src:\n",
"        pristine = src.read()\n",
"    with open(path, 'wt') as dst:\n",
"        dst.write(edit(pristine))\n",
"\n",
"\n",
"############### To Change to Google Drive\n",
"\n",
"lepatch(os.path.join(lepkgdir, 'utils', 'logger.py'), lambda text: text.replace('logdir = f\"{hps.local_logdir}/{hps.name}\"', 'logdir = f\"/content/gdrive/MyDrive/juke/{hps.name}\"'))\n",
"\n",
"############### To Sample with Google Drive\n",
"\n",
"# repr() keeps the generated source valid even when a path or name contains a quote.\n",
"lehparams = '\\n'.join([\n",
"    '',\n",
"    lepriorname + ' = Hyperparams()',\n",
"    lepriorname + '.update(prior_1b_lyrics)',\n",
"    lepriorname + '.restore_prior=' + repr(lemodelpath),\n",
"    lepriorname + '.level=2',\n",
"    'HPARAMS_REGISTRY[' + repr(lepriorname) + '] = ' + lepriorname,\n",
"    '',\n",
"])\n",
"\n",
"\n",
"def lepatch_hparams(text):\n",
"    \"\"\"Lower min_duration and register the fine-tuned prior at the end of hparams.py.\"\"\"\n",
"    #text = text.replace('y_bins=(10,100)','y_bins=(604, 7898)')\n",
"    text = text.replace('min_duration=60.0','min_duration=24.0')\n",
"    #text = text.replace('max_duration=600.0','max_duration=666.0')\n",
"    return text + lehparams\n",
"\n",
"\n",
"lepatch(os.path.join(lepkgdir, 'hparams.py'), lepatch_hparams)\n",
"\n",
"####################### To get Artist Genre, Lyrics\n",
"\n",
"# Appended at module level so the patch does not depend on the indentation of get_metadata's body.\n",
"# The file is read inside a with-block; the previous injected code wrote fin.close without calling it.\n",
"lelyrics = '''\n",
"\n",
"def _read_lyrics(filename):\n",
"    import os\n",
"    letx = filename.replace('.wav','.txt').replace('.mp3','.txt')\n",
"    print(letx)\n",
"    if not os.path.isfile(letx):\n",
"        return \"\"\n",
"    with open(letx, \"rt\") as fin:\n",
"        lyr = fin.read()\n",
"    print('yes')\n",
"    return lyr\n",
"'''\n",
"\n",
"lepatch(os.path.join(lepkgdir, 'data', 'files_dataset.py'), lambda text: text.replace('return None, None, None', 'return %r, %r, _read_lyrics(filename)' % (leartist, legenre)) + lelyrics)\n",
"\n",
"####################### step print\n",
"\n",
"\n",
"def lepatch_train(text):\n",
"    \"\"\"Print the step counter after log_inputs and, unless leeventlog is set, comment out logger.flush().\"\"\"\n",
"    text = text.replace('log_inputs(orig_model, logger, x_in, y, x_out, hps)','log_inputs(orig_model, logger, x_in, y, x_out, hps);print(colored(\"steps:\" + str(logger.iters),\"magenta\"))')\n",
"    if not leeventlog:\n",
"        text = text.replace('logger.flush()','#logger.flush()')\n",
"    return 'from termcolor import colored\\n\\n' + text\n",
"\n",
"\n",
"lepatch('/content/jukebox/jukebox/train.py', lepatch_train)\n",
"\n",
"\n",
"def lepatch_make_models(text):\n",
"    \"\"\"Add progress markers around checkpoint restore and collect garbage after it.\"\"\"\n",
"    text = text.replace(\"dist.barrier()\",\"dist.barrier(); print('1')\")\n",
"    #text = text.replace(\"checkpoint = t.load(restore, map_location=t.device('cpu'))\",\"checkpoint = t.load(restore, map_location=t.device('cuda')); print('2')\")\n",
"    return text.replace(\".format(restore))\",\".format(restore)); print(3); import gc; gc.collect()\")\n",
"\n",
"\n",
"lepatch(os.path.join(lepkgdir, 'make_models.py'), lepatch_make_models)\n"
],"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["Looking in indexes: https://pypi.org/simple, 
https://us-python.pkg.dev/colab-wheels/public/simple/\n","Collecting git+https://github.com/openai/jukebox.git\n"," Cloning https://github.com/openai/jukebox.git to /tmp/pip-req-build-h_njyndg\n"," Running command git clone -q https://github.com/openai/jukebox.git /tmp/pip-req-build-h_njyndg\n","Collecting fire==0.1.3\n"," Downloading fire-0.1.3.tar.gz (33 kB)\n","Collecting tqdm==4.45.0\n"," Downloading tqdm-4.45.0-py2.py3-none-any.whl (60 kB)\n","\u001b[K |โโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโ| 60 kB 8.0 MB/s \n","\u001b[?25hRequirement already satisfied: soundfile==0.10.3.post1 in /usr/local/lib/python3.7/dist-packages (from jukebox==1.0) (0.10.3.post1)\n","Collecting unidecode==1.1.1\n"," Downloading Unidecode-1.1.1-py2.py3-none-any.whl (238 kB)\n","\u001b[K |โโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโ| 238 kB 2.5 MB/s \n","\u001b[?25hCollecting numba==0.48.0\n"," Downloading numba-0.48.0-1-cp37-cp37m-manylinux2014_x86_64.whl (3.5 MB)\n","\u001b[K |โโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโ| 3.5 MB 45.9 MB/s \n","\u001b[?25hCollecting librosa==0.7.2\n"," Downloading librosa-0.7.2.tar.gz (1.6 MB)\n","\u001b[K |โโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโ| 1.6 MB 55.6 MB/s \n","\u001b[?25hCollecting mpi4py>=3.0.0\n"," Downloading mpi4py-3.1.3.tar.gz (2.5 MB)\n","\u001b[K |โโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโ| 2.5 MB 10.3 MB/s \n","\u001b[?25h Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n"," Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n"," Preparing wheel metadata ... 
\u001b[?25l\u001b[?25hdone\n","Requirement already satisfied: six in /usr/local/lib/python3.7/dist-packages (from fire==0.1.3->jukebox==1.0) (1.15.0)\n","Requirement already satisfied: audioread>=2.0.0 in /usr/local/lib/python3.7/dist-packages (from librosa==0.7.2->jukebox==1.0) (2.1.9)\n","Requirement already satisfied: numpy>=1.15.0 in /usr/local/lib/python3.7/dist-packages (from librosa==0.7.2->jukebox==1.0) (1.21.6)\n","Requirement already satisfied: scipy>=1.0.0 in /usr/local/lib/python3.7/dist-packages (from librosa==0.7.2->jukebox==1.0) (1.7.3)\n","Requirement already satisfied: scikit-learn!=0.19.0,>=0.14.0 in /usr/local/lib/python3.7/dist-packages (from librosa==0.7.2->jukebox==1.0) (1.0.2)\n","Requirement already satisfied: joblib>=0.12 in /usr/local/lib/python3.7/dist-packages (from librosa==0.7.2->jukebox==1.0) (1.1.0)\n","Requirement already satisfied: decorator>=3.0.0 in /usr/local/lib/python3.7/dist-packages (from librosa==0.7.2->jukebox==1.0) (4.4.2)\n","Requirement already satisfied: resampy>=0.2.2 in /usr/local/lib/python3.7/dist-packages (from librosa==0.7.2->jukebox==1.0) (0.3.1)\n","Collecting llvmlite<0.32.0,>=0.31.0dev0\n"," Downloading llvmlite-0.31.0-cp37-cp37m-manylinux1_x86_64.whl (20.2 MB)\n","\u001b[K |โโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโ| 20.2 MB 1.2 MB/s \n","\u001b[?25hRequirement already satisfied: setuptools in /usr/local/lib/python3.7/dist-packages (from numba==0.48.0->jukebox==1.0) (57.4.0)\n","Requirement already satisfied: cffi>=1.0 in /usr/local/lib/python3.7/dist-packages (from soundfile==0.10.3.post1->jukebox==1.0) (1.15.1)\n","Requirement already satisfied: pycparser in /usr/local/lib/python3.7/dist-packages (from cffi>=1.0->soundfile==0.10.3.post1->jukebox==1.0) (2.21)\n","Requirement already satisfied: threadpoolctl>=2.0.0 in /usr/local/lib/python3.7/dist-packages (from scikit-learn!=0.19.0,>=0.14.0->librosa==0.7.2->jukebox==1.0) (3.1.0)\n","Building wheels for collected packages: jukebox, fire, librosa, mpi4py\n"," Building 
wheel for jukebox (setup.py) ... \u001b[?25l\u001b[?25hdone\n"," Created wheel for jukebox: filename=jukebox-1.0-py3-none-any.whl size=197916 sha256=a4b63eeb069c2a8404e81d288f7083cc035f56ab8a00f4eef04a4b2240840813\n"," Stored in directory: /tmp/pip-ephem-wheel-cache-ehxjqqzn/wheels/d6/42/39/91f8a32505a445499702ae0f887769e6bb5030c42382d74ae0\n"," Building wheel for fire (setup.py) ... \u001b[?25l\u001b[?25hdone\n"," Created wheel for fire: filename=fire-0.1.3-py2.py3-none-any.whl size=49719 sha256=19f25e55721603f0bfe989fa8a24048180c9cf309837d070c45026bfc357ef01\n"," Stored in directory: /root/.cache/pip/wheels/dd/c5/df/d9bf8223023d31343b65f1cc57d2dc005610ebbcd2b4a5d1e7\n"," Building wheel for librosa (setup.py) ... \u001b[?25l\u001b[?25hdone\n"," Created wheel for librosa: filename=librosa-0.7.2-py3-none-any.whl size=1612902 sha256=ee1070d1c7a79eb748ec8445304db62ca4a9ed11094d07d544333736259bffa5\n"," Stored in directory: /root/.cache/pip/wheels/18/9e/42/3224f85730f92fa2925f0b4fb6ef7f9c5431a64dfc77b95b39\n"," Building wheel for mpi4py (PEP 517) ... 
\u001b[?25l\u001b[?25hdone\n"," Created wheel for mpi4py: filename=mpi4py-3.1.3-cp37-cp37m-linux_x86_64.whl size=2185270 sha256=605539953018e4e3312369ede372145d3ae621232b86e2e09b5cfd4b45ae7d19\n"," Stored in directory: /root/.cache/pip/wheels/7a/07/14/6a0c63fa2c6e473c6edc40985b7d89f05c61ff25ee7f0ad9ac\n","Successfully built jukebox fire librosa mpi4py\n","Installing collected packages: llvmlite, numba, unidecode, tqdm, mpi4py, librosa, fire, jukebox\n"," Attempting uninstall: llvmlite\n"," Found existing installation: llvmlite 0.39.0\n"," Uninstalling llvmlite-0.39.0:\n"," Successfully uninstalled llvmlite-0.39.0\n"," Attempting uninstall: numba\n"," Found existing installation: numba 0.56.0\n"," Uninstalling numba-0.56.0:\n"," Successfully uninstalled numba-0.56.0\n"," Attempting uninstall: tqdm\n"," Found existing installation: tqdm 4.64.0\n"," Uninstalling tqdm-4.64.0:\n"," Successfully uninstalled tqdm-4.64.0\n"," Attempting uninstall: librosa\n"," Found existing installation: librosa 0.8.1\n"," Uninstalling librosa-0.8.1:\n"," Successfully uninstalled librosa-0.8.1\n","\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. 
This behaviour is the source of the following dependency conflicts.\n","panel 0.12.1 requires tqdm>=4.48.0, but you have tqdm 4.45.0 which is incompatible.\u001b[0m\n","Successfully installed fire-0.1.3 jukebox-1.0 librosa-0.7.2 llvmlite-0.31.0 mpi4py-3.1.3 numba-0.48.0 tqdm-4.45.0 unidecode-1.1.1\n","Cloning into 'jukebox'...\n","remote: Enumerating objects: 932, done.\u001b[K\n","remote: Total 932 (delta 0), reused 0 (delta 0), pack-reused 932\u001b[K\n","Receiving objects: 100% (932/932), 2.75 MiB | 2.89 MiB/s, done.\n","Resolving deltas: 100% (456/456), done.\n","Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n","Collecting av==8.1.0\n"," Downloading av-8.1.0-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (36.1 MB)\n","\u001b[K |โโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโ| 36.1 MB 372 kB/s \n","\u001b[?25hInstalling collected packages: av\n","Successfully installed av-8.1.0\n","Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n","Collecting tensorboardX\n"," Downloading tensorboardX-2.5.1-py2.py3-none-any.whl (125 kB)\n","\u001b[K |โโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโโ| 125 kB 35.7 MB/s \n","\u001b[?25hRequirement already satisfied: protobuf<=3.20.1,>=3.8.0 in /usr/local/lib/python3.7/dist-packages (from tensorboardX) (3.17.3)\n","Requirement already satisfied: numpy in /usr/local/lib/python3.7/dist-packages (from tensorboardX) (1.21.6)\n","Requirement already satisfied: six>=1.9 in /usr/local/lib/python3.7/dist-packages (from protobuf<=3.20.1,>=3.8.0->tensorboardX) (1.15.0)\n","Installing collected packages: tensorboardX\n","Successfully installed tensorboardX-2.5.1\n","/content/gdrive/MyDrive/juke/slon_prior/checkpoint_latest.pth.tar /content/gdrive/MyDrive/slon slon_prior False\n"]}]},{"cell_type":"markdown","metadata":{"id":"NX0gpk1ITSys"},"source":["## 
Prior\n"]},{"cell_type":"code","metadata":{"id":"tCu02U-OTSys","colab":{"base_uri":"https://localhost:8080/"},"outputId":"4e3578b6-c668-4724-9605-a959bccf31c2"},"source":["import gc; gc.collect()\n","\n","lehps = ('vqvae,prior_1b_lyrics,all_fp16,cpu_ema','vqvae,prior_1b_lyrics,'+lepriorname+',all_fp16,cpu_ema')[os.path.isfile(lemodelpath)]\n","print((\"new training model\",lepriorname + \" model found\")[os.path.isfile(lemodelpath)])\n","\n","!python jukebox/jukebox/train.py \\\n","--prior --test --train --aug_shift --aug_blend \\\n","--hps=$lehps \\\n","--save_iters=238 \\\n","--levels=3 \\\n","--level=2 \\\n","--name=$lepriorname \\\n","--sample_length=786432 \\\n","--bs=1 \\\n","--audio_files_dir=$leaudio_files_dir \\\n","--weight_decay=0.01\n","\n"],"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["\u001b[1;30;43mะัั
ะพะดะฝัะต ะดะฐะฝะฝัะต ะฑัะปะธ ะพะฑัะตะทะฐะฝั ะดะพ ะฝะตัะบะพะปัะบะธั
ะฟะพัะปะตะดะฝะธั
ัััะพะบ (5000).\u001b[0m\n"," 69% 4215/6144 [04:19<01:38, 19.57it/s]\u001b[A\n"," 69% 4218/6144 [04:19<01:37, 19.80it/s]\u001b[A\n"," 69% 4220/6144 [04:19<01:37, 19.83it/s]\u001b[A\n"," 69% 4222/6144 [04:19<01:37, 19.68it/s]\u001b[A\n"," 69% 4225/6144 [04:19<01:38, 19.55it/s]\u001b[A\n"," 69% 4227/6144 [04:19<01:38, 19.45it/s]\u001b[A\n"," 69% 4230/6144 [04:19<01:37, 19.69it/s]\u001b[A\n"," 69% 4232/6144 [04:20<01:38, 19.35it/s]\u001b[A\n"," 69% 4235/6144 [04:20<01:37, 19.64it/s]\u001b[A\n"," 69% 4238/6144 [04:20<01:37, 19.60it/s]\u001b[A\n"," 69% 4240/6144 [04:20<01:36, 19.68it/s]\u001b[A\n"," 69% 4242/6144 [04:20<01:36, 19.75it/s]\u001b[A\n"," 69% 4244/6144 [04:20<01:38, 19.28it/s]\u001b[A\n"," 69% 4246/6144 [04:20<01:38, 19.18it/s]\u001b[A\n"," 69% 4249/6144 [04:20<01:37, 19.47it/s]\u001b[A\n"," 69% 4251/6144 [04:21<01:38, 19.23it/s]\u001b[A\n"," 69% 4253/6144 [04:21<01:37, 19.44it/s]\u001b[A\n"," 69% 4256/6144 [04:21<01:37, 19.30it/s]\u001b[A\n"," 69% 4258/6144 [04:21<01:37, 19.39it/s]\u001b[A\n"," 69% 4261/6144 [04:21<01:36, 19.48it/s]\u001b[A\n"," 69% 4263/6144 [04:21<01:40, 18.63it/s]\u001b[A\n"," 69% 4265/6144 [04:21<01:40, 18.65it/s]\u001b[A\n"," 69% 4267/6144 [04:21<01:40, 18.72it/s]\u001b[A\n"," 69% 4269/6144 [04:21<01:38, 19.02it/s]\u001b[A\n"," 70% 4272/6144 [04:22<01:36, 19.31it/s]\u001b[A\n"," 70% 4274/6144 [04:22<01:38, 18.91it/s]\u001b[A\n"," 70% 4276/6144 [04:22<01:37, 19.22it/s]\u001b[A\n"," 70% 4279/6144 [04:22<01:37, 19.04it/s]\u001b[A\n"," 70% 4281/6144 [04:22<01:37, 19.05it/s]\u001b[A\n"," 70% 4283/6144 [04:22<01:36, 19.25it/s]\u001b[A\n"," 70% 4285/6144 [04:22<01:38, 18.90it/s]\u001b[A\n"," 70% 4287/6144 [04:22<01:37, 19.05it/s]\u001b[A\n"," 70% 4290/6144 [04:23<01:36, 19.23it/s]\u001b[A\n"," 70% 4293/6144 [04:23<01:34, 19.53it/s]\u001b[A\n"," 70% 4296/6144 [04:23<01:34, 19.64it/s]\u001b[A\n"," 70% 4298/6144 [04:23<01:34, 19.59it/s]\u001b[A\n"," 70% 4300/6144 [04:23<01:34, 19.43it/s]\u001b[A\n"," 70% 4302/6144 [04:23<01:53, 
16.25it/s]\u001b[A\n"," 70% 4304/6144 [04:23<02:00, 15.23it/s]\u001b[A\n"," 70% 4306/6144 [04:23<02:00, 15.25it/s]\u001b[A\n"," 70% 4308/6144 [04:24<02:01, 15.06it/s]\u001b[A\n"," 70% 4310/6144 [04:24<02:00, 15.18it/s]\u001b[A\n"," 70% 4312/6144 [04:24<02:04, 14.74it/s]\u001b[A\n"," 70% 4314/6144 [04:24<02:04, 14.75it/s]\u001b[A\n"," 70% 4316/6144 [04:24<02:05, 14.55it/s]\u001b[A\n"," 70% 4318/6144 [04:24<02:07, 14.36it/s]\u001b[A\n"," 70% 4320/6144 [04:24<02:05, 14.54it/s]\u001b[A\n"," 70% 4322/6144 [04:25<02:08, 14.23it/s]\u001b[A\n"," 70% 4324/6144 [04:25<02:07, 14.22it/s]\u001b[A\n"," 70% 4326/6144 [04:25<02:06, 14.40it/s]\u001b[A\n"," 70% 4328/6144 [04:25<02:04, 14.64it/s]\u001b[A\n"," 70% 4330/6144 [04:25<02:02, 14.85it/s]\u001b[A\n"," 71% 4332/6144 [04:25<02:00, 14.99it/s]\u001b[A\n"," 71% 4334/6144 [04:25<02:09, 13.98it/s]\u001b[A\n"," 71% 4336/6144 [04:26<02:08, 14.06it/s]\u001b[A\n"," 71% 4338/6144 [04:26<02:04, 14.48it/s]\u001b[A\n"," 71% 4340/6144 [04:26<02:01, 14.82it/s]\u001b[A\n"," 71% 4342/6144 [04:26<02:00, 14.94it/s]\u001b[A\n"," 71% 4344/6144 [04:26<02:00, 14.94it/s]\u001b[A\n"," 71% 4346/6144 [04:26<02:02, 14.73it/s]\u001b[A\n"," 71% 4348/6144 [04:26<02:04, 14.41it/s]\u001b[A\n"," 71% 4350/6144 [04:27<01:57, 15.26it/s]\u001b[A\n"," 71% 4352/6144 [04:27<01:50, 16.23it/s]\u001b[A\n"," 71% 4355/6144 [04:27<01:44, 17.18it/s]\u001b[A\n"," 71% 4357/6144 [04:27<01:41, 17.69it/s]\u001b[A\n"," 71% 4360/6144 [04:27<01:37, 18.37it/s]\u001b[A\n"," 71% 4362/6144 [04:27<01:35, 18.74it/s]\u001b[A\n"," 71% 4364/6144 [04:27<01:34, 18.93it/s]\u001b[A\n"," 71% 4367/6144 [04:27<01:32, 19.28it/s]\u001b[A\n"," 71% 4369/6144 [04:27<01:34, 18.80it/s]\u001b[A\n"," 71% 4372/6144 [04:28<01:32, 19.18it/s]\u001b[A\n"," 71% 4375/6144 [04:28<01:31, 19.31it/s]\u001b[A\n"," 71% 4377/6144 [04:28<01:31, 19.39it/s]\u001b[A\n"," 71% 4380/6144 [04:28<01:30, 19.53it/s]\u001b[A\n"," 71% 4382/6144 [04:28<01:32, 19.10it/s]\u001b[A\n"," 71% 4385/6144 [04:28<01:30, 19.41it/s]\u001b[A\n"," 
71% 4388/6144 [04:28<01:31, 19.21it/s]\u001b[A\n"," 71% 4390/6144 [04:29<01:31, 19.21it/s]\u001b[A\n"," 72% 4393/6144 [04:29<01:29, 19.51it/s]\u001b[A\n"," 72% 4395/6144 [04:29<01:29, 19.53it/s]\u001b[A\n"," 72% 4398/6144 [04:29<01:29, 19.60it/s]\u001b[A\n"," 72% 4400/6144 [04:29<01:29, 19.50it/s]\u001b[A\n"," 72% 4402/6144 [04:29<01:29, 19.49it/s]\u001b[A\n"," 72% 4404/6144 [04:29<01:30, 19.31it/s]\u001b[A\n"," 72% 4407/6144 [04:29<01:29, 19.33it/s]\u001b[A\n"," 72% 4409/6144 [04:30<01:29, 19.45it/s]\u001b[A\n"," 72% 4411/6144 [04:30<01:30, 19.24it/s]\u001b[A\n"," 72% 4414/6144 [04:30<01:28, 19.53it/s]\u001b[A\n"," 72% 4416/6144 [04:30<01:29, 19.35it/s]\u001b[A\n"," 72% 4419/6144 [04:30<01:28, 19.57it/s]\u001b[A\n"," 72% 4421/6144 [04:30<01:27, 19.69it/s]\u001b[A\n"," 72% 4423/6144 [04:30<01:28, 19.45it/s]\u001b[A\n"," 72% 4426/6144 [04:30<01:27, 19.67it/s]\u001b[A\n"," 72% 4428/6144 [04:31<01:29, 19.15it/s]\u001b[A\n"," 72% 4430/6144 [04:31<01:28, 19.33it/s]\u001b[A\n"," 72% 4433/6144 [04:31<01:27, 19.58it/s]\u001b[A\n"," 72% 4435/6144 [04:31<01:29, 19.12it/s]\u001b[A\n"," 72% 4438/6144 [04:31<01:29, 19.12it/s]\u001b[A\n"," 72% 4441/6144 [04:31<01:28, 19.27it/s]\u001b[A\n"," 72% 4443/6144 [04:31<01:27, 19.35it/s]\u001b[A\n"," 72% 4446/6144 [04:31<01:26, 19.57it/s]\u001b[A\n"," 72% 4448/6144 [04:32<01:29, 18.94it/s]\u001b[A\n"," 72% 4451/6144 [04:32<01:27, 19.30it/s]\u001b[A\n"," 72% 4453/6144 [04:32<01:30, 18.78it/s]\u001b[A\n"," 73% 4455/6144 [04:32<01:28, 19.10it/s]\u001b[A\n"," 73% 4458/6144 [04:32<01:26, 19.40it/s]\u001b[A\n"," 73% 4460/6144 [04:32<01:27, 19.32it/s]\u001b[A\n"," 73% 4463/6144 [04:32<01:25, 19.55it/s]\u001b[A\n"," 73% 4465/6144 [04:32<01:27, 19.22it/s]\u001b[A\n"," 73% 4467/6144 [04:33<01:31, 18.30it/s]\u001b[A\n"," 73% 4470/6144 [04:33<01:29, 18.71it/s]\u001b[A\n"," 73% 4472/6144 [04:33<01:27, 19.07it/s]\u001b[A\n"," 73% 4474/6144 [04:33<01:26, 19.32it/s]\u001b[A\n"," 73% 4476/6144 [04:33<01:28, 18.95it/s]\u001b[A\n"," 73% 4478/6144 
[04:33<01:26, 19.22it/s]\u001b[A\n"," 73% 4480/6144 [04:33<01:25, 19.36it/s]\u001b[A\n"," 73% 4482/6144 [04:33<01:26, 19.12it/s]\u001b[A\n"," 73% 4485/6144 [04:33<01:25, 19.38it/s]\u001b[A\n"," 73% 4487/6144 [04:34<01:26, 19.26it/s]\u001b[A\n"," 73% 4489/6144 [04:34<01:26, 19.20it/s]\u001b[A\n"," 73% 4491/6144 [04:34<01:25, 19.34it/s]\u001b[A\n"," 73% 4493/6144 [04:34<01:24, 19.52it/s]\u001b[A\n"," 73% 4495/6144 [04:34<01:26, 19.15it/s]\u001b[A\n"," 73% 4498/6144 [04:34<01:24, 19.38it/s]\u001b[A\n"," 73% 4501/6144 [04:34<01:23, 19.61it/s]\u001b[A\n"," 73% 4503/6144 [04:34<01:24, 19.37it/s]\u001b[A\n"," 73% 4505/6144 [04:34<01:24, 19.41it/s]\u001b[A\n"," 73% 4507/6144 [04:35<01:30, 18.01it/s]\u001b[A\n"," 73% 4509/6144 [04:35<01:28, 18.55it/s]\u001b[A\n"," 73% 4511/6144 [04:35<01:26, 18.82it/s]\u001b[A\n"," 73% 4513/6144 [04:35<01:26, 18.83it/s]\u001b[A\n"," 73% 4515/6144 [04:35<01:25, 19.10it/s]\u001b[A\n"," 74% 4518/6144 [04:35<01:23, 19.40it/s]\u001b[A\n"," 74% 4520/6144 [04:35<01:24, 19.27it/s]\u001b[A\n"," 74% 4522/6144 [04:35<01:23, 19.38it/s]\u001b[A\n"," 74% 4524/6144 [04:35<01:22, 19.54it/s]\u001b[A\n"," 74% 4526/6144 [04:36<01:30, 17.98it/s]\u001b[A\n"," 74% 4528/6144 [04:36<01:37, 16.65it/s]\u001b[A\n"," 74% 4530/6144 [04:36<01:46, 15.20it/s]\u001b[A\n"," 74% 4532/6144 [04:36<01:45, 15.28it/s]\u001b[A\n"," 74% 4534/6144 [04:36<01:44, 15.34it/s]\u001b[A\n"," 74% 4536/6144 [04:36<01:48, 14.87it/s]\u001b[A\n"," 74% 4538/6144 [04:36<01:49, 14.67it/s]\u001b[A\n"," 74% 4540/6144 [04:37<01:49, 14.71it/s]\u001b[A\n"," 74% 4542/6144 [04:37<01:52, 14.22it/s]\u001b[A\n"," 74% 4544/6144 [04:37<01:55, 13.81it/s]\u001b[A\n"," 74% 4546/6144 [04:37<01:56, 13.75it/s]\u001b[A\n"," 74% 4548/6144 [04:37<01:55, 13.85it/s]\u001b[A\n"," 74% 4550/6144 [04:37<01:52, 14.16it/s]\u001b[A\n"," 74% 4552/6144 [04:37<01:49, 14.55it/s]\u001b[A\n"," 74% 4554/6144 [04:38<01:48, 14.66it/s]\u001b[A\n"," 74% 4556/6144 [04:38<01:51, 14.28it/s]\u001b[A\n"," 74% 4558/6144 [04:38<01:51, 
14.23it/s]\u001b[A\n"," 74% 4560/6144 [04:38<01:55, 13.75it/s]\u001b[A\n"," 74% 4562/6144 [04:38<01:53, 13.96it/s]\u001b[A\n"," 74% 4564/6144 [04:38<01:51, 14.15it/s]\u001b[A\n"," 74% 4566/6144 [04:38<01:52, 14.04it/s]\u001b[A\n"," 74% 4568/6144 [04:39<01:51, 14.14it/s]\u001b[A\n"," 74% 4570/6144 [04:39<01:52, 13.96it/s]\u001b[A\n"," 74% 4572/6144 [04:39<01:45, 14.90it/s]\u001b[A\n"," 74% 4575/6144 [04:39<01:39, 15.80it/s]\u001b[A\n"," 74% 4577/6144 [04:39<01:34, 16.66it/s]\u001b[A\n"," 75% 4580/6144 [04:39<01:29, 17.56it/s]\u001b[A\n"," 75% 4582/6144 [04:39<01:26, 18.01it/s]\u001b[A\n"," 75% 4585/6144 [04:40<01:23, 18.58it/s]\u001b[A\n"," 75% 4587/6144 [04:40<01:23, 18.71it/s]\u001b[A\n"," 75% 4589/6144 [04:40<01:22, 18.77it/s]\u001b[A\n"," 75% 4592/6144 [04:40<01:21, 19.10it/s]\u001b[A\n"," 75% 4594/6144 [04:40<01:21, 19.00it/s]\u001b[A\n"," 75% 4596/6144 [04:40<01:20, 19.23it/s]\u001b[A\n"," 75% 4599/6144 [04:40<01:20, 19.31it/s]\u001b[A\n"," 75% 4601/6144 [04:40<01:19, 19.48it/s]\u001b[A\n"," 75% 4604/6144 [04:40<01:18, 19.67it/s]\u001b[A\n"," 75% 4606/6144 [04:41<01:18, 19.51it/s]\u001b[A\n"," 75% 4608/6144 [04:41<01:18, 19.49it/s]\u001b[A\n"," 75% 4610/6144 [04:41<01:19, 19.38it/s]\u001b[A\n"," 75% 4612/6144 [04:41<01:20, 19.14it/s]\u001b[A\n"," 75% 4615/6144 [04:41<01:19, 19.34it/s]\u001b[A\n"," 75% 4617/6144 [04:41<01:19, 19.28it/s]\u001b[A\n"," 75% 4619/6144 [04:41<01:19, 19.29it/s]\u001b[A\n"," 75% 4622/6144 [04:41<01:18, 19.42it/s]\u001b[A\n"," 75% 4624/6144 [04:42<01:18, 19.49it/s]\u001b[A\n"," 75% 4627/6144 [04:42<01:17, 19.69it/s]\u001b[A\n"," 75% 4629/6144 [04:42<01:18, 19.34it/s]\u001b[A\n"," 75% 4631/6144 [04:42<01:17, 19.42it/s]\u001b[A\n"," 75% 4634/6144 [04:42<01:17, 19.40it/s]\u001b[A\n"," 75% 4637/6144 [04:42<01:16, 19.59it/s]\u001b[A\n"," 76% 4640/6144 [04:42<01:16, 19.53it/s]\u001b[A\n"," 76% 4642/6144 [04:42<01:17, 19.49it/s]\u001b[A\n"," 76% 4645/6144 [04:43<01:16, 19.68it/s]\u001b[A\n"," 76% 4647/6144 [04:43<01:16, 19.52it/s]\u001b[A\n"," 
76% 4649/6144 [04:43<01:16, 19.42it/s]\u001b[A\n"," 76% 4652/6144 [04:43<01:17, 19.29it/s]\u001b[A\n"," 76% 4654/6144 [04:43<01:16, 19.40it/s]\u001b[A\n"," 76% 4656/6144 [04:43<01:16, 19.37it/s]\u001b[A\n"," 76% 4658/6144 [04:43<01:17, 19.25it/s]\u001b[A\n"," 76% 4661/6144 [04:43<01:15, 19.52it/s]\u001b[A\n"," 76% 4663/6144 [04:44<01:15, 19.66it/s]\u001b[A\n"," 76% 4665/6144 [04:44<01:16, 19.38it/s]\u001b[A\n"," 76% 4668/6144 [04:44<01:15, 19.60it/s]\u001b[A\n"," 76% 4670/6144 [04:44<01:17, 18.98it/s]\u001b[A\n"," 76% 4673/6144 [04:44<01:16, 19.32it/s]\u001b[A\n"," 76% 4675/6144 [04:44<01:16, 19.29it/s]\u001b[A\n"," 76% 4677/6144 [04:44<01:15, 19.48it/s]\u001b[A\n"," 76% 4680/6144 [04:44<01:14, 19.65it/s]\u001b[A\n"," 76% 4682/6144 [04:45<01:15, 19.30it/s]\u001b[A\n"," 76% 4685/6144 [04:45<01:14, 19.54it/s]\u001b[A\n"," 76% 4687/6144 [04:45<01:15, 19.34it/s]\u001b[A\n"," 76% 4689/6144 [04:45<01:16, 19.14it/s]\u001b[A\n"," 76% 4692/6144 [04:45<01:15, 19.23it/s]\u001b[A\n"," 76% 4694/6144 [04:45<01:17, 18.67it/s]\u001b[A\n"," 76% 4696/6144 [04:45<01:16, 19.04it/s]\u001b[A\n"," 76% 4698/6144 [04:45<01:14, 19.30it/s]\u001b[A\n"," 76% 4700/6144 [04:45<01:14, 19.33it/s]\u001b[A\n"," 77% 4702/6144 [04:46<01:15, 19.20it/s]\u001b[A\n"," 77% 4705/6144 [04:46<01:13, 19.46it/s]\u001b[A\n"," 77% 4707/6144 [04:46<01:13, 19.43it/s]\u001b[A\n"," 77% 4709/6144 [04:46<01:14, 19.24it/s]\u001b[A\n"," 77% 4712/6144 [04:46<01:14, 19.23it/s]\u001b[A\n"," 77% 4715/6144 [04:46<01:13, 19.39it/s]\u001b[A\n"," 77% 4717/6144 [04:46<01:13, 19.45it/s]\u001b[A\n"," 77% 4719/6144 [04:46<01:14, 19.05it/s]\u001b[A\n"," 77% 4721/6144 [04:47<01:13, 19.31it/s]\u001b[A\n"," 77% 4723/6144 [04:47<01:13, 19.31it/s]\u001b[A\n"," 77% 4725/6144 [04:47<01:13, 19.20it/s]\u001b[A\n"," 77% 4727/6144 [04:47<01:12, 19.43it/s]\u001b[A\n"," 77% 4729/6144 [04:47<01:14, 18.90it/s]\u001b[A\n"," 77% 4731/6144 [04:47<01:14, 18.98it/s]\u001b[A\n"," 77% 4734/6144 [04:47<01:13, 19.30it/s]\u001b[A\n"," 77% 4736/6144 
[04:47<01:14, 18.99it/s]\u001b[A\n"," 77% 4738/6144 [04:47<01:13, 19.19it/s]\u001b[A\n"," 77% 4740/6144 [04:48<01:12, 19.42it/s]\u001b[A\n"," 77% 4742/6144 [04:48<01:12, 19.39it/s]\u001b[A\n"," 77% 4745/6144 [04:48<01:11, 19.60it/s]\u001b[A\n"," 77% 4747/6144 [04:48<01:14, 18.80it/s]\u001b[A\n"," 77% 4749/6144 [04:48<01:14, 18.82it/s]\u001b[A\n"," 77% 4751/6144 [04:48<01:23, 16.66it/s]\u001b[A\n"," 77% 4753/6144 [04:48<01:29, 15.63it/s]\u001b[A\n"," 77% 4755/6144 [04:48<01:28, 15.61it/s]\u001b[A\n"," 77% 4757/6144 [04:49<01:28, 15.63it/s]\u001b[A\n"," 77% 4759/6144 [04:49<01:29, 15.55it/s]\u001b[A\n"," 77% 4761/6144 [04:49<01:30, 15.26it/s]\u001b[A\n"," 78% 4763/6144 [04:49<01:32, 15.01it/s]\u001b[A\n"," 78% 4765/6144 [04:49<01:32, 14.98it/s]\u001b[A\n"," 78% 4767/6144 [04:49<01:30, 15.14it/s]\u001b[A\n"," 78% 4769/6144 [04:49<01:31, 15.10it/s]\u001b[A\n"," 78% 4771/6144 [04:49<01:33, 14.61it/s]\u001b[A\n"," 78% 4773/6144 [04:50<01:40, 13.60it/s]\u001b[A\n"," 78% 4775/6144 [04:50<01:37, 14.08it/s]\u001b[A\n"," 78% 4777/6144 [04:50<01:35, 14.38it/s]\u001b[A\n"," 78% 4779/6144 [04:50<01:36, 14.19it/s]\u001b[A\n"," 78% 4781/6144 [04:50<01:35, 14.31it/s]\u001b[A\n"," 78% 4783/6144 [04:50<01:36, 14.11it/s]\u001b[A\n"," 78% 4785/6144 [04:50<01:34, 14.41it/s]\u001b[A\n"," 78% 4787/6144 [04:51<01:32, 14.74it/s]\u001b[A\n"," 78% 4789/6144 [04:51<01:30, 15.00it/s]\u001b[A\n"," 78% 4791/6144 [04:51<01:29, 15.08it/s]\u001b[A\n"," 78% 4793/6144 [04:51<01:31, 14.72it/s]\u001b[A\n"," 78% 4795/6144 [04:51<01:32, 14.61it/s]\u001b[A\n"," 78% 4797/6144 [04:51<01:32, 14.55it/s]\u001b[A\n"," 78% 4799/6144 [04:51<01:26, 15.57it/s]\u001b[A\n"," 78% 4802/6144 [04:52<01:20, 16.68it/s]\u001b[A\n"," 78% 4804/6144 [04:52<01:17, 17.34it/s]\u001b[A\n"," 78% 4807/6144 [04:52<01:14, 17.93it/s]\u001b[A\n"," 78% 4809/6144 [04:52<01:13, 18.19it/s]\u001b[A\n"," 78% 4811/6144 [04:52<01:12, 18.45it/s]\u001b[A\n"," 78% 4813/6144 [04:52<01:11, 18.51it/s]\u001b[A\n"," 78% 4816/6144 [04:52<01:10, 
18.95it/s]\u001b[A\n"," 78% 4818/6144 [04:52<01:09, 19.03it/s]\u001b[A\n"," 78% 4821/6144 [04:53<01:08, 19.35it/s]\u001b[A\n"," 78% 4823/6144 [04:53<01:08, 19.26it/s]\u001b[A\n"," 79% 4826/6144 [04:53<01:07, 19.52it/s]\u001b[A\n"," 79% 4828/6144 [04:53<01:07, 19.59it/s]\u001b[A\n"," 79% 4830/6144 [04:53<01:07, 19.55it/s]\u001b[A\n"," 79% 4832/6144 [04:53<01:08, 19.29it/s]\u001b[A\n"," 79% 4834/6144 [04:53<01:08, 19.22it/s]\u001b[A\n"," 79% 4837/6144 [04:53<01:07, 19.45it/s]\u001b[A\n"," 79% 4840/6144 [04:54<01:07, 19.38it/s]\u001b[A\n"," 79% 4843/6144 [04:54<01:06, 19.49it/s]\u001b[A\n"," 79% 4846/6144 [04:54<01:06, 19.48it/s]\u001b[A\n"," 79% 4849/6144 [04:54<01:05, 19.65it/s]\u001b[A\n"," 79% 4851/6144 [04:54<01:06, 19.42it/s]\u001b[A\n"," 79% 4853/6144 [04:54<01:07, 19.23it/s]\u001b[A\n"," 79% 4855/6144 [04:54<01:06, 19.42it/s]\u001b[A\n"," 79% 4857/6144 [04:54<01:05, 19.54it/s]\u001b[A\n"," 79% 4859/6144 [04:54<01:06, 19.42it/s]\u001b[A\n"," 79% 4861/6144 [04:55<01:05, 19.58it/s]\u001b[A\n"," 79% 4864/6144 [04:55<01:05, 19.47it/s]\u001b[A\n"," 79% 4866/6144 [04:55<01:05, 19.59it/s]\u001b[A\n"," 79% 4868/6144 [04:55<01:05, 19.54it/s]\u001b[A\n"," 79% 4870/6144 [04:55<01:05, 19.35it/s]\u001b[A\n"," 79% 4872/6144 [04:55<01:06, 19.12it/s]\u001b[A\n"," 79% 4875/6144 [04:55<01:05, 19.25it/s]\u001b[A\n"," 79% 4878/6144 [04:55<01:05, 19.22it/s]\u001b[A\n"," 79% 4881/6144 [04:56<01:06, 18.91it/s]\u001b[A\n"," 79% 4883/6144 [04:56<01:07, 18.72it/s]\u001b[A\n"," 80% 4885/6144 [04:56<01:05, 19.08it/s]\u001b[A\n"," 80% 4887/6144 [04:56<01:06, 18.89it/s]\u001b[A\n"," 80% 4889/6144 [04:56<01:05, 19.15it/s]\u001b[A\n"," 80% 4891/6144 [04:56<01:05, 18.99it/s]\u001b[A\n"," 80% 4893/6144 [04:56<01:05, 19.06it/s]\u001b[A\n"," 80% 4896/6144 [04:56<01:04, 19.35it/s]\u001b[A\n"," 80% 4898/6144 [04:57<01:04, 19.40it/s]\u001b[A\n"," 80% 4900/6144 [04:57<01:03, 19.48it/s]\u001b[A\n"," 80% 4903/6144 [04:57<01:03, 19.65it/s]\u001b[A\n"," 80% 4905/6144 [04:57<01:03, 19.53it/s]\u001b[A\n"," 
80% 4907/6144 [04:57<01:02, 19.66it/s]\u001b[A\n"," 80% 4909/6144 [04:57<01:02, 19.76it/s]\u001b[A\n"," 80% 4911/6144 [04:57<01:04, 19.18it/s]\u001b[A\n"," 80% 4913/6144 [04:57<01:03, 19.31it/s]\u001b[A\n"," 80% 4915/6144 [04:57<01:03, 19.43it/s]\u001b[A\n"," 80% 4917/6144 [04:57<01:03, 19.24it/s]\u001b[A\n"," 80% 4919/6144 [04:58<01:02, 19.45it/s]\u001b[A\n"," 80% 4921/6144 [04:58<01:03, 19.30it/s]\u001b[A\n"," 80% 4923/6144 [04:58<01:02, 19.49it/s]\u001b[A\n"," 80% 4925/6144 [04:58<01:02, 19.59it/s]\u001b[A\n"," 80% 4927/6144 [04:58<01:03, 19.22it/s]\u001b[A\n"," 80% 4929/6144 [04:58<01:02, 19.40it/s]\u001b[A\n"," 80% 4931/6144 [04:58<01:03, 19.03it/s]\u001b[A\n"," 80% 4933/6144 [04:58<01:03, 18.99it/s]\u001b[A\n"," 80% 4935/6144 [04:58<01:02, 19.28it/s]\u001b[A\n"," 80% 4937/6144 [04:59<01:01, 19.47it/s]\u001b[A\n"," 80% 4939/6144 [04:59<01:03, 19.08it/s]\u001b[A\n"," 80% 4942/6144 [04:59<01:02, 19.24it/s]\u001b[A\n"," 80% 4944/6144 [04:59<01:04, 18.53it/s]\u001b[A\n"," 81% 4946/6144 [04:59<01:03, 18.92it/s]\u001b[A\n"," 81% 4948/6144 [04:59<01:02, 19.13it/s]\u001b[A\n"," 81% 4950/6144 [04:59<01:04, 18.52it/s]\u001b[A\n"," 81% 4952/6144 [04:59<01:03, 18.84it/s]\u001b[A\n"," 81% 4954/6144 [04:59<01:02, 19.15it/s]\u001b[A\n"," 81% 4956/6144 [05:00<01:02, 19.15it/s]\u001b[A\n"," 81% 4958/6144 [05:00<01:01, 19.24it/s]\u001b[A\n"," 81% 4960/6144 [05:00<01:01, 19.39it/s]\u001b[A\n"," 81% 4962/6144 [05:00<01:01, 19.28it/s]\u001b[A\n"," 81% 4964/6144 [05:00<01:01, 19.29it/s]\u001b[A\n"," 81% 4967/6144 [05:00<01:00, 19.50it/s]\u001b[A\n"," 81% 4969/6144 [05:00<01:02, 18.83it/s]\u001b[A\n"," 81% 4972/6144 [05:00<01:02, 18.78it/s]\u001b[A\n"," 81% 4974/6144 [05:00<01:08, 17.01it/s]\u001b[A\n"," 81% 4976/6144 [05:01<01:12, 16.13it/s]\u001b[A\n"," 81% 4978/6144 [05:01<01:12, 15.99it/s]\u001b[A\n"," 81% 4980/6144 [05:01<01:12, 15.95it/s]\u001b[A\n"," 81% 4982/6144 [05:01<01:14, 15.65it/s]\u001b[A\n"," 81% 4984/6144 [05:01<01:14, 15.62it/s]\u001b[A\n"," 81% 4986/6144 
[05:01<01:16, 15.09it/s]\u001b[A\n"," 81% 4988/6144 [05:01<01:19, 14.59it/s]\u001b[A\n"," 81% 4990/6144 [05:02<01:18, 14.66it/s]\u001b[A\n"," 81% 4992/6144 [05:02<01:17, 14.87it/s]\u001b[A\n"," 81% 4994/6144 [05:02<01:22, 13.90it/s]\u001b[A\n"," 81% 4996/6144 [05:02<01:20, 14.31it/s]\u001b[A\n"," 81% 4998/6144 [05:02<01:18, 14.54it/s]\u001b[A\n"," 81% 5000/6144 [05:02<01:20, 14.13it/s]\u001b[A\n"," 81% 5002/6144 [05:02<01:18, 14.54it/s]\u001b[A\n"," 81% 5004/6144 [05:03<01:17, 14.63it/s]\u001b[A\n"," 81% 5006/6144 [05:03<01:19, 14.37it/s]\u001b[A\n"," 82% 5008/6144 [05:03<01:19, 14.25it/s]\u001b[A\n"," 82% 5010/6144 [05:03<01:18, 14.43it/s]\u001b[A\n"," 82% 5012/6144 [05:03<01:17, 14.60it/s]\u001b[A\n"," 82% 5014/6144 [05:03<01:20, 13.98it/s]\u001b[A\n"," 82% 5016/6144 [05:03<01:21, 13.81it/s]\u001b[A\n"," 82% 5018/6144 [05:04<01:20, 13.99it/s]\u001b[A\n"," 82% 5020/6144 [05:04<01:15, 14.84it/s]\u001b[A\n"," 82% 5022/6144 [05:04<01:09, 16.04it/s]\u001b[A\n"," 82% 5024/6144 [05:04<01:07, 16.66it/s]\u001b[A\n"," 82% 5026/6144 [05:04<01:03, 17.51it/s]\u001b[A\n"," 82% 5028/6144 [05:04<01:02, 17.99it/s]\u001b[A\n"," 82% 5030/6144 [05:04<01:00, 18.39it/s]\u001b[A\n"," 82% 5033/6144 [05:04<00:59, 18.61it/s]\u001b[A\n"," 82% 5035/6144 [05:04<00:59, 18.79it/s]\u001b[A\n"," 82% 5037/6144 [05:05<00:58, 19.08it/s]\u001b[A\n"," 82% 5040/6144 [05:05<00:57, 19.36it/s]\u001b[A\n"," 82% 5042/6144 [05:05<00:57, 19.10it/s]\u001b[A\n"," 82% 5044/6144 [05:05<00:56, 19.36it/s]\u001b[A\n"," 82% 5046/6144 [05:05<00:56, 19.54it/s]\u001b[A\n"," 82% 5048/6144 [05:05<00:56, 19.34it/s]\u001b[A\n"," 82% 5050/6144 [05:05<00:56, 19.52it/s]\u001b[A\n"," 82% 5052/6144 [05:05<00:55, 19.65it/s]\u001b[A\n"," 82% 5054/6144 [05:05<00:57, 18.98it/s]\u001b[A\n"," 82% 5056/6144 [05:06<00:56, 19.23it/s]\u001b[A\n"," 82% 5058/6144 [05:06<00:55, 19.44it/s]\u001b[A\n"," 82% 5060/6144 [05:06<00:56, 19.32it/s]\u001b[A\n"," 82% 5062/6144 [05:06<00:55, 19.50it/s]\u001b[A\n"," 82% 5064/6144 [05:06<00:55, 
19.57it/s]\u001b[A\n"," 82% 5066/6144 [05:06<00:55, 19.30it/s]\u001b[A\n"," 82% 5068/6144 [05:06<00:56, 18.92it/s]\u001b[A\n"," 83% 5070/6144 [05:06<00:55, 19.18it/s]\u001b[A\n"," 83% 5072/6144 [05:06<00:55, 19.23it/s]\u001b[A\n"," 83% 5074/6144 [05:06<00:56, 18.86it/s]\u001b[A\n"," 83% 5077/6144 [05:07<00:55, 19.19it/s]\u001b[A\n"," 83% 5079/6144 [05:07<00:55, 19.17it/s]\u001b[A\n"," 83% 5082/6144 [05:07<00:54, 19.41it/s]\u001b[A\n"," 83% 5084/6144 [05:07<00:55, 19.21it/s]\u001b[A\n"," 83% 5086/6144 [05:07<00:54, 19.41it/s]\u001b[A\n"," 83% 5088/6144 [05:07<00:53, 19.58it/s]\u001b[A\n"," 83% 5090/6144 [05:07<00:54, 19.23it/s]\u001b[A\n"," 83% 5092/6144 [05:07<00:54, 19.14it/s]\u001b[A\n"," 83% 5094/6144 [05:07<00:54, 19.34it/s]\u001b[A\n"," 83% 5096/6144 [05:08<00:54, 19.17it/s]\u001b[A\n"," 83% 5098/6144 [05:08<00:53, 19.40it/s]\u001b[A\n"," 83% 5100/6144 [05:08<00:53, 19.56it/s]\u001b[A\n"," 83% 5102/6144 [05:08<00:54, 19.28it/s]\u001b[A\n"," 83% 5104/6144 [05:08<00:53, 19.48it/s]\u001b[A\n"," 83% 5106/6144 [05:08<00:53, 19.52it/s]\u001b[A\n"," 83% 5108/6144 [05:08<00:53, 19.25it/s]\u001b[A\n"," 83% 5110/6144 [05:08<00:53, 19.43it/s]\u001b[A\n"," 83% 5112/6144 [05:08<00:53, 19.24it/s]\u001b[A\n"," 83% 5114/6144 [05:09<00:53, 19.08it/s]\u001b[A\n"," 83% 5116/6144 [05:09<00:53, 19.12it/s]\u001b[A\n"," 83% 5118/6144 [05:09<00:53, 19.32it/s]\u001b[A\n"," 83% 5120/6144 [05:09<00:53, 19.11it/s]\u001b[A\n"," 83% 5122/6144 [05:09<00:52, 19.29it/s]\u001b[A\n"," 83% 5124/6144 [05:09<00:52, 19.45it/s]\u001b[A\n"," 83% 5126/6144 [05:09<00:53, 19.17it/s]\u001b[A\n"," 83% 5128/6144 [05:09<00:53, 19.15it/s]\u001b[A\n"," 83% 5130/6144 [05:09<00:53, 19.11it/s]\u001b[A\n"," 84% 5132/6144 [05:09<00:55, 18.30it/s]\u001b[A\n"," 84% 5134/6144 [05:10<00:54, 18.58it/s]\u001b[A\n"," 84% 5136/6144 [05:10<00:53, 18.95it/s]\u001b[A\n"," 84% 5138/6144 [05:10<00:54, 18.57it/s]\u001b[A\n"," 84% 5140/6144 [05:10<00:53, 18.70it/s]\u001b[A\n"," 84% 5142/6144 [05:10<00:52, 19.02it/s]\u001b[A\n"," 
84% 5144/6144 [05:10<00:52, 18.90it/s]\u001b[A\n"," 84% 5146/6144 [05:10<00:51, 19.21it/s]\u001b[A\n"," 84% 5148/6144 [05:10<00:51, 19.40it/s]\u001b[A\n"," 84% 5150/6144 [05:10<00:51, 19.39it/s]\u001b[A\n"," 84% 5152/6144 [05:11<00:51, 19.23it/s]\u001b[A\n"," 84% 5154/6144 [05:11<00:50, 19.41it/s]\u001b[A\n"," 84% 5156/6144 [05:11<00:51, 19.34it/s]\u001b[A\n"," 84% 5158/6144 [05:11<00:50, 19.53it/s]\u001b[A\n"," 84% 5160/6144 [05:11<00:50, 19.65it/s]\u001b[A\n"," 84% 5162/6144 [05:11<00:50, 19.37it/s]\u001b[A\n"," 84% 5164/6144 [05:11<00:50, 19.54it/s]\u001b[A\n"," 84% 5166/6144 [05:11<00:49, 19.63it/s]\u001b[A\n"," 84% 5168/6144 [05:11<00:50, 19.41it/s]\u001b[A\n"," 84% 5170/6144 [05:11<00:50, 19.46it/s]\u001b[A\n"," 84% 5172/6144 [05:12<00:50, 19.21it/s]\u001b[A\n"," 84% 5174/6144 [05:12<00:50, 19.06it/s]\u001b[A\n"," 84% 5176/6144 [05:12<00:50, 19.31it/s]\u001b[A\n"," 84% 5178/6144 [05:12<00:49, 19.35it/s]\u001b[A\n"," 84% 5180/6144 [05:12<00:50, 19.05it/s]\u001b[A\n"," 84% 5182/6144 [05:12<00:50, 19.24it/s]\u001b[A\n"," 84% 5184/6144 [05:12<00:49, 19.23it/s]\u001b[A\n"," 84% 5186/6144 [05:12<00:49, 19.31it/s]\u001b[A\n"," 84% 5188/6144 [05:12<00:49, 19.46it/s]\u001b[A\n"," 84% 5190/6144 [05:12<00:51, 18.66it/s]\u001b[A\n"," 85% 5192/6144 [05:13<00:50, 18.87it/s]\u001b[A\n"," 85% 5194/6144 [05:13<00:50, 18.96it/s]\u001b[A\n"," 85% 5196/6144 [05:13<00:51, 18.26it/s]\u001b[A\n"," 85% 5198/6144 [05:13<00:57, 16.57it/s]\u001b[A\n"," 85% 5200/6144 [05:13<01:01, 15.30it/s]\u001b[A\n"," 85% 5202/6144 [05:13<01:02, 15.16it/s]\u001b[A\n"," 85% 5204/6144 [05:13<01:02, 15.13it/s]\u001b[A\n"," 85% 5206/6144 [05:14<01:03, 14.87it/s]\u001b[A\n"," 85% 5208/6144 [05:14<01:03, 14.82it/s]\u001b[A\n"," 85% 5210/6144 [05:14<01:03, 14.69it/s]\u001b[A\n"," 85% 5212/6144 [05:14<01:02, 14.88it/s]\u001b[A\n"," 85% 5214/6144 [05:14<01:02, 15.00it/s]\u001b[A\n"," 85% 5216/6144 [05:14<01:01, 15.06it/s]\u001b[A\n"," 85% 5218/6144 [05:14<01:03, 14.61it/s]\u001b[A\n"," 85% 5220/6144 
[05:14<01:03, 14.65it/s]\u001b[A\n"," 85% 5222/6144 [05:15<01:02, 14.78it/s]\u001b[A\n"," 85% 5224/6144 [05:15<01:01, 15.08it/s]\u001b[A\n"," 85% 5226/6144 [05:15<01:02, 14.68it/s]\u001b[A\n"," 85% 5228/6144 [05:15<01:01, 14.94it/s]\u001b[A\n"," 85% 5230/6144 [05:15<01:01, 14.82it/s]\u001b[A\n"," 85% 5232/6144 [05:15<01:02, 14.60it/s]\u001b[A\n"," 85% 5234/6144 [05:15<01:01, 14.88it/s]\u001b[A\n"," 85% 5236/6144 [05:16<00:59, 15.15it/s]\u001b[A\n"," 85% 5238/6144 [05:16<01:01, 14.69it/s]\u001b[A\n"," 85% 5240/6144 [05:16<01:00, 14.94it/s]\u001b[A\n"," 85% 5242/6144 [05:16<01:01, 14.64it/s]\u001b[A\n"," 85% 5244/6144 [05:16<01:00, 14.81it/s]\u001b[A\n"," 85% 5246/6144 [05:16<00:57, 15.62it/s]\u001b[A\n"," 85% 5248/6144 [05:16<00:53, 16.70it/s]\u001b[A\n"," 85% 5250/6144 [05:16<00:51, 17.32it/s]\u001b[A\n"," 85% 5252/6144 [05:17<00:49, 18.04it/s]\u001b[A\n"," 86% 5254/6144 [05:17<00:47, 18.55it/s]\u001b[A\n"," 86% 5256/6144 [05:17<00:48, 18.45it/s]\u001b[A\n"," 86% 5258/6144 [05:17<00:47, 18.80it/s]\u001b[A\n"," 86% 5260/6144 [05:17<00:46, 19.10it/s]\u001b[A\n"," 86% 5262/6144 [05:17<00:46, 18.92it/s]\u001b[A\n"," 86% 5264/6144 [05:17<00:45, 19.21it/s]\u001b[A\n"," 86% 5266/6144 [05:17<00:45, 19.42it/s]\u001b[A\n"," 86% 5268/6144 [05:17<00:45, 19.21it/s]\u001b[A\n"," 86% 5270/6144 [05:17<00:45, 19.30it/s]\u001b[A\n"," 86% 5272/6144 [05:18<00:45, 19.09it/s]\u001b[A\n"," 86% 5274/6144 [05:18<00:46, 18.63it/s]\u001b[A\n"," 86% 5276/6144 [05:18<00:46, 18.61it/s]\u001b[A\n"," 86% 5278/6144 [05:18<00:45, 18.94it/s]\u001b[A\n"," 86% 5280/6144 [05:18<00:45, 18.89it/s]\u001b[A\n"," 86% 5282/6144 [05:18<00:45, 19.13it/s]\u001b[A\n"," 86% 5284/6144 [05:18<00:44, 19.13it/s]\u001b[A\n"," 86% 5286/6144 [05:18<00:45, 18.97it/s]\u001b[A\n"," 86% 5288/6144 [05:18<00:44, 19.24it/s]\u001b[A\n"," 86% 5290/6144 [05:18<00:44, 19.34it/s]\u001b[A\n"," 86% 5292/6144 [05:19<00:43, 19.47it/s]\u001b[A\n"," 86% 5294/6144 [05:19<00:44, 19.22it/s]\u001b[A\n"," 86% 5296/6144 [05:19<00:43, 
19.42it/s]\u001b[A\n"," 86% 5298/6144 [05:19<00:43, 19.45it/s]\u001b[A\n"," 86% 5300/6144 [05:19<00:43, 19.53it/s]\u001b[A\n"," 86% 5302/6144 [05:19<00:43, 19.55it/s]\u001b[A\n"," 86% 5304/6144 [05:19<00:43, 19.38it/s]\u001b[A\n"," 86% 5306/6144 [05:19<00:43, 19.48it/s]\u001b[A\n"," 86% 5308/6144 [05:19<00:42, 19.60it/s]\u001b[A\n"," 86% 5310/6144 [05:20<00:42, 19.41it/s]\u001b[A\n"," 86% 5312/6144 [05:20<00:42, 19.48it/s]\u001b[A\n"," 86% 5314/6144 [05:20<00:43, 19.30it/s]\u001b[A\n"," 87% 5316/6144 [05:20<00:43, 19.17it/s]\u001b[A\n"," 87% 5318/6144 [05:20<00:42, 19.24it/s]\u001b[A\n"," 87% 5320/6144 [05:20<00:42, 19.30it/s]\u001b[A\n"," 87% 5322/6144 [05:20<00:43, 19.03it/s]\u001b[A\n"," 87% 5324/6144 [05:20<00:42, 19.21it/s]\u001b[A\n"," 87% 5326/6144 [05:20<00:42, 19.38it/s]\u001b[A\n"," 87% 5328/6144 [05:20<00:42, 19.16it/s]\u001b[A\n"," 87% 5330/6144 [05:21<00:42, 19.30it/s]\u001b[A\n"," 87% 5332/6144 [05:21<00:41, 19.45it/s]\u001b[A\n"," 87% 5334/6144 [05:21<00:43, 18.79it/s]\u001b[A\n"," 87% 5336/6144 [05:21<00:42, 18.97it/s]\u001b[A\n"," 87% 5338/6144 [05:21<00:42, 19.13it/s]\u001b[A\n"," 87% 5340/6144 [05:21<00:42, 18.98it/s]\u001b[A\n"," 87% 5342/6144 [05:21<00:41, 19.23it/s]\u001b[A\n"," 87% 5344/6144 [05:21<00:41, 19.42it/s]\u001b[A\n"," 87% 5346/6144 [05:21<00:41, 19.18it/s]\u001b[A\n"," 87% 5348/6144 [05:22<00:41, 19.30it/s]\u001b[A\n"," 87% 5350/6144 [05:22<00:40, 19.45it/s]\u001b[A\n"," 87% 5352/6144 [05:22<00:41, 19.28it/s]\u001b[A\n"," 87% 5354/6144 [05:22<00:41, 19.21it/s]\u001b[A\n"," 87% 5356/6144 [05:22<00:41, 19.02it/s]\u001b[A\n"," 87% 5358/6144 [05:22<00:41, 19.14it/s]\u001b[A\n"," 87% 5360/6144 [05:22<00:40, 19.28it/s]\u001b[A\n"," 87% 5362/6144 [05:22<00:41, 19.06it/s]\u001b[A\n"," 87% 5364/6144 [05:22<00:40, 19.24it/s]\u001b[A\n"," 87% 5366/6144 [05:22<00:40, 19.32it/s]\u001b[A\n"," 87% 5368/6144 [05:23<00:40, 19.25it/s]\u001b[A\n"," 87% 5370/6144 [05:23<00:39, 19.36it/s]\u001b[A\n"," 87% 5372/6144 [05:23<00:39, 19.51it/s]\u001b[A\n"," 
87% 5374/6144 [05:23<00:40, 18.82it/s]\u001b[A\n"," 88% 5376/6144 [05:23<00:40, 19.14it/s]\u001b[A\n"," 88% 5378/6144 [05:23<00:39, 19.31it/s]\u001b[A\n"," 88% 5380/6144 [05:23<00:41, 18.57it/s]\u001b[A\n"," 88% 5382/6144 [05:23<00:40, 18.93it/s]\u001b[A\n"," 88% 5384/6144 [05:23<00:39, 19.11it/s]\u001b[A\n"," 88% 5386/6144 [05:23<00:39, 19.03it/s]\u001b[A\n"," 88% 5388/6144 [05:24<00:39, 19.24it/s]\u001b[A\n"," 88% 5390/6144 [05:24<00:39, 19.29it/s]\u001b[A\n"," 88% 5392/6144 [05:24<00:40, 18.80it/s]\u001b[A\n"," 88% 5394/6144 [05:24<00:39, 19.02it/s]\u001b[A\n"," 88% 5396/6144 [05:24<00:38, 19.22it/s]\u001b[A\n"," 88% 5398/6144 [05:24<00:39, 18.98it/s]\u001b[A\n"," 88% 5400/6144 [05:24<00:38, 19.20it/s]\u001b[A\n"," 88% 5402/6144 [05:24<00:38, 19.37it/s]\u001b[A\n"," 88% 5404/6144 [05:24<00:38, 19.09it/s]\u001b[A\n"," 88% 5406/6144 [05:25<00:38, 19.17it/s]\u001b[A\n"," 88% 5408/6144 [05:25<00:38, 19.34it/s]\u001b[A\n"," 88% 5410/6144 [05:25<00:38, 18.99it/s]\u001b[A\n"," 88% 5412/6144 [05:25<00:39, 18.73it/s]\u001b[A\n"," 88% 5414/6144 [05:25<00:39, 18.71it/s]\u001b[A\n"," 88% 5416/6144 [05:25<00:39, 18.60it/s]\u001b[A\n"," 88% 5418/6144 [05:25<00:43, 16.62it/s]\u001b[A\n"," 88% 5420/6144 [05:25<00:45, 15.98it/s]\u001b[A\n"," 88% 5422/6144 [05:25<00:46, 15.61it/s]\u001b[A\n"," 88% 5424/6144 [05:26<00:45, 15.67it/s]\u001b[A\n"," 88% 5426/6144 [05:26<00:45, 15.66it/s]\u001b[A\n"," 88% 5428/6144 [05:26<00:47, 15.15it/s]\u001b[A\n"," 88% 5430/6144 [05:26<00:47, 14.91it/s]\u001b[A\n"," 88% 5432/6144 [05:26<00:48, 14.77it/s]\u001b[A\n"," 88% 5434/6144 [05:26<00:47, 14.83it/s]\u001b[A\n"," 88% 5436/6144 [05:26<00:47, 15.02it/s]\u001b[A\n"," 89% 5438/6144 [05:27<00:47, 14.91it/s]\u001b[A\n"," 89% 5440/6144 [05:27<00:47, 14.67it/s]\u001b[A\n"," 89% 5442/6144 [05:27<00:50, 13.79it/s]\u001b[A\n"," 89% 5444/6144 [05:27<00:50, 13.95it/s]\u001b[A\n"," 89% 5446/6144 [05:27<00:48, 14.36it/s]\u001b[A\n"," 89% 5448/6144 [05:27<00:47, 14.72it/s]\u001b[A\n"," 89% 5450/6144 
[05:27<00:46, 14.95it/s]\u001b[A\n"," 89% 5452/6144 [05:28<00:48, 14.34it/s]\u001b[A\n"," 89% 5454/6144 [05:28<00:46, 14.70it/s]\u001b[A\n"," 89% 5456/6144 [05:28<00:45, 14.96it/s]\u001b[A\n"," 89% 5458/6144 [05:28<00:47, 14.46it/s]\u001b[A\n"," 89% 5460/6144 [05:28<00:48, 14.20it/s]\u001b[A\n"," 89% 5462/6144 [05:28<00:49, 13.89it/s]\u001b[A\n"," 89% 5464/6144 [05:28<00:48, 13.95it/s]\u001b[A\n"," 89% 5466/6144 [05:29<00:45, 14.77it/s]\u001b[A\n"," 89% 5468/6144 [05:29<00:43, 15.66it/s]\u001b[A\n"," 89% 5470/6144 [05:29<00:40, 16.64it/s]\u001b[A\n"," 89% 5472/6144 [05:29<00:38, 17.44it/s]\u001b[A\n"," 89% 5474/6144 [05:29<00:37, 17.70it/s]\u001b[A\n"," 89% 5476/6144 [05:29<00:37, 17.92it/s]\u001b[A\n"," 89% 5478/6144 [05:29<00:36, 18.35it/s]\u001b[A\n"," 89% 5480/6144 [05:29<00:35, 18.52it/s]\u001b[A\n"," 89% 5482/6144 [05:29<00:35, 18.72it/s]\u001b[A\n"," 89% 5484/6144 [05:29<00:34, 19.04it/s]\u001b[A\n"," 89% 5486/6144 [05:30<00:34, 18.85it/s]\u001b[A\n"," 89% 5488/6144 [05:30<00:34, 19.03it/s]\u001b[A\n"," 89% 5490/6144 [05:30<00:34, 19.24it/s]\u001b[A\n"," 89% 5492/6144 [05:30<00:34, 18.95it/s]\u001b[A\n"," 89% 5494/6144 [05:30<00:35, 18.55it/s]\u001b[A\n"," 89% 5496/6144 [05:30<00:34, 18.91it/s]\u001b[A\n"," 89% 5498/6144 [05:30<00:34, 18.87it/s]\u001b[A\n"," 90% 5500/6144 [05:30<00:33, 19.14it/s]\u001b[A\n"," 90% 5502/6144 [05:30<00:33, 19.32it/s]\u001b[A\n"," 90% 5504/6144 [05:31<00:33, 19.12it/s]\u001b[A\n"," 90% 5506/6144 [05:31<00:33, 19.33it/s]\u001b[A\n"," 90% 5508/6144 [05:31<00:32, 19.35it/s]\u001b[A\n"," 90% 5510/6144 [05:31<00:33, 19.19it/s]\u001b[A\n"," 90% 5512/6144 [05:31<00:32, 19.32it/s]\u001b[A\n"," 90% 5514/6144 [05:31<00:33, 18.79it/s]\u001b[A\n"," 90% 5516/6144 [05:31<00:33, 18.67it/s]\u001b[A\n"," 90% 5518/6144 [05:31<00:33, 18.94it/s]\u001b[A\n"," 90% 5520/6144 [05:31<00:33, 18.90it/s]\u001b[A\n"," 90% 5522/6144 [05:31<00:32, 19.09it/s]\u001b[A\n"," 90% 5524/6144 [05:32<00:32, 19.25it/s]\u001b[A\n"," 90% 5526/6144 [05:32<00:32, 
19.15it/s]\u001b[A\n"," 90% 5528/6144 [05:32<00:32, 19.21it/s]\u001b[A\n"," 90% 5530/6144 [05:32<00:32, 19.01it/s]\u001b[A\n"," 90% 5532/6144 [05:32<00:32, 19.04it/s]\u001b[A\n"," 90% 5534/6144 [05:32<00:32, 18.83it/s]\u001b[A\n"," 90% 5536/6144 [05:32<00:32, 18.82it/s]\u001b[A\n"," 90% 5538/6144 [05:32<00:31, 19.10it/s]\u001b[A\n"," 90% 5540/6144 [05:32<00:31, 19.30it/s]\u001b[A\n"," 90% 5542/6144 [05:33<00:31, 18.92it/s]\u001b[A\n"," 90% 5544/6144 [05:33<00:31, 19.19it/s]\u001b[A\n"," 90% 5546/6144 [05:33<00:30, 19.36it/s]\u001b[A\n"," 90% 5548/6144 [05:33<00:30, 19.28it/s]\u001b[A\n"," 90% 5550/6144 [05:33<00:30, 19.40it/s]\u001b[A\n"," 90% 5552/6144 [05:33<00:30, 19.48it/s]\u001b[A\n"," 90% 5554/6144 [05:33<00:31, 18.59it/s]\u001b[A\n"," 90% 5556/6144 [05:33<00:31, 18.62it/s]\u001b[A\n"," 90% 5558/6144 [05:33<00:30, 18.95it/s]\u001b[A\n"," 90% 5560/6144 [05:33<00:30, 18.85it/s]\u001b[A\n"," 91% 5562/6144 [05:34<00:30, 19.10it/s]\u001b[A\n"," 91% 5564/6144 [05:34<00:30, 19.23it/s]\u001b[A\n"," 91% 5566/6144 [05:34<00:30, 19.05it/s]\u001b[A\n"," 91% 5568/6144 [05:34<00:29, 19.23it/s]\u001b[A\n"," 91% 5570/6144 [05:34<00:29, 19.38it/s]\u001b[A\n"," 91% 5572/6144 [05:34<00:30, 18.87it/s]\u001b[A\n"," 91% 5574/6144 [05:34<00:29, 19.01it/s]\u001b[A\n"," 91% 5576/6144 [05:34<00:29, 19.24it/s]\u001b[A\n"," 91% 5578/6144 [05:34<00:29, 19.09it/s]\u001b[A\n"," 91% 5580/6144 [05:34<00:29, 19.23it/s]\u001b[A\n"," 91% 5582/6144 [05:35<00:28, 19.39it/s]\u001b[A\n"," 91% 5584/6144 [05:35<00:29, 18.83it/s]\u001b[A\n"," 91% 5586/6144 [05:35<00:29, 18.72it/s]\u001b[A\n"," 91% 5588/6144 [05:35<00:29, 18.79it/s]\u001b[A\n"," 91% 5590/6144 [05:35<00:29, 18.82it/s]\u001b[A\n"," 91% 5592/6144 [05:35<00:29, 18.83it/s]\u001b[A\n"," 91% 5594/6144 [05:35<00:28, 19.08it/s]\u001b[A\n"," 91% 5596/6144 [05:35<00:28, 18.91it/s]\u001b[A\n"," 91% 5598/6144 [05:35<00:28, 19.06it/s]\u001b[A\n"," 91% 5600/6144 [05:36<00:28, 19.26it/s]\u001b[A\n"," 91% 5602/6144 [05:36<00:28, 19.07it/s]\u001b[A\n"," 
91% 5604/6144 [05:36<00:28, 19.27it/s]\u001b[A\n"," 91% 5606/6144 [05:36<00:27, 19.36it/s]\u001b[A\n"," 91% 5608/6144 [05:36<00:27, 19.17it/s]\u001b[A\n"," 91% 5610/6144 [05:36<00:27, 19.20it/s]\u001b[A\n"," 91% 5612/6144 [05:36<00:28, 18.86it/s]\u001b[A\n"," 91% 5614/6144 [05:36<00:28, 18.86it/s]\u001b[A\n"," 91% 5616/6144 [05:36<00:27, 19.12it/s]\u001b[A\n"," 91% 5618/6144 [05:36<00:27, 18.96it/s]\u001b[A\n"," 91% 5620/6144 [05:37<00:27, 19.00it/s]\u001b[A\n"," 92% 5622/6144 [05:37<00:27, 19.21it/s]\u001b[A\n"," 92% 5624/6144 [05:37<00:27, 18.99it/s]\u001b[A\n"," 92% 5626/6144 [05:37<00:27, 19.03it/s]\u001b[A\n"," 92% 5628/6144 [05:37<00:26, 19.22it/s]\u001b[A\n"," 92% 5630/6144 [05:37<00:27, 18.37it/s]\u001b[A\n"," 92% 5632/6144 [05:37<00:27, 18.78it/s]\u001b[A\n"," 92% 5634/6144 [05:37<00:26, 19.02it/s]\u001b[A\n"," 92% 5636/6144 [05:37<00:28, 18.06it/s]\u001b[A\n"," 92% 5638/6144 [05:38<00:27, 18.30it/s]\u001b[A\n"," 92% 5640/6144 [05:38<00:28, 17.95it/s]\u001b[A\n"," 92% 5642/6144 [05:38<00:30, 16.42it/s]\u001b[A\n"," 92% 5644/6144 [05:38<00:33, 15.03it/s]\u001b[A\n"," 92% 5646/6144 [05:38<00:33, 14.77it/s]\u001b[A\n"," 92% 5648/6144 [05:38<00:34, 14.57it/s]\u001b[A\n"," 92% 5650/6144 [05:38<00:33, 14.57it/s]\u001b[A\n"," 92% 5652/6144 [05:39<00:34, 14.43it/s]\u001b[A\n"," 92% 5654/6144 [05:39<00:35, 13.97it/s]\u001b[A\n"," 92% 5656/6144 [05:39<00:34, 14.30it/s]\u001b[A\n"," 92% 5658/6144 [05:39<00:33, 14.37it/s]\u001b[A\n"," 92% 5660/6144 [05:39<00:34, 14.14it/s]\u001b[A\n"," 92% 5662/6144 [05:39<00:34, 13.93it/s]\u001b[A\n"," 92% 5664/6144 [05:39<00:34, 13.80it/s]\u001b[A\n"," 92% 5666/6144 [05:40<00:34, 14.01it/s]\u001b[A\n"," 92% 5668/6144 [05:40<00:32, 14.44it/s]\u001b[A\n"," 92% 5670/6144 [05:40<00:32, 14.48it/s]\u001b[A\n"," 92% 5672/6144 [05:40<00:32, 14.44it/s]\u001b[A\n"," 92% 5674/6144 [05:40<00:33, 14.19it/s]\u001b[A\n"," 92% 5676/6144 [05:40<00:32, 14.19it/s]\u001b[A\n"," 92% 5678/6144 [05:40<00:32, 14.43it/s]\u001b[A\n"," 92% 5680/6144 
[05:41<00:33, 13.99it/s]\u001b[A\n"," 92% 5682/6144 [05:41<00:31, 14.51it/s]\u001b[A\n"," 93% 5684/6144 [05:41<00:31, 14.43it/s]\u001b[A\n"," 93% 5686/6144 [05:41<00:32, 13.92it/s]\u001b[A\n"," 93% 5688/6144 [05:41<00:29, 15.24it/s]\u001b[A\n"," 93% 5690/6144 [05:41<00:27, 16.25it/s]\u001b[A\n"," 93% 5692/6144 [05:41<00:27, 16.46it/s]\u001b[A\n"," 93% 5694/6144 [05:41<00:26, 17.30it/s]\u001b[A\n"," 93% 5696/6144 [05:41<00:24, 17.97it/s]\u001b[A\n"," 93% 5698/6144 [05:42<00:24, 18.11it/s]\u001b[A\n"," 93% 5700/6144 [05:42<00:23, 18.51it/s]\u001b[A\n"," 93% 5702/6144 [05:42<00:23, 18.85it/s]\u001b[A\n"," 93% 5704/6144 [05:42<00:23, 18.87it/s]\u001b[A\n"," 93% 5706/6144 [05:42<00:22, 19.11it/s]\u001b[A\n"," 93% 5708/6144 [05:42<00:22, 19.28it/s]\u001b[A\n"," 93% 5710/6144 [05:42<00:22, 18.97it/s]\u001b[A\n"," 93% 5712/6144 [05:42<00:22, 18.86it/s]\u001b[A\n"," 93% 5714/6144 [05:42<00:22, 19.09it/s]\u001b[A\n"," 93% 5716/6144 [05:43<00:22, 19.23it/s]\u001b[A\n"," 93% 5718/6144 [05:43<00:22, 19.26it/s]\u001b[A\n"," 93% 5720/6144 [05:43<00:21, 19.39it/s]\u001b[A\n"," 93% 5722/6144 [05:43<00:21, 19.24it/s]\u001b[A\n"," 93% 5724/6144 [05:43<00:21, 19.34it/s]\u001b[A\n"," 93% 5726/6144 [05:43<00:21, 19.45it/s]\u001b[A\n"," 93% 5728/6144 [05:43<00:21, 19.18it/s]\u001b[A\n"," 93% 5730/6144 [05:43<00:21, 19.03it/s]\u001b[A\n"," 93% 5732/6144 [05:43<00:21, 18.92it/s]\u001b[A\n"," 93% 5734/6144 [05:43<00:21, 18.75it/s]\u001b[A\n"," 93% 5736/6144 [05:44<00:21, 19.03it/s]\u001b[A\n"," 93% 5738/6144 [05:44<00:21, 19.23it/s]\u001b[A\n"," 93% 5740/6144 [05:44<00:21, 19.19it/s]\u001b[A\n"," 93% 5742/6144 [05:44<00:20, 19.18it/s]\u001b[A\n"," 93% 5744/6144 [05:44<00:20, 19.35it/s]\u001b[A\n"," 94% 5746/6144 [05:44<00:20, 19.20it/s]\u001b[A\n"," 94% 5748/6144 [05:44<00:20, 19.27it/s]\u001b[A\n"," 94% 5750/6144 [05:44<00:20, 19.33it/s]\u001b[A\n"," 94% 5752/6144 [05:44<00:20, 18.75it/s]\u001b[A\n"," 94% 5754/6144 [05:45<00:20, 19.04it/s]\u001b[A\n"," 94% 5756/6144 [05:45<00:20, 
19.22it/s]\u001b[A\n"," 94% 5758/6144 [05:45<00:20, 19.06it/s]\u001b[A\n"," 94% 5760/6144 [05:45<00:19, 19.25it/s]\u001b[A\n"," 94% 5762/6144 [05:45<00:19, 19.29it/s]\u001b[A\n"," 94% 5764/6144 [05:45<00:19, 19.34it/s]\u001b[A\n"," 94% 5766/6144 [05:45<00:19, 19.17it/s]\u001b[A\n"," 94% 5768/6144 [05:45<00:19, 19.32it/s]\u001b[A\n"," 94% 5770/6144 [05:45<00:19, 18.80it/s]\u001b[A\n"," 94% 5772/6144 [05:45<00:19, 19.04it/s]\u001b[A\n"," 94% 5774/6144 [05:46<00:19, 19.10it/s]\u001b[A\n"," 94% 5776/6144 [05:46<00:19, 18.88it/s]\u001b[A\n"," 94% 5778/6144 [05:46<00:19, 19.11it/s]\u001b[A\n"," 94% 5780/6144 [05:46<00:18, 19.26it/s]\u001b[A\n"," 94% 5782/6144 [05:46<00:18, 19.11it/s]\u001b[A\n"," 94% 5784/6144 [05:46<00:18, 19.26it/s]\u001b[A\n"," 94% 5786/6144 [05:46<00:18, 19.17it/s]\u001b[A\n"," 94% 5788/6144 [05:46<00:18, 19.06it/s]\u001b[A\n"," 94% 5790/6144 [05:46<00:18, 18.84it/s]\u001b[A\n"," 94% 5792/6144 [05:46<00:18, 19.11it/s]\u001b[A\n"," 94% 5794/6144 [05:47<00:18, 19.06it/s]\u001b[A\n"," 94% 5796/6144 [05:47<00:18, 19.24it/s]\u001b[A\n"," 94% 5798/6144 [05:47<00:17, 19.27it/s]\u001b[A\n"," 94% 5800/6144 [05:47<00:18, 19.11it/s]\u001b[A\n"," 94% 5802/6144 [05:47<00:17, 19.25it/s]\u001b[A\n"," 94% 5804/6144 [05:47<00:17, 19.37it/s]\u001b[A\n"," 94% 5806/6144 [05:47<00:17, 19.12it/s]\u001b[A\n"," 95% 5808/6144 [05:47<00:17, 18.95it/s]\u001b[A\n"," 95% 5810/6144 [05:47<00:17, 18.70it/s]\u001b[A\n"," 95% 5812/6144 [05:48<00:17, 18.76it/s]\u001b[A\n"," 95% 5814/6144 [05:48<00:17, 18.96it/s]\u001b[A\n"," 95% 5816/6144 [05:48<00:17, 18.96it/s]\u001b[A\n"," 95% 5818/6144 [05:48<00:17, 19.13it/s]\u001b[A\n"," 95% 5820/6144 [05:48<00:16, 19.26it/s]\u001b[A\n"," 95% 5822/6144 [05:48<00:16, 18.97it/s]\u001b[A\n"," 95% 5824/6144 [05:48<00:17, 18.80it/s]\u001b[A\n"," 95% 5826/6144 [05:48<00:17, 18.70it/s]\u001b[A\n"," 95% 5828/6144 [05:48<00:17, 18.33it/s]\u001b[A\n"," 95% 5830/6144 [05:49<00:16, 18.69it/s]\u001b[A\n"," 95% 5832/6144 [05:49<00:16, 18.56it/s]\u001b[A\n"," 
95% 5834/6144 [05:49<00:16, 18.88it/s]\u001b[A\n"," 95% 5836/6144 [05:49<00:16, 19.09it/s]\u001b[A\n"," 95% 5838/6144 [05:49<00:16, 18.92it/s]\u001b[A\n"," 95% 5840/6144 [05:49<00:15, 19.12it/s]\u001b[A\n"," 95% 5842/6144 [05:49<00:15, 19.22it/s]\u001b[A\n"," 95% 5844/6144 [05:49<00:15, 18.79it/s]\u001b[A\n"," 95% 5846/6144 [05:49<00:15, 18.82it/s]\u001b[A\n"," 95% 5848/6144 [05:49<00:16, 18.04it/s]\u001b[A\n"," 95% 5850/6144 [05:50<00:15, 18.50it/s]\u001b[A\n"," 95% 5852/6144 [05:50<00:15, 18.84it/s]\u001b[A\n"," 95% 5854/6144 [05:50<00:15, 18.82it/s]\u001b[A\n"," 95% 5856/6144 [05:50<00:15, 18.85it/s]\u001b[A\n"," 95% 5858/6144 [05:50<00:15, 18.84it/s]\u001b[A\n"," 95% 5860/6144 [05:50<00:16, 16.79it/s]\u001b[A\n"," 95% 5862/6144 [05:50<00:17, 15.78it/s]\u001b[A\n"," 95% 5864/6144 [05:50<00:18, 15.54it/s]\u001b[A\n"," 95% 5866/6144 [05:51<00:18, 15.12it/s]\u001b[A\n"," 96% 5868/6144 [05:51<00:18, 15.18it/s]\u001b[A\n"," 96% 5870/6144 [05:51<00:17, 15.29it/s]\u001b[A\n"," 96% 5872/6144 [05:51<00:18, 14.97it/s]\u001b[A\n"," 96% 5874/6144 [05:51<00:17, 15.20it/s]\u001b[A\n"," 96% 5876/6144 [05:51<00:17, 15.25it/s]\u001b[A\n"," 96% 5878/6144 [05:51<00:17, 14.86it/s]\u001b[A\n"," 96% 5880/6144 [05:52<00:18, 14.57it/s]\u001b[A\n"," 96% 5882/6144 [05:52<00:18, 14.39it/s]\u001b[A\n"," 96% 5884/6144 [05:52<00:17, 14.45it/s]\u001b[A\n"," 96% 5886/6144 [05:52<00:17, 14.74it/s]\u001b[A\n"," 96% 5888/6144 [05:52<00:17, 14.95it/s]\u001b[A\n"," 96% 5890/6144 [05:52<00:16, 15.04it/s]\u001b[A\n"," 96% 5892/6144 [05:52<00:16, 15.20it/s]\u001b[A\n"," 96% 5894/6144 [05:52<00:17, 14.55it/s]\u001b[A\n"," 96% 5896/6144 [05:53<00:18, 13.37it/s]\u001b[A\n"," 96% 5898/6144 [05:53<00:17, 13.86it/s]\u001b[A\n"," 96% 5900/6144 [05:53<00:17, 13.86it/s]\u001b[A\n"," 96% 5902/6144 [05:53<00:17, 14.12it/s]\u001b[A\n"," 96% 5904/6144 [05:53<00:17, 13.78it/s]\u001b[A\n"," 96% 5906/6144 [05:53<00:16, 14.02it/s]\u001b[A\n"," 96% 5908/6144 [05:53<00:15, 15.15it/s]\u001b[A\n"," 96% 5910/6144 
[05:54<00:14, 15.99it/s]\u001b[A\n"," 96% 5912/6144 [05:54<00:13, 16.62it/s]\u001b[A\n"," 96% 5914/6144 [05:54<00:13, 17.40it/s]\u001b[A\n"," 96% 5916/6144 [05:54<00:12, 17.61it/s]\u001b[A\n"," 96% 5918/6144 [05:54<00:12, 18.17it/s]\u001b[A\n"," 96% 5920/6144 [05:54<00:12, 18.57it/s]\u001b[A\n"," 96% 5922/6144 [05:54<00:11, 18.73it/s]\u001b[A\n"," 96% 5924/6144 [05:54<00:11, 18.71it/s]\u001b[A\n"," 96% 5926/6144 [05:54<00:11, 18.95it/s]\u001b[A\n"," 96% 5928/6144 [05:54<00:11, 18.86it/s]\u001b[A\n"," 97% 5930/6144 [05:55<00:11, 18.58it/s]\u001b[A\n"," 97% 5932/6144 [05:55<00:11, 18.86it/s]\u001b[A\n"," 97% 5934/6144 [05:55<00:11, 18.63it/s]\u001b[A\n"," 97% 5936/6144 [05:55<00:11, 18.84it/s]\u001b[A\n"," 97% 5938/6144 [05:55<00:10, 19.04it/s]\u001b[A\n"," 97% 5940/6144 [05:55<00:10, 18.86it/s]\u001b[A\n"," 97% 5942/6144 [05:55<00:10, 18.87it/s]\u001b[A\n"," 97% 5944/6144 [05:55<00:10, 19.09it/s]\u001b[A\n"," 97% 5946/6144 [05:55<00:10, 18.91it/s]\u001b[A\n"," 97% 5948/6144 [05:56<00:10, 19.12it/s]\u001b[A\n"," 97% 5950/6144 [05:56<00:10, 19.06it/s]\u001b[A\n"," 97% 5952/6144 [05:56<00:10, 18.86it/s]\u001b[A\n"," 97% 5954/6144 [05:56<00:09, 19.10it/s]\u001b[A\n"," 97% 5956/6144 [05:56<00:09, 19.26it/s]\u001b[A\n"," 97% 5958/6144 [05:56<00:09, 19.01it/s]\u001b[A\n"," 97% 5960/6144 [05:56<00:09, 19.16it/s]\u001b[A\n"," 97% 5962/6144 [05:56<00:09, 19.30it/s]\u001b[A\n"," 97% 5964/6144 [05:56<00:09, 18.98it/s]\u001b[A\n"," 97% 5966/6144 [05:56<00:09, 18.95it/s]\u001b[A\n"," 97% 5968/6144 [05:57<00:09, 18.56it/s]\u001b[A\n"," 97% 5970/6144 [05:57<00:09, 18.47it/s]\u001b[A\n"," 97% 5972/6144 [05:57<00:09, 18.82it/s]\u001b[A\n"," 97% 5974/6144 [05:57<00:09, 18.64it/s]\u001b[A\n"," 97% 5976/6144 [05:57<00:08, 18.86it/s]\u001b[A\n"," 97% 5978/6144 [05:57<00:08, 19.09it/s]\u001b[A\n"," 97% 5980/6144 [05:57<00:08, 18.80it/s]\u001b[A\n"," 97% 5982/6144 [05:57<00:08, 18.96it/s]\u001b[A\n"," 97% 5984/6144 [05:57<00:08, 18.99it/s]\u001b[A\n"," 97% 5986/6144 [05:58<00:08, 
18.28it/s]\u001b[A\n"," 97% 5988/6144 [05:58<00:08, 18.19it/s]\u001b[A\n"," 97% 5990/6144 [05:58<00:08, 18.41it/s]\u001b[A\n"," 98% 5992/6144 [05:58<00:08, 18.42it/s]\u001b[A\n"," 98% 5994/6144 [05:58<00:07, 18.76it/s]\u001b[A\n"," 98% 5996/6144 [05:58<00:07, 18.95it/s]\u001b[A\n"," 98% 5998/6144 [05:58<00:07, 18.89it/s]\u001b[A\n"," 98% 6000/6144 [05:58<00:07, 19.11it/s]\u001b[A\n"," 98% 6002/6144 [05:58<00:07, 18.80it/s]\u001b[A\n"," 98% 6004/6144 [05:59<00:07, 19.04it/s]\u001b[A\n"," 98% 6006/6144 [05:59<00:07, 19.20it/s]\u001b[A\n"," 98% 6008/6144 [05:59<00:07, 18.78it/s]\u001b[A\n"," 98% 6010/6144 [05:59<00:07, 19.01it/s]\u001b[A\n"," 98% 6012/6144 [05:59<00:07, 18.57it/s]\u001b[A\n"," 98% 6014/6144 [05:59<00:07, 18.49it/s]\u001b[A\n"," 98% 6016/6144 [05:59<00:06, 18.81it/s]\u001b[A\n"," 98% 6018/6144 [05:59<00:06, 19.03it/s]\u001b[A\n"," 98% 6020/6144 [05:59<00:06, 18.95it/s]\u001b[A\n"," 98% 6022/6144 [05:59<00:06, 19.13it/s]\u001b[A\n"," 98% 6024/6144 [06:00<00:06, 19.25it/s]\u001b[A\n"," 98% 6026/6144 [06:00<00:06, 18.52it/s]\u001b[A\n"," 98% 6028/6144 [06:00<00:06, 18.82it/s]\u001b[A\n"," 98% 6030/6144 [06:00<00:05, 19.03it/s]\u001b[A\n"," 98% 6032/6144 [06:00<00:05, 19.17it/s]\u001b[A\n"," 98% 6034/6144 [06:00<00:05, 19.06it/s]\u001b[A\n"," 98% 6036/6144 [06:00<00:05, 19.02it/s]\u001b[A\n"," 98% 6038/6144 [06:00<00:05, 18.90it/s]\u001b[A\n"," 98% 6040/6144 [06:00<00:05, 19.07it/s]\u001b[A\n"," 98% 6042/6144 [06:01<00:05, 18.48it/s]\u001b[A\n"," 98% 6044/6144 [06:01<00:05, 18.48it/s]\u001b[A\n"," 98% 6046/6144 [06:01<00:05, 18.44it/s]\u001b[A\n"," 98% 6048/6144 [06:01<00:05, 18.61it/s]\u001b[A\n"," 98% 6050/6144 [06:01<00:05, 18.64it/s]\u001b[A\n"," 99% 6052/6144 [06:01<00:04, 18.80it/s]\u001b[A\n"," 99% 6054/6144 [06:01<00:04, 19.04it/s]\u001b[A\n"," 99% 6056/6144 [06:01<00:04, 18.97it/s]\u001b[A\n"," 99% 6058/6144 [06:01<00:04, 19.02it/s]\u001b[A\n"," 99% 6060/6144 [06:01<00:04, 18.99it/s]\u001b[A\n"," 99% 6062/6144 [06:02<00:04, 18.78it/s]\u001b[A\n"," 
99% 6064/6144 [06:02<00:04, 19.00it/s]\u001b[A\n"," 99% 6066/6144 [06:02<00:04, 18.52it/s]\u001b[A\n"," 99% 6068/6144 [06:02<00:04, 18.62it/s]\u001b[A\n"," 99% 6070/6144 [06:02<00:03, 18.85it/s]\u001b[A\n"," 99% 6072/6144 [06:02<00:03, 18.86it/s]\u001b[A\n"," 99% 6074/6144 [06:02<00:03, 19.04it/s]\u001b[A\n"," 99% 6076/6144 [06:02<00:03, 18.68it/s]\u001b[A\n"," 99% 6078/6144 [06:02<00:03, 18.96it/s]\u001b[A\n"," 99% 6080/6144 [06:03<00:03, 17.19it/s]\u001b[A\n"," 99% 6082/6144 [06:03<00:03, 15.93it/s]\u001b[A\n"," 99% 6084/6144 [06:03<00:03, 15.24it/s]\u001b[A\n"," 99% 6086/6144 [06:03<00:03, 15.08it/s]\u001b[A\n"," 99% 6088/6144 [06:03<00:03, 14.34it/s]\u001b[A\n"," 99% 6090/6144 [06:03<00:03, 14.48it/s]\u001b[A\n"," 99% 6092/6144 [06:03<00:03, 14.68it/s]\u001b[A\n"," 99% 6094/6144 [06:04<00:03, 14.77it/s]\u001b[A\n"," 99% 6096/6144 [06:04<00:03, 14.99it/s]\u001b[A\n"," 99% 6098/6144 [06:04<00:03, 13.67it/s]\u001b[A\n"," 99% 6100/6144 [06:04<00:03, 13.76it/s]\u001b[A\n"," 99% 6102/6144 [06:04<00:02, 14.08it/s]\u001b[A\n"," 99% 6104/6144 [06:04<00:02, 14.50it/s]\u001b[A\n"," 99% 6106/6144 [06:04<00:02, 14.89it/s]\u001b[A\n"," 99% 6108/6144 [06:05<00:02, 14.93it/s]\u001b[A\n"," 99% 6110/6144 [06:05<00:02, 15.24it/s]\u001b[A\n"," 99% 6112/6144 [06:05<00:02, 15.09it/s]\u001b[A\n","100% 6114/6144 [06:05<00:02, 14.52it/s]\u001b[A\n","100% 6116/6144 [06:05<00:01, 14.69it/s]\u001b[A\n","100% 6118/6144 [06:05<00:01, 14.94it/s]\u001b[A\n","100% 6120/6144 [06:05<00:01, 14.34it/s]\u001b[A\n","100% 6122/6144 [06:06<00:01, 14.49it/s]\u001b[A\n","100% 6124/6144 [06:06<00:01, 14.32it/s]\u001b[A\n","100% 6126/6144 [06:06<00:01, 14.50it/s]\u001b[A\n","100% 6128/6144 [06:06<00:01, 14.95it/s]\u001b[A\n","100% 6130/6144 [06:06<00:00, 15.82it/s]\u001b[A\n","100% 6132/6144 [06:06<00:00, 16.77it/s]\u001b[A\n","100% 6134/6144 [06:06<00:00, 17.45it/s]\u001b[A\n","100% 6136/6144 [06:06<00:00, 17.72it/s]\u001b[A\n","100% 6138/6144 [06:06<00:00, 18.21it/s]\u001b[A\n","100% 6140/6144 
[06:07<00:00, 18.57it/s]\u001b[A\n","100% 6142/6144 [06:07<00:00, 18.83it/s]\u001b[A\n","100% 6144/6144 [06:07<00:00, 16.73it/s]\n","Logging train inputs/ouputs\n","\u001b[35msteps:1\u001b[0m\n"," 1% 1/78 [07:06<9:07:09, 426.35s/it, bpd=5.3, g_l=5.3, gn=2.92, l=4.99, p_l=0.0227]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 3% 2/78 [07:11<6:20:02, 300.04s/it, bpd=5.32, g_l=5.32, gn=3.02, l=5.01, p_l=0.0226]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 4% 3/78 [07:16<4:24:25, 211.55s/it, bpd=6.39, g_l=6.39, gn=2.72, l=6.02, p_l=0.0225]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 5% 4/78 [07:21<3:04:30, 149.60s/it, bpd=4.44, g_l=4.44, gn=2.31, l=4.18, p_l=0.0221]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 6% 5/78 [07:26<2:09:15, 106.24s/it, bpd=3.69, g_l=3.69, gn=2.22, l=3.47, p_l=0.0214]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 8% 6/78 [07:31<1:31:05, 75.91s/it, bpd=3.62, g_l=3.62, gn=2.18, l=3.41, p_l=0.0203] /content/gdrive/MyDrive/slon/slon (4).txt\n"," 9% 7/78 [07:37<1:04:42, 54.69s/it, bpd=4.71, g_l=4.71, gn=2.14, l=4.43, p_l=0.0191]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 10% 8/78 [07:42<46:28, 39.84s/it, bpd=6.35, g_l=6.35, gn=2.28, l=5.98, p_l=0.0177] /content/gdrive/MyDrive/slon/slon (22).txt\n"," 12% 9/78 [07:47<33:52, 29.46s/it, bpd=4.76, g_l=4.76, gn=2.39, l=4.48, p_l=0.0162]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 13% 10/78 [07:52<25:09, 22.20s/it, bpd=5.09, g_l=5.09, gn=2.46, l=4.8, p_l=0.0146]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [07:58<19:06, 17.12s/it, bpd=5.28, g_l=5.28, gn=2.38, l=4.97, p_l=0.0132]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 15% 12/78 [08:03<14:55, 13.57s/it, bpd=5.62, g_l=5.62, gn=2.42, l=5.29, p_l=0.0118]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 17% 13/78 [08:08<11:59, 11.08s/it, bpd=5.26, g_l=5.26, gn=2.45, l=4.95, p_l=0.0106]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 18% 14/78 [08:13<09:57, 9.33s/it, bpd=5.15, g_l=5.15, gn=2.4, l=4.85, 
p_l=0.00932]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 19% 15/78 [08:19<08:29, 8.09s/it, bpd=5.08, g_l=5.08, gn=2.39, l=4.79, p_l=0.00807]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 21% 16/78 [08:24<07:27, 7.22s/it, bpd=6.01, g_l=6.01, gn=2.4, l=5.65, p_l=0.00702]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 22% 17/78 [08:29<06:42, 6.60s/it, bpd=5.26, g_l=5.26, gn=2.44, l=4.96, p_l=0.00582]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 23% 18/78 [08:34<06:09, 6.16s/it, bpd=5.01, g_l=5.01, gn=2.6, l=4.72, p_l=0.00499]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 24% 19/78 [08:39<05:46, 5.87s/it, bpd=6.01, g_l=6.01, gn=2.55, l=5.66, p_l=0.00398]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 26% 20/78 [08:44<05:28, 5.66s/it, bpd=4.69, g_l=4.69, gn=2.7, l=4.41, p_l=0.00322]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 27% 21/78 [08:50<05:14, 5.51s/it, bpd=5.17, g_l=5.17, gn=2.74, l=4.87, p_l=0.00248]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 28% 22/78 [08:55<05:02, 5.41s/it, bpd=5.34, g_l=5.34, gn=2.48, l=5.02, p_l=0.00186]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 29% 23/78 [09:00<04:53, 5.34s/it, bpd=5.93, g_l=5.93, gn=2.37, l=5.58, p_l=0.0014]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 31% 24/78 [09:05<04:46, 5.30s/it, bpd=4.47, g_l=4.47, gn=2.35, l=4.21, p_l=0.00103]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 32% 25/78 [09:10<04:39, 5.27s/it, bpd=4.72, g_l=4.72, gn=2.75, l=4.44, p_l=0.000768]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 33% 26/78 [09:16<04:33, 5.27s/it, bpd=4.71, g_l=4.71, gn=2.53, l=4.44, p_l=0.000572]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 35% 27/78 [09:21<04:27, 5.25s/it, bpd=5.1, g_l=5.1, gn=2.85, l=4.8, p_l=0.000437]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 36% 28/78 [09:26<04:21, 5.24s/it, bpd=5.19, g_l=5.19, gn=2.63, l=4.89, p_l=0.000326]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 37% 29/78 [09:31<04:16, 5.23s/it, bpd=4.42, g_l=4.42, gn=3.29, l=4.16, 
p_l=0.000253]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 38% 30/78 [09:36<04:10, 5.22s/it, bpd=5.04, g_l=5.04, gn=3.87, l=4.75, p_l=0.000206]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 40% 31/78 [09:42<04:05, 5.23s/it, bpd=6.69, g_l=6.69, gn=2.82, l=6.3, p_l=0.000172]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 41% 32/78 [09:47<04:00, 5.22s/it, bpd=4.51, g_l=4.51, gn=2.24, l=4.25, p_l=0.000145]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 42% 33/78 [09:52<03:54, 5.22s/it, bpd=5.45, g_l=5.45, gn=3.07, l=5.13, p_l=0.000129]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 44% 34/78 [09:57<03:49, 5.22s/it, bpd=6.2, g_l=6.2, gn=2.55, l=5.84, p_l=0.000115]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 45% 35/78 [10:03<03:43, 5.20s/it, bpd=6.57, g_l=6.57, gn=2.5, l=6.18, p_l=0.000103]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 46% 36/78 [10:08<03:38, 5.20s/it, bpd=6.7, g_l=6.7, gn=2.32, l=6.31, p_l=0.0001]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 47% 37/78 [10:13<03:32, 5.18s/it, bpd=5.09, g_l=5.09, gn=3.45, l=4.79, p_l=0.000102]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 49% 38/78 [10:18<03:27, 5.18s/it, bpd=5.53, g_l=5.53, gn=2.54, l=5.21, p_l=0.000108]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 50% 39/78 [10:23<03:21, 5.18s/it, bpd=4.86, g_l=4.86, gn=3.67, l=4.58, p_l=0.000108]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 51% 40/78 [10:28<03:16, 5.18s/it, bpd=5.09, g_l=5.09, gn=2.83, l=4.79, p_l=9.93e-5]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 53% 41/78 [10:34<03:11, 5.17s/it, bpd=5.28, g_l=5.28, gn=2.97, l=4.97, p_l=9.49e-5]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 54% 42/78 [10:39<03:06, 5.18s/it, bpd=3.98, g_l=3.98, gn=3.14, l=3.75, p_l=9.37e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 55% 43/78 [10:44<03:01, 5.19s/it, bpd=5.25, g_l=5.25, gn=2.96, l=4.94, p_l=8.29e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 56% 44/78 [10:49<02:56, 5.20s/it, bpd=4.81, g_l=4.81, gn=3.29, l=4.53, 
p_l=8.12e-5]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 58% 45/78 [10:54<02:51, 5.21s/it, bpd=4.51, g_l=4.51, gn=5.03, l=4.25, p_l=7.46e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 59% 46/78 [11:00<02:46, 5.22s/it, bpd=6.6, g_l=6.6, gn=3.45, l=6.21, p_l=7.36e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 60% 47/78 [11:05<02:41, 5.22s/it, bpd=5.99, g_l=5.99, gn=3.14, l=5.64, p_l=7.02e-5]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 62% 48/78 [11:10<02:36, 5.23s/it, bpd=6.51, g_l=6.51, gn=2.58, l=6.13, p_l=7.04e-5]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 63% 49/78 [11:15<02:31, 5.23s/it, bpd=5.24, g_l=5.24, gn=4.08, l=4.93, p_l=6.91e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 64% 50/78 [11:21<02:26, 5.23s/it, bpd=6.16, g_l=6.16, gn=4.36, l=5.8, p_l=6.86e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 65% 51/78 [11:26<02:20, 5.21s/it, bpd=6.54, g_l=6.54, gn=3.19, l=6.15, p_l=7.33e-5]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 67% 52/78 [11:31<02:15, 5.19s/it, bpd=5.41, g_l=5.41, gn=4.64, l=5.09, p_l=7.15e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 68% 53/78 [11:36<02:09, 5.18s/it, bpd=6, g_l=6, gn=3.72, l=5.65, p_l=6.25e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 69% 54/78 [11:41<02:04, 5.18s/it, bpd=5.65, g_l=5.65, gn=5.81, l=5.32, p_l=5.11e-5]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 71% 55/78 [11:46<01:59, 5.19s/it, bpd=5.44, g_l=5.44, gn=3.33, l=5.12, p_l=4.05e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 72% 56/78 [11:52<01:54, 5.19s/it, bpd=5.94, g_l=5.94, gn=6.07, l=5.59, p_l=3.26e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 73% 57/78 [11:57<01:48, 5.18s/it, bpd=5.58, g_l=5.58, gn=5.63, l=5.25, p_l=2.8e-5]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 74% 58/78 [12:02<01:43, 5.19s/it, bpd=6.06, g_l=6.06, gn=3.08, l=5.7, p_l=2.68e-5]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 76% 59/78 [12:07<01:38, 5.20s/it, bpd=6.75, g_l=6.75, gn=3.2, l=6.35, p_l=2.58e-5]/content/gdrive/MyDrive/slon/slon 
(3).txt\n"," 77% 60/78 [12:12<01:33, 5.21s/it, bpd=5.06, g_l=5.06, gn=6.82, l=4.76, p_l=2.62e-5]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 78% 61/78 [12:18<01:28, 5.21s/it, bpd=4.71, g_l=4.71, gn=4.27, l=4.44, p_l=2.54e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 79% 62/78 [12:23<01:23, 5.23s/it, bpd=5.43, g_l=5.43, gn=3.81, l=5.11, p_l=2.61e-5]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 81% 63/78 [12:28<01:18, 5.22s/it, bpd=5.92, g_l=5.92, gn=3.96, l=5.57, p_l=2.72e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 82% 64/78 [12:33<01:12, 5.21s/it, bpd=5.25, g_l=5.25, gn=4.66, l=4.94, p_l=2.77e-5]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 83% 65/78 [12:39<01:07, 5.21s/it, bpd=5.07, g_l=5.07, gn=4.53, l=4.77, p_l=2.64e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 85% 66/78 [12:44<01:02, 5.21s/it, bpd=5.31, g_l=5.31, gn=4.36, l=5, p_l=2.47e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 86% 67/78 [12:49<00:57, 5.21s/it, bpd=4.79, g_l=4.79, gn=3.75, l=4.51, p_l=2.47e-5]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 87% 68/78 [12:54<00:52, 5.21s/it, bpd=5.72, g_l=5.72, gn=3.75, l=5.38, p_l=2.5e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 88% 69/78 [12:59<00:46, 5.21s/it, bpd=5.26, g_l=5.26, gn=4.04, l=4.95, p_l=2.51e-5]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 90% 70/78 [13:05<00:41, 5.21s/it, bpd=5.52, g_l=5.52, gn=2.96, l=5.2, p_l=2.58e-5]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 91% 71/78 [13:10<00:36, 5.20s/it, bpd=5.71, g_l=5.71, gn=3.18, l=5.37, p_l=2.47e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 92% 72/78 [13:15<00:31, 5.21s/it, bpd=5.59, g_l=5.59, gn=3.67, l=5.26, p_l=2.62e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 94% 73/78 [13:20<00:26, 5.20s/it, bpd=6.06, g_l=6.06, gn=5.66, l=5.7, p_l=2.82e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 95% 74/78 [13:25<00:20, 5.21s/it, bpd=5.7, g_l=5.7, gn=4.65, l=5.36, p_l=3.01e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 96% 75/78 [13:31<00:15, 
5.20s/it, bpd=5.54, g_l=5.54, gn=6.04, l=5.21, p_l=3.46e-5]/content/gdrive/MyDrive/slon/slon (26).txt\n","100% 78/78 [13:46<00:00, 10.60s/it, bpd=6.06, g_l=6.06, gn=3.6, l=5.71, p_l=7.52e-5]\n","Train bpd: 5.3961 prime_loss: 0.0037 gen_loss: 5.3961 loss: 5.0787 gn: 3.3927 lr: 0.0001 lg_loss_scale: 16.1540 epoch: -1.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:78\u001b[0m\n"," 11% 1/9 [00:01<00:15, 1.90s/it, bpd=5.11, l=4.81]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:12, 1.77s/it, bpd=5.83, l=5.49]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 33% 3/9 [00:04<00:10, 1.68s/it, bpd=5.12, l=4.82]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 44% 4/9 [00:06<00:07, 1.59s/it, bpd=4.32, l=4.07]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:07<00:06, 1.53s/it, bpd=5.3, l=4.99]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 67% 6/9 [00:09<00:04, 1.49s/it, bpd=5.21, l=4.91]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.48s/it, bpd=5.12, l=4.82]\n","Ema bpd: 5.1598 prime_loss: 0.0226 gen_loss: 5.1598 loss: 4.8568 epoch: -1.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (31).txt\n","/content/gdrive/MyDrive/slon/slon (35).txt\n","/content/gdrive/MyDrive/slon/slon (28).txt\n"," 1% 1/78 [00:05<06:45, 5.26s/it, bpd=6.25, g_l=6.25, gn=6.3, l=5.88, p_l=9.38e-5]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 3% 2/78 [00:10<06:36, 5.22s/it, bpd=5.56, g_l=5.56, gn=4.5, l=5.23, p_l=0.000115]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 4% 3/78 [00:15<06:28, 5.18s/it, bpd=4, g_l=4, gn=4.18, l=3.76, p_l=0.000157]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 5% 4/78 [00:20<06:22, 5.16s/it, bpd=5.77, g_l=5.77, gn=4.72, l=5.43, p_l=0.000202]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 6% 5/78 [00:25<06:15, 5.15s/it, bpd=6.38, g_l=6.38, gn=5.57, 
l=6.01, p_l=0.000227]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 8% 6/78 [00:30<06:09, 5.14s/it, bpd=5.47, g_l=5.47, gn=3.42, l=5.15, p_l=0.000237]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 9% 7/78 [00:35<06:05, 5.14s/it, bpd=6.23, g_l=6.23, gn=3.18, l=5.87, p_l=0.000256]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 10% 8/78 [00:41<05:59, 5.14s/it, bpd=5.24, g_l=5.24, gn=4.3, l=4.93, p_l=0.000241]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 12% 9/78 [00:46<05:55, 5.15s/it, bpd=5.18, g_l=5.18, gn=5.43, l=4.87, p_l=0.000219]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 13% 10/78 [00:51<05:49, 5.15s/it, bpd=6.18, g_l=6.18, gn=5.24, l=5.81, p_l=0.000192]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [00:56<05:45, 5.15s/it, bpd=5.02, g_l=5.02, gn=5.99, l=4.72, p_l=0.000181]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 15% 12/78 [01:01<05:40, 5.16s/it, bpd=4.89, g_l=4.89, gn=4.6, l=4.6, p_l=0.000177]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 17% 13/78 [01:06<05:36, 5.17s/it, bpd=5.03, g_l=5.03, gn=4.4, l=4.73, p_l=0.000179]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 18% 14/78 [01:12<05:32, 5.19s/it, bpd=6.2, g_l=6.2, gn=5.1, l=5.83, p_l=0.000205]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 19% 15/78 [01:17<05:27, 5.20s/it, bpd=6.23, g_l=6.23, gn=3.82, l=5.86, p_l=0.00023]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 21% 16/78 [01:22<05:22, 5.20s/it, bpd=5.61, g_l=5.61, gn=5.68, l=5.28, p_l=0.000243]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 22% 17/78 [01:27<05:17, 5.21s/it, bpd=5.99, g_l=5.99, gn=3.65, l=5.64, p_l=0.000261]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 23% 18/78 [01:33<05:12, 5.20s/it, bpd=5.08, g_l=5.08, gn=6.16, l=4.79, p_l=0.000295]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 24% 19/78 [01:38<05:07, 5.22s/it, bpd=5.39, g_l=5.39, gn=4.1, l=5.07, p_l=0.00033]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 26% 20/78 [01:43<05:02, 5.21s/it, bpd=5.44, g_l=5.44, gn=3.45, l=5.12, 
p_l=0.000378]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 27% 21/78 [01:48<04:56, 5.21s/it, bpd=5.21, g_l=5.21, gn=3.72, l=4.91, p_l=0.000454]/content/gdrive/MyDrive/slon/slon (11).txt\n","/usr/local/lib/python3.7/dist-packages/jukebox/utils/ema.py:45: UserWarning: This overload of add_ is deprecated:\n","\tadd_(Number alpha, Tensor other)\n","Consider using one of the following signatures instead:\n","\tadd_(Tensor other, *, Number alpha) (Triggered internally at ../torch/csrc/utils/python_arg_parser.cpp:1174.)\n"," state.mul_(self.mu).add_(1 - self.mu, p.data.float())\n"," 28% 22/78 [01:58<06:16, 6.72s/it, bpd=7.08, g_l=7.08, gn=4.79, l=6.67, p_l=0.000511]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 29% 23/78 [02:04<05:43, 6.25s/it, bpd=5.09, g_l=5.09, gn=4.06, l=4.79, p_l=0.000501]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 31% 24/78 [02:09<05:19, 5.92s/it, bpd=4.61, g_l=4.61, gn=4.38, l=4.34, p_l=0.000457]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 32% 25/78 [02:14<05:02, 5.71s/it, bpd=6.82, g_l=6.82, gn=3.24, l=6.42, p_l=0.000388]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 33% 26/78 [02:19<04:48, 5.56s/it, bpd=5.45, g_l=5.45, gn=4.79, l=5.13, p_l=0.000368]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 35% 27/78 [02:24<04:38, 5.46s/it, bpd=5.15, g_l=5.15, gn=3.89, l=4.85, p_l=0.000399]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 36% 28/78 [02:30<04:29, 5.40s/it, bpd=5.52, g_l=5.52, gn=4.22, l=5.2, p_l=0.000412]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 37% 29/78 [02:35<04:22, 5.35s/it, bpd=6.13, g_l=6.13, gn=4.22, l=5.77, p_l=0.000435]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 38% 30/78 [02:40<04:15, 5.33s/it, bpd=5.22, g_l=5.22, gn=5.68, l=4.91, p_l=0.00052]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 40% 31/78 [02:45<04:08, 5.29s/it, bpd=3.55, g_l=3.55, gn=3.8, l=3.34, p_l=0.00106]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 41% 32/78 [02:51<04:02, 5.26s/it, bpd=5.35, g_l=5.35, gn=5.66, l=5.04, 
p_l=0.00282]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 42% 33/78 [02:56<03:56, 5.25s/it, bpd=4.89, g_l=4.89, gn=4.33, l=4.6, p_l=0.0032]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 44% 34/78 [03:01<03:49, 5.22s/it, bpd=4.97, g_l=4.97, gn=4.2, l=4.67, p_l=0.000316]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 45% 35/78 [03:06<03:44, 5.21s/it, bpd=6.97, g_l=6.97, gn=3.28, l=6.56, p_l=0.000114]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 46% 36/78 [03:11<03:38, 5.20s/it, bpd=5.57, g_l=5.57, gn=4.63, l=5.24, p_l=7.02e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 47% 37/78 [03:17<03:33, 5.20s/it, bpd=6.39, g_l=6.39, gn=4.28, l=6.02, p_l=5.59e-5]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 49% 38/78 [03:22<03:27, 5.19s/it, bpd=5.89, g_l=5.89, gn=5.5, l=5.55, p_l=5.04e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 50% 39/78 [03:27<03:22, 5.18s/it, bpd=5.33, g_l=5.33, gn=3.7, l=5.02, p_l=5.44e-5]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 51% 40/78 [03:32<03:17, 5.19s/it, bpd=6.25, g_l=6.25, gn=4.61, l=5.88, p_l=5.14e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 53% 41/78 [03:37<03:11, 5.18s/it, bpd=5.86, g_l=5.86, gn=7.83, l=5.51, p_l=4.8e-5]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 54% 42/78 [03:42<03:06, 5.19s/it, bpd=7.22, g_l=7.22, gn=5.17, l=6.79, p_l=5.16e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 55% 43/78 [03:48<03:01, 5.19s/it, bpd=5.6, g_l=5.6, gn=5.17, l=5.27, p_l=5.47e-5]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 56% 44/78 [03:53<02:56, 5.19s/it, bpd=5.2, g_l=5.2, gn=4.92, l=4.9, p_l=6.21e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 58% 45/78 [03:58<02:51, 5.19s/it, bpd=6.01, g_l=6.01, gn=3.93, l=5.65, p_l=5.54e-5]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 59% 46/78 [04:03<02:46, 5.19s/it, bpd=5.91, g_l=5.91, gn=6.44, l=5.56, p_l=5.25e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 60% 47/78 [04:08<02:41, 5.21s/it, bpd=5.87, g_l=5.87, gn=6.14, l=5.53, p_l=5.2e-5]/content/gdrive/MyDrive/slon/slon 
(21).txt\n"," 62% 48/78 [04:14<02:36, 5.21s/it, bpd=6.37, g_l=6.37, gn=4.64, l=6, p_l=5.08e-5]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 63% 49/78 [04:19<02:31, 5.22s/it, bpd=5.23, g_l=5.23, gn=6.31, l=4.92, p_l=5.54e-5]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 64% 50/78 [04:24<02:26, 5.22s/it, bpd=6.55, g_l=6.55, gn=4.91, l=6.17, p_l=5.54e-5]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 65% 51/78 [04:29<02:20, 5.20s/it, bpd=4.33, g_l=4.33, gn=4.1, l=4.07, p_l=5.21e-5]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 67% 52/78 [04:35<02:15, 5.21s/it, bpd=7.08, g_l=7.08, gn=4.52, l=6.66, p_l=4.8e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 68% 53/78 [04:40<02:10, 5.21s/it, bpd=4.91, g_l=4.91, gn=6.35, l=4.62, p_l=4.24e-5]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 69% 54/78 [04:45<02:05, 5.22s/it, bpd=6.48, g_l=6.48, gn=5.39, l=6.1, p_l=4.08e-5]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 71% 55/78 [04:50<01:59, 5.21s/it, bpd=6.26, g_l=6.26, gn=4.86, l=5.89, p_l=4.17e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 72% 56/78 [04:55<01:54, 5.20s/it, bpd=5.94, g_l=5.94, gn=6.43, l=5.59, p_l=4.5e-5]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 73% 57/78 [05:01<01:49, 5.19s/it, bpd=5.97, g_l=5.97, gn=6.44, l=5.62, p_l=5.21e-5]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 74% 58/78 [05:06<01:43, 5.20s/it, bpd=5.17, g_l=5.17, gn=5.98, l=4.87, p_l=6.36e-5]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 76% 59/78 [05:11<01:38, 5.20s/it, bpd=4.49, g_l=4.49, gn=11.7, l=4.22, p_l=7.9e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 77% 60/78 [05:16<01:33, 5.20s/it, bpd=5.42, g_l=5.42, gn=4.76, l=5.1, p_l=9.35e-5]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 78% 61/78 [05:21<01:28, 5.20s/it, bpd=5.68, g_l=5.68, gn=4.66, l=5.35, p_l=0.000116]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 79% 62/78 [05:27<01:23, 5.20s/it, bpd=5.5, g_l=5.5, gn=4.52, l=5.18, p_l=0.000134]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 81% 63/78 [05:32<01:17, 
5.19s/it, bpd=4.49, g_l=4.49, gn=5.02, l=4.23, p_l=0.000151]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 82% 64/78 [05:37<01:12, 5.20s/it, bpd=4.48, g_l=4.48, gn=6.08, l=4.21, p_l=0.000162]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 83% 65/78 [05:42<01:07, 5.20s/it, bpd=6.16, g_l=6.16, gn=9.16, l=5.8, p_l=0.000178]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 85% 66/78 [05:47<01:02, 5.20s/it, bpd=4.61, g_l=4.61, gn=4.29, l=4.33, p_l=0.00019]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 86% 67/78 [05:52<00:57, 5.19s/it, bpd=5.35, g_l=5.35, gn=7.31, l=5.03, p_l=0.000202]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 87% 68/78 [05:58<00:51, 5.19s/it, bpd=6.13, g_l=6.13, gn=8.06, l=5.77, p_l=0.000221]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 88% 69/78 [06:03<00:46, 5.19s/it, bpd=5.19, g_l=5.19, gn=4.59, l=4.89, p_l=0.000269]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 90% 70/78 [06:08<00:41, 5.18s/it, bpd=6.73, g_l=6.73, gn=3.92, l=6.33, p_l=0.000298]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 91% 71/78 [06:13<00:36, 5.20s/it, bpd=5.64, g_l=5.64, gn=4.77, l=5.31, p_l=0.000305]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 92% 72/78 [06:18<00:31, 5.20s/it, bpd=5.5, g_l=5.5, gn=5.52, l=5.18, p_l=0.000302]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 94% 73/78 [06:24<00:26, 5.20s/it, bpd=5.4, g_l=5.4, gn=4.04, l=5.08, p_l=0.000305]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 95% 74/78 [06:29<00:20, 5.20s/it, bpd=5.22, g_l=5.22, gn=3.61, l=4.91, p_l=0.000315]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 96% 75/78 [06:34<00:15, 5.20s/it, bpd=4.93, g_l=4.93, gn=4.29, l=4.64, p_l=0.00031]/content/gdrive/MyDrive/slon/slon (27).txt\n","100% 78/78 [06:50<00:00, 5.26s/it, bpd=5.73, g_l=5.73, gn=4.62, l=5.39, p_l=0.000304]\n","Train bpd: 5.6175 prime_loss: 0.0003 gen_loss: 5.6175 loss: 5.2871 gn: 5.0337 lr: 0.0003 lg_loss_scale: 16.4660 epoch: 0.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon 
(9).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (6).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:156\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.03s/it, bpd=4.99, l=4.7]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 22% 2/9 [00:03<00:13, 1.90s/it, bpd=4.92, l=4.63]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:05<00:10, 1.75s/it, bpd=4.3, l=4.05]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 44% 4/9 [00:06<00:08, 1.65s/it, bpd=5.68, l=5.35]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=5.1, l=4.8]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=5.5, l=5.17]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=4.19, l=3.95]\n","Ema bpd: 5.0544 prime_loss: 0.0217 gen_loss: 5.0544 loss: 4.7576 epoch: 0.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (16).txt\n","/content/gdrive/MyDrive/slon/slon (11).txt\n","/content/gdrive/MyDrive/slon/slon (24).txt\n"," 1% 1/78 [00:05<06:51, 5.34s/it, bpd=6.13, g_l=6.13, gn=5.94, l=5.77, p_l=0.000294]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 3% 2/78 [00:10<06:40, 5.27s/it, bpd=5.14, g_l=5.14, gn=7.02, l=4.84, p_l=0.000314]/content/gdrive/MyDrive/slon/slon (26).txt\n","\n","Overflow in backward. 
Loss 6.418869972229004, grad norm inf, lgscale 16.632000000000023, new lgscale 15.632000000000025\n"," 4% 3/78 [00:14<06:13, 4.99s/it, bpd=5.14, g_l=5.14, gn=7.02, l=4.84, p_l=0.000314]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 5% 4/78 [00:19<06:11, 5.01s/it, bpd=4.54, g_l=4.54, gn=11.4, l=4.28, p_l=0.00034]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 6% 5/78 [00:24<06:07, 5.04s/it, bpd=6.27, g_l=6.27, gn=4.44, l=5.9, p_l=0.000347]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 8% 6/78 [00:30<06:05, 5.08s/it, bpd=5.65, g_l=5.65, gn=4.49, l=5.32, p_l=0.000361]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 9% 7/78 [00:35<06:01, 5.09s/it, bpd=4.79, g_l=4.79, gn=5.18, l=4.51, p_l=0.000307]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 10% 8/78 [00:40<05:56, 5.10s/it, bpd=5.12, g_l=5.12, gn=5.62, l=4.82, p_l=0.000291]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 12% 9/78 [00:45<05:52, 5.11s/it, bpd=4.9, g_l=4.9, gn=5.36, l=4.61, p_l=0.000279]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 13% 10/78 [00:50<05:47, 5.12s/it, bpd=4.66, g_l=4.66, gn=3.31, l=4.39, p_l=0.000261]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 14% 11/78 [00:55<05:43, 5.13s/it, bpd=5.46, g_l=5.46, gn=4.33, l=5.14, p_l=0.000233]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 15% 12/78 [01:00<05:39, 5.14s/it, bpd=5.52, g_l=5.52, gn=4.93, l=5.19, p_l=0.000236]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 17% 13/78 [01:06<05:34, 5.14s/it, bpd=5.05, g_l=5.05, gn=3.77, l=4.75, p_l=0.000234]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 18% 14/78 [01:11<05:29, 5.15s/it, bpd=5.23, g_l=5.23, gn=5.33, l=4.92, p_l=0.000234]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 19% 15/78 [01:16<05:24, 5.16s/it, bpd=4.33, g_l=4.33, gn=5.21, l=4.07, p_l=0.000226]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 21% 16/78 [01:21<05:20, 5.17s/it, bpd=5.4, g_l=5.4, gn=4.1, l=5.08, p_l=0.000195]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 22% 17/78 [01:26<05:15, 5.18s/it, bpd=5.31, g_l=5.31, gn=3.59, 
l=4.99, p_l=0.000164]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 23% 18/78 [01:32<05:11, 5.19s/it, bpd=5.28, g_l=5.28, gn=4.03, l=4.97, p_l=0.000143]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 24% 19/78 [01:37<05:06, 5.20s/it, bpd=6.15, g_l=6.15, gn=4.59, l=5.79, p_l=0.000124]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 26% 20/78 [01:42<05:01, 5.20s/it, bpd=4.88, g_l=4.88, gn=8.98, l=4.59, p_l=0.00011]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 27% 21/78 [01:47<04:56, 5.20s/it, bpd=5.78, g_l=5.78, gn=5.15, l=5.44, p_l=0.000104]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 28% 22/78 [01:52<04:51, 5.20s/it, bpd=6.74, g_l=6.74, gn=4.8, l=6.34, p_l=9.98e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 29% 23/78 [01:58<04:46, 5.21s/it, bpd=5.47, g_l=5.47, gn=4.47, l=5.15, p_l=9.29e-5]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 31% 24/78 [02:03<04:40, 5.20s/it, bpd=4.91, g_l=4.91, gn=6.53, l=4.62, p_l=9.04e-5]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 32% 25/78 [02:08<04:35, 5.20s/it, bpd=5.03, g_l=5.03, gn=5.5, l=4.73, p_l=9.23e-5]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 33% 26/78 [02:13<04:29, 5.19s/it, bpd=5.23, g_l=5.23, gn=5.24, l=4.92, p_l=9.52e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 35% 27/78 [02:18<04:23, 5.17s/it, bpd=4.67, g_l=4.67, gn=7.79, l=4.4, p_l=0.000106]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 36% 28/78 [02:23<04:19, 5.18s/it, bpd=5.55, g_l=5.55, gn=3.36, l=5.22, p_l=0.000119]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 37% 29/78 [02:29<04:13, 5.17s/it, bpd=5.45, g_l=5.45, gn=4.87, l=5.13, p_l=0.000146]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 38% 30/78 [02:34<04:08, 5.18s/it, bpd=5.75, g_l=5.75, gn=7.91, l=5.41, p_l=0.00014]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 40% 31/78 [02:39<04:03, 5.18s/it, bpd=5.5, g_l=5.5, gn=5.02, l=5.18, p_l=0.000131]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 41% 32/78 [02:44<03:57, 5.17s/it, bpd=5.53, g_l=5.53, gn=4.94, l=5.2, 
p_l=0.000133]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 42% 33/78 [02:49<03:52, 5.17s/it, bpd=6.09, g_l=6.09, gn=5.6, l=5.73, p_l=0.000131]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 44% 34/78 [02:55<03:47, 5.18s/it, bpd=7.03, g_l=7.03, gn=4.4, l=6.62, p_l=0.000126]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 45% 35/78 [03:00<03:43, 5.19s/it, bpd=6.57, g_l=6.57, gn=3.17, l=6.19, p_l=0.000109]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 46% 36/78 [03:05<03:37, 5.19s/it, bpd=6.22, g_l=6.22, gn=3.91, l=5.85, p_l=0.000113]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 47% 37/78 [03:10<03:32, 5.19s/it, bpd=5.67, g_l=5.67, gn=3.6, l=5.34, p_l=0.000124]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 49% 38/78 [03:15<03:27, 5.19s/it, bpd=5.93, g_l=5.93, gn=6.74, l=5.58, p_l=0.000135]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 50% 39/78 [03:20<03:22, 5.19s/it, bpd=6.81, g_l=6.81, gn=4.62, l=6.41, p_l=0.000142]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 51% 40/78 [03:26<03:17, 5.20s/it, bpd=6.88, g_l=6.88, gn=3.37, l=6.47, p_l=0.00014]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 53% 41/78 [03:31<03:12, 5.21s/it, bpd=6.57, g_l=6.57, gn=3.38, l=6.18, p_l=0.000147]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 54% 42/78 [03:36<03:07, 5.21s/it, bpd=5.39, g_l=5.39, gn=4.26, l=5.07, p_l=0.000145]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 55% 43/78 [03:41<03:02, 5.21s/it, bpd=6.08, g_l=6.08, gn=3.44, l=5.72, p_l=0.000141]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 56% 44/78 [03:47<02:56, 5.20s/it, bpd=5.38, g_l=5.38, gn=4.18, l=5.06, p_l=0.000135]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 58% 45/78 [03:57<03:39, 6.66s/it, bpd=5.77, g_l=5.77, gn=5.34, l=5.43, p_l=0.00013]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 59% 46/78 [04:02<03:18, 6.21s/it, bpd=5.7, g_l=5.7, gn=4.52, l=5.37, p_l=0.000106]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 60% 47/78 [04:07<03:02, 5.90s/it, bpd=6.55, g_l=6.55, gn=5.88, l=6.17, 
p_l=8.86e-5]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 62% 48/78 [04:12<02:50, 5.69s/it, bpd=5.22, g_l=5.22, gn=3.83, l=4.91, p_l=7.44e-5]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 63% 49/78 [04:17<02:40, 5.54s/it, bpd=6.96, g_l=6.96, gn=3.9, l=6.55, p_l=6.93e-5]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 64% 50/78 [04:23<02:32, 5.44s/it, bpd=5.65, g_l=5.65, gn=3.96, l=5.32, p_l=7.04e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 65% 51/78 [04:28<02:25, 5.39s/it, bpd=6.88, g_l=6.88, gn=4.03, l=6.48, p_l=7.47e-5]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 67% 52/78 [04:33<02:19, 5.35s/it, bpd=5.23, g_l=5.23, gn=3.68, l=4.92, p_l=6.61e-5]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 68% 53/78 [04:38<02:12, 5.32s/it, bpd=6.03, g_l=6.03, gn=3.55, l=5.68, p_l=6.27e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 69% 54/78 [04:44<02:06, 5.28s/it, bpd=5.79, g_l=5.79, gn=4.55, l=5.45, p_l=6.35e-5]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 71% 55/78 [04:49<02:01, 5.26s/it, bpd=5.39, g_l=5.39, gn=3.95, l=5.07, p_l=6.46e-5]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 72% 56/78 [04:54<01:55, 5.25s/it, bpd=5.51, g_l=5.51, gn=3.82, l=5.18, p_l=6.11e-5]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 73% 57/78 [04:59<01:49, 5.22s/it, bpd=5.33, g_l=5.33, gn=3.39, l=5.01, p_l=5.65e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 74% 58/78 [05:04<01:44, 5.21s/it, bpd=4.78, g_l=4.78, gn=4.24, l=4.5, p_l=5.34e-5]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 76% 59/78 [05:09<01:38, 5.20s/it, bpd=5.72, g_l=5.72, gn=3.66, l=5.39, p_l=5e-5]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 77% 60/78 [05:15<01:33, 5.19s/it, bpd=4.73, g_l=4.73, gn=6.02, l=4.45, p_l=5.13e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 78% 61/78 [05:20<01:28, 5.18s/it, bpd=6.54, g_l=6.54, gn=4.84, l=6.16, p_l=5.98e-5]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 79% 62/78 [05:25<01:22, 5.17s/it, bpd=5.23, g_l=5.23, gn=3.71, l=4.92, 
p_l=6.67e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 81% 63/78 [05:30<01:17, 5.19s/it, bpd=6.39, g_l=6.39, gn=3.54, l=6.02, p_l=6.7e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 82% 64/78 [05:35<01:12, 5.19s/it, bpd=5.22, g_l=5.22, gn=3.22, l=4.91, p_l=6.04e-5]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 83% 65/78 [05:41<01:07, 5.20s/it, bpd=4.86, g_l=4.86, gn=5.95, l=4.57, p_l=5.08e-5]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 85% 66/78 [05:46<01:02, 5.20s/it, bpd=5.4, g_l=5.4, gn=3.64, l=5.09, p_l=4.11e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n","\n","Overflow in backward. Loss 4.498471260070801, grad norm nan, lgscale 15.884000000000032, new lgscale 14.884000000000032\n"," 86% 67/78 [05:50<00:54, 4.96s/it, bpd=5.4, g_l=5.4, gn=3.64, l=5.09, p_l=4.11e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 87% 68/78 [05:55<00:50, 5.03s/it, bpd=5.73, g_l=5.73, gn=5.38, l=5.39, p_l=3.6e-5]/content/gdrive/MyDrive/slon/slon (3).txt\n","\n","Overflow in backward. Loss 5.061788558959961, grad norm nan, lgscale 14.888000000000034, new lgscale 13.888000000000034\n"," 88% 69/78 [06:00<00:43, 4.85s/it, bpd=5.73, g_l=5.73, gn=5.38, l=5.39, p_l=3.6e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 90% 70/78 [06:05<00:39, 4.95s/it, bpd=6.91, g_l=6.91, gn=9.03, l=6.5, p_l=3.27e-5]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 91% 71/78 [06:10<00:35, 5.02s/it, bpd=5.5, g_l=5.5, gn=3.51, l=5.18, p_l=2.97e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 92% 72/78 [06:15<00:30, 5.07s/it, bpd=6.55, g_l=6.55, gn=4.78, l=6.16, p_l=2.75e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 94% 73/78 [06:21<00:25, 5.12s/it, bpd=6.17, g_l=6.17, gn=5.27, l=5.81, p_l=2.33e-5]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 95% 74/78 [06:26<00:20, 5.14s/it, bpd=5.79, g_l=5.79, gn=3.09, l=5.45, p_l=2.02e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 96% 75/78 [06:31<00:15, 5.17s/it, bpd=5.68, g_l=5.68, gn=4.87, l=5.34, p_l=1.61e-5]/content/gdrive/MyDrive/slon/slon 
(17).txt\n","100% 78/78 [06:47<00:00, 5.22s/it, bpd=5.28, g_l=5.28, gn=5.15, l=4.97, p_l=8.22e-6]\n","Train bpd: 5.6595 prime_loss: 0.0001 gen_loss: 5.6595 loss: 5.3266 gn: 4.8242 lr: 0.0003 lg_loss_scale: 15.5453 epoch: 1.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:231\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.03s/it, bpd=5.26, l=4.95]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 22% 2/9 [00:03<00:13, 1.88s/it, bpd=5.05, l=4.75]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:04<00:10, 1.73s/it, bpd=4.32, l=4.07]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 44% 4/9 [00:06<00:08, 1.63s/it, bpd=5.21, l=4.9]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:07<00:06, 1.56s/it, bpd=5.11, l=4.81]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 67% 6/9 [00:09<00:04, 1.51s/it, bpd=4.93, l=4.64]/content/gdrive/MyDrive/slon/slon (6).txt\n","100% 9/9 [00:13<00:00, 1.49s/it, bpd=5.29, l=4.98]\n","Ema bpd: 4.9693 prime_loss: 0.0209 gen_loss: 4.9693 loss: 4.6775 epoch: 1.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (16).txt\n","/content/gdrive/MyDrive/slon/slon (25).txt\n","/content/gdrive/MyDrive/slon/slon (31).txt\n"," 1% 1/78 [00:05<06:49, 5.32s/it, bpd=5.16, g_l=5.16, gn=3.4, l=4.85, p_l=7.6e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 3% 2/78 [00:10<06:41, 5.28s/it, bpd=5.71, g_l=5.71, gn=4.2, l=5.37, p_l=7.69e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 4% 3/78 [00:15<06:35, 5.28s/it, bpd=5.57, g_l=5.57, gn=6.58, l=5.24, p_l=8.2e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 5% 4/78 [00:21<06:30, 5.27s/it, bpd=5.13, g_l=5.13, gn=7.14, l=4.83, p_l=9.21e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 6% 5/78 [00:26<06:25, 5.28s/it, bpd=5.25, g_l=5.25, gn=4.73, l=4.94, p_l=9.52e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 8% 6/78 [00:31<06:20, 
5.28s/it, bpd=6.8, g_l=6.8, gn=4.63, l=6.4, p_l=1.02e-5]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 9% 7/78 [00:36<06:13, 5.26s/it, bpd=5.64, g_l=5.64, gn=13.6, l=5.31, p_l=1.07e-5]/content/gdrive/MyDrive/slon/slon (32).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:239\u001b[0m\n"," 10% 8/78 [01:16<18:16, 15.66s/it, bpd=5.13, g_l=5.13, gn=4.1, l=4.82, p_l=1.13e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 12% 9/78 [01:22<14:28, 12.58s/it, bpd=6.19, g_l=6.19, gn=4.18, l=5.83, p_l=1.18e-5]/content/gdrive/MyDrive/slon/slon (4).txt\n","\n","Overflow in backward. Loss 4.9994683265686035, grad norm nan, lgscale 13.960000000000036, new lgscale 12.960000000000036\n"," 13% 10/78 [01:26<11:27, 10.12s/it, bpd=6.19, g_l=6.19, gn=4.18, l=5.83, p_l=1.18e-5]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 14% 11/78 [01:31<09:42, 8.69s/it, bpd=5.12, g_l=5.12, gn=3.36, l=4.82, p_l=1.26e-5]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 15% 12/78 [01:37<08:27, 7.69s/it, bpd=4.9, g_l=4.9, gn=3.93, l=4.61, p_l=1.3e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 17% 13/78 [01:42<07:38, 7.05s/it, bpd=4.98, g_l=4.98, gn=3.72, l=4.69, p_l=1.35e-5]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 18% 14/78 [01:48<07:01, 6.59s/it, bpd=6.29, g_l=6.29, gn=6.51, l=5.92, p_l=1.52e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 19% 15/78 [01:53<06:34, 6.26s/it, bpd=5.55, g_l=5.55, gn=6.17, l=5.23, p_l=1.69e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 21% 16/78 [01:59<06:11, 5.99s/it, bpd=6.19, g_l=6.19, gn=4.57, l=5.83, p_l=1.9e-5]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 22% 17/78 [02:04<05:53, 5.80s/it, bpd=5.79, g_l=5.79, gn=4, l=5.45, p_l=2.18e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 23% 18/78 [02:09<05:39, 5.66s/it, bpd=6.99, g_l=6.99, gn=4.99, l=6.58, p_l=2.44e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 24% 19/78 [02:15<05:26, 5.54s/it, bpd=5.26, g_l=5.26, gn=4.72, l=4.95, p_l=2.77e-5]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 26% 
20/78 [02:20<05:17, 5.47s/it, bpd=5.41, g_l=5.41, gn=5.25, l=5.09, p_l=3.16e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 27% 21/78 [02:25<05:05, 5.36s/it, bpd=4.73, g_l=4.73, gn=6.44, l=4.45, p_l=3.6e-5]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 28% 22/78 [02:30<04:55, 5.28s/it, bpd=6.55, g_l=6.55, gn=4.28, l=6.17, p_l=4.18e-5]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 29% 23/78 [02:35<04:49, 5.26s/it, bpd=7.01, g_l=7.01, gn=3.41, l=6.6, p_l=5.05e-5]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 31% 24/78 [02:40<04:41, 5.21s/it, bpd=6.29, g_l=6.29, gn=5.68, l=5.92, p_l=5.77e-5]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 32% 25/78 [02:46<04:36, 5.21s/it, bpd=5.01, g_l=5.01, gn=4.4, l=4.72, p_l=6.43e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 33% 26/78 [02:51<04:30, 5.21s/it, bpd=6.2, g_l=6.2, gn=4.58, l=5.83, p_l=7.03e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 35% 27/78 [02:56<04:26, 5.23s/it, bpd=6.64, g_l=6.64, gn=4.67, l=6.25, p_l=8.01e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 36% 28/78 [03:01<04:22, 5.24s/it, bpd=5.32, g_l=5.32, gn=5.98, l=5.01, p_l=9.47e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 37% 29/78 [03:07<04:17, 5.26s/it, bpd=5.31, g_l=5.31, gn=4.4, l=5, p_l=0.000112]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 38% 30/78 [03:12<04:14, 5.29s/it, bpd=6.18, g_l=6.18, gn=3.76, l=5.82, p_l=0.000131]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 40% 31/78 [03:17<04:09, 5.30s/it, bpd=6.44, g_l=6.44, gn=4.73, l=6.06, p_l=0.000157]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 41% 32/78 [03:23<04:04, 5.30s/it, bpd=5.1, g_l=5.1, gn=4.48, l=4.8, p_l=0.000176]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 42% 33/78 [03:28<03:57, 5.29s/it, bpd=5.59, g_l=5.59, gn=4.46, l=5.26, p_l=0.000195]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 44% 34/78 [03:33<03:52, 5.28s/it, bpd=5.62, g_l=5.62, gn=3.95, l=5.29, p_l=0.00024]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 45% 35/78 [03:38<03:46, 5.28s/it, bpd=5.87, 
g_l=5.87, gn=4.91, l=5.53, p_l=0.000279]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 46% 36/78 [03:44<03:40, 5.26s/it, bpd=5.55, g_l=5.55, gn=3.71, l=5.22, p_l=0.000305]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 47% 37/78 [03:49<03:36, 5.27s/it, bpd=5.39, g_l=5.39, gn=4.96, l=5.07, p_l=0.000318]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 49% 38/78 [03:54<03:29, 5.24s/it, bpd=6.23, g_l=6.23, gn=4.74, l=5.86, p_l=0.000322]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 50% 39/78 [03:59<03:23, 5.23s/it, bpd=6.61, g_l=6.61, gn=4.8, l=6.22, p_l=0.000363]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 51% 40/78 [04:05<03:17, 5.21s/it, bpd=5.54, g_l=5.54, gn=4.11, l=5.22, p_l=0.000451]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 53% 41/78 [04:10<03:12, 5.19s/it, bpd=5.94, g_l=5.94, gn=3.44, l=5.59, p_l=0.000679]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 54% 42/78 [04:15<03:06, 5.18s/it, bpd=5.7, g_l=5.7, gn=3.98, l=5.36, p_l=0.000876]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 55% 43/78 [04:20<03:00, 5.17s/it, bpd=5.76, g_l=5.76, gn=3.5, l=5.42, p_l=0.000879]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 56% 44/78 [04:25<02:56, 5.18s/it, bpd=7.44, g_l=7.44, gn=4.06, l=7, p_l=0.000655]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 58% 45/78 [04:30<02:51, 5.19s/it, bpd=5.36, g_l=5.36, gn=3.2, l=5.05, p_l=0.000525]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 59% 46/78 [04:36<02:46, 5.19s/it, bpd=5.7, g_l=5.7, gn=4.1, l=5.37, p_l=0.000449]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 60% 47/78 [04:41<02:40, 5.19s/it, bpd=6.86, g_l=6.86, gn=4.14, l=6.46, p_l=0.000424]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 62% 48/78 [04:46<02:35, 5.19s/it, bpd=6.64, g_l=6.64, gn=3.92, l=6.25, p_l=0.000433]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 63% 49/78 [04:51<02:31, 5.21s/it, bpd=5.91, g_l=5.91, gn=5, l=5.56, p_l=0.000426]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 64% 50/78 [04:56<02:25, 5.21s/it, bpd=5.2, g_l=5.2, gn=10.5, l=4.89, 
p_l=0.000426]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 65% 51/78 [05:02<02:21, 5.22s/it, bpd=5.52, g_l=5.52, gn=4.59, l=5.2, p_l=0.000589]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 67% 52/78 [05:07<02:15, 5.22s/it, bpd=5.68, g_l=5.68, gn=4.62, l=5.34, p_l=0.000819]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 68% 53/78 [05:12<02:10, 5.21s/it, bpd=6.58, g_l=6.58, gn=4.69, l=6.19, p_l=0.00164]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 69% 54/78 [05:17<02:04, 5.21s/it, bpd=5.79, g_l=5.79, gn=3.63, l=5.45, p_l=0.00172]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 71% 55/78 [05:22<01:59, 5.20s/it, bpd=6.64, g_l=6.64, gn=16.9, l=6.25, p_l=0.00108]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 72% 56/78 [05:28<01:54, 5.21s/it, bpd=5.25, g_l=5.25, gn=4.14, l=4.94, p_l=0.000766]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 73% 57/78 [05:33<01:49, 5.21s/it, bpd=5.83, g_l=5.83, gn=3.87, l=5.48, p_l=0.000452]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 74% 58/78 [05:38<01:43, 5.20s/it, bpd=5.07, g_l=5.07, gn=4.33, l=4.78, p_l=0.000277]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 76% 59/78 [05:43<01:38, 5.19s/it, bpd=4.66, g_l=4.66, gn=4.4, l=4.38, p_l=0.000167]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 77% 60/78 [05:48<01:33, 5.18s/it, bpd=4.31, g_l=4.31, gn=3.63, l=4.05, p_l=0.000103]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 78% 61/78 [05:54<01:28, 5.19s/it, bpd=5.3, g_l=5.3, gn=5.28, l=4.99, p_l=6.27e-5]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 79% 62/78 [05:59<01:23, 5.19s/it, bpd=4.49, g_l=4.49, gn=23.4, l=4.22, p_l=3.86e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 81% 63/78 [06:04<01:18, 5.20s/it, bpd=5.27, g_l=5.27, gn=4.79, l=4.96, p_l=2.2e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 82% 64/78 [06:09<01:12, 5.20s/it, bpd=5.93, g_l=5.93, gn=7.06, l=5.58, p_l=1.12e-5]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 83% 65/78 [06:14<01:07, 5.19s/it, bpd=5.05, g_l=5.05, gn=4.06, l=4.76, 
p_l=6.14e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 85% 66/78 [06:20<01:02, 5.19s/it, bpd=6.7, g_l=6.7, gn=4.6, l=6.31, p_l=4.44e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 86% 67/78 [06:25<00:57, 5.18s/it, bpd=5.81, g_l=5.81, gn=4.1, l=5.47, p_l=2.97e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 87% 68/78 [06:30<00:51, 5.19s/it, bpd=5.32, g_l=5.32, gn=4.34, l=5, p_l=1.9e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 88% 69/78 [06:35<00:46, 5.19s/it, bpd=5.44, g_l=5.44, gn=5.36, l=5.12, p_l=1.2e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 90% 70/78 [06:43<00:47, 5.96s/it, bpd=5.01, g_l=5.01, gn=5.35, l=4.72, p_l=7.06e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 91% 71/78 [06:48<00:39, 5.70s/it, bpd=5.34, g_l=5.34, gn=4.23, l=5.03, p_l=4.3e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 92% 72/78 [06:53<00:33, 5.54s/it, bpd=4.46, g_l=4.46, gn=4.68, l=4.2, p_l=2.77e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 94% 73/78 [06:58<00:27, 5.43s/it, bpd=6.39, g_l=6.39, gn=4.56, l=6.01, p_l=2.07e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 95% 74/78 [07:04<00:21, 5.36s/it, bpd=5.55, g_l=5.55, gn=4.12, l=5.22, p_l=1.44e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 96% 75/78 [07:09<00:15, 5.32s/it, bpd=5.56, g_l=5.56, gn=4.5, l=5.23, p_l=1.12e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n","100% 78/78 [07:25<00:00, 5.71s/it, bpd=4.88, g_l=4.88, gn=6.68, l=4.59, p_l=1.16e-7]\n","Train bpd: 5.6597 prime_loss: 0.0002 gen_loss: 5.6597 loss: 5.3268 gn: 5.1798 lr: 0.0003 lg_loss_scale: 13.1929 epoch: 2.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:308\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.04s/it, bpd=5.11, l=4.81]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 22% 2/9 [00:03<00:13, 1.89s/it, bpd=4.96, l=4.67]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 
[00:04<00:10, 1.74s/it, bpd=4.45, l=4.18]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 4/9 [00:06<00:08, 1.64s/it, bpd=5.77, l=5.44]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=4.6, l=4.33]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=4.9, l=4.61]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=5.2, l=4.9]\n","Ema bpd: 4.9763 prime_loss: 0.0200 gen_loss: 4.9763 loss: 4.6841 epoch: 2.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (17).txt\n","/content/gdrive/MyDrive/slon/slon (25).txt\n","/content/gdrive/MyDrive/slon/slon (4).txt\n"," 1% 1/78 [00:05<07:03, 5.50s/it, bpd=5.59, g_l=5.59, gn=4.95, l=5.26, p_l=1.42e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 3% 2/78 [00:10<06:50, 5.41s/it, bpd=5.76, g_l=5.76, gn=3.73, l=5.43, p_l=2.55e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 4% 3/78 [00:15<06:41, 5.36s/it, bpd=5.4, g_l=5.4, gn=4.49, l=5.08, p_l=4.7e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 5% 4/78 [00:21<06:34, 5.33s/it, bpd=5.52, g_l=5.52, gn=4.27, l=5.19, p_l=5.9e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 6% 5/78 [00:26<06:28, 5.32s/it, bpd=4.81, g_l=4.81, gn=5.27, l=4.53, p_l=5.18e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 8% 6/78 [00:31<06:21, 5.30s/it, bpd=5.25, g_l=5.25, gn=4.67, l=4.94, p_l=4e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 9% 7/78 [00:37<06:15, 5.29s/it, bpd=5.07, g_l=5.07, gn=3.48, l=4.77, p_l=3.45e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 10% 8/78 [00:42<06:09, 5.27s/it, bpd=4.35, g_l=4.35, gn=4.25, l=4.1, p_l=2.36e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 12% 9/78 [00:47<06:02, 5.25s/it, bpd=5.4, g_l=5.4, gn=4.39, l=5.08, p_l=1.68e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 13% 10/78 [00:52<05:55, 5.23s/it, bpd=6.75, g_l=6.75, gn=4.87, l=6.36, p_l=1.5e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [00:57<05:49, 5.22s/it, bpd=5.56, 
g_l=5.56, gn=6.36, l=5.24, p_l=1.45e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 15% 12/78 [01:02<05:43, 5.21s/it, bpd=5.43, g_l=5.43, gn=4.6, l=5.12, p_l=1.59e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 17% 13/78 [01:08<05:37, 5.19s/it, bpd=5.5, g_l=5.5, gn=4.92, l=5.18, p_l=1.68e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 18% 14/78 [01:13<05:31, 5.18s/it, bpd=5.72, g_l=5.72, gn=5.64, l=5.38, p_l=1.93e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 19% 15/78 [01:18<05:25, 5.17s/it, bpd=5.32, g_l=5.32, gn=9.32, l=5.01, p_l=2.12e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 21% 16/78 [01:23<05:19, 5.16s/it, bpd=6.09, g_l=6.09, gn=6.31, l=5.73, p_l=2.36e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 22% 17/78 [01:28<05:15, 5.18s/it, bpd=5.12, g_l=5.12, gn=5.35, l=4.82, p_l=2.61e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 23% 18/78 [01:33<05:10, 5.17s/it, bpd=4.49, g_l=4.49, gn=3.62, l=4.22, p_l=2.91e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 24% 19/78 [01:39<05:05, 5.18s/it, bpd=5.44, g_l=5.44, gn=5.68, l=5.12, p_l=3.52e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 26% 20/78 [01:44<05:00, 5.19s/it, bpd=6.72, g_l=6.72, gn=4.12, l=6.33, p_l=4.22e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 27% 21/78 [01:49<04:56, 5.20s/it, bpd=5.25, g_l=5.25, gn=5.57, l=4.94, p_l=5.11e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 28% 22/78 [01:54<04:50, 5.20s/it, bpd=5.5, g_l=5.5, gn=4.91, l=5.17, p_l=6.2e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 29% 23/78 [02:00<04:46, 5.20s/it, bpd=5.89, g_l=5.89, gn=4.98, l=5.54, p_l=7.09e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 31% 24/78 [02:05<04:41, 5.22s/it, bpd=6.38, g_l=6.38, gn=3.88, l=6, p_l=8.17e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 32% 25/78 [02:10<04:36, 5.22s/it, bpd=4.87, g_l=4.87, gn=4.04, l=4.59, p_l=8.82e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 33% 26/78 [02:15<04:31, 5.22s/it, bpd=5.17, g_l=5.17, gn=5.35, l=4.87, 
p_l=9.57e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 35% 27/78 [02:20<04:26, 5.22s/it, bpd=6.09, g_l=6.09, gn=4.63, l=5.73, p_l=9.99e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 36% 28/78 [02:26<04:20, 5.21s/it, bpd=4.19, g_l=4.19, gn=3.87, l=3.94, p_l=1e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 37% 29/78 [02:31<04:15, 5.21s/it, bpd=4.64, g_l=4.64, gn=3.23, l=4.36, p_l=1.02e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 38% 30/78 [02:36<04:09, 5.20s/it, bpd=6.37, g_l=6.37, gn=4.29, l=5.99, p_l=1.04e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 40% 31/78 [02:41<04:04, 5.20s/it, bpd=6.06, g_l=6.06, gn=5.31, l=5.7, p_l=1.18e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 41% 32/78 [02:46<03:58, 5.19s/it, bpd=6.99, g_l=6.99, gn=4.44, l=6.58, p_l=1.4e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 42% 33/78 [02:52<03:53, 5.19s/it, bpd=5.12, g_l=5.12, gn=3.79, l=4.82, p_l=1.74e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 44% 34/78 [02:57<03:48, 5.19s/it, bpd=5.55, g_l=5.55, gn=4.3, l=5.22, p_l=2.15e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 45% 35/78 [03:02<03:42, 5.18s/it, bpd=6.42, g_l=6.42, gn=3.78, l=6.04, p_l=2.39e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 46% 36/78 [03:07<03:37, 5.18s/it, bpd=5.81, g_l=5.81, gn=3.68, l=5.47, p_l=2.4e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 47% 37/78 [03:12<03:32, 5.18s/it, bpd=5.02, g_l=5.02, gn=6.92, l=4.72, p_l=2.5e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 49% 38/78 [03:17<03:26, 5.17s/it, bpd=6.12, g_l=6.12, gn=4.05, l=5.76, p_l=2.45e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 50% 39/78 [03:23<03:21, 5.17s/it, bpd=5.36, g_l=5.36, gn=3.94, l=5.05, p_l=2.67e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 51% 40/78 [03:28<03:16, 5.16s/it, bpd=5.12, g_l=5.12, gn=4.11, l=4.82, p_l=2.63e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 53% 41/78 [03:33<03:11, 5.18s/it, bpd=5.66, g_l=5.66, gn=3.77, l=5.33, p_l=2.55e-6]/content/gdrive/MyDrive/slon/slon 
(11).txt\n"," 54% 42/78 [03:38<03:06, 5.17s/it, bpd=5.25, g_l=5.25, gn=3.67, l=4.94, p_l=2.43e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 55% 43/78 [03:43<03:01, 5.18s/it, bpd=5.6, g_l=5.6, gn=5.13, l=5.27, p_l=2.39e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 56% 44/78 [03:48<02:56, 5.18s/it, bpd=5.27, g_l=5.27, gn=5.07, l=4.96, p_l=2.48e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 58% 45/78 [03:54<02:50, 5.18s/it, bpd=5.53, g_l=5.53, gn=5.28, l=5.21, p_l=2.37e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 59% 46/78 [03:59<02:46, 5.19s/it, bpd=4.89, g_l=4.89, gn=5.38, l=4.6, p_l=2.11e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 60% 47/78 [04:04<02:40, 5.19s/it, bpd=4.39, g_l=4.39, gn=9.18, l=4.13, p_l=1.99e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 62% 48/78 [04:09<02:35, 5.20s/it, bpd=5.24, g_l=5.24, gn=4.16, l=4.94, p_l=1.88e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 63% 49/78 [04:14<02:30, 5.19s/it, bpd=5.38, g_l=5.38, gn=4.44, l=5.07, p_l=1.95e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 64% 50/78 [04:20<02:25, 5.19s/it, bpd=6.85, g_l=6.85, gn=5.17, l=6.45, p_l=2.12e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 65% 51/78 [04:25<02:19, 5.18s/it, bpd=5.52, g_l=5.52, gn=4.58, l=5.2, p_l=2.15e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 67% 52/78 [04:30<02:14, 5.17s/it, bpd=4.17, g_l=4.17, gn=34.4, l=3.92, p_l=1.95e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 68% 53/78 [04:35<02:09, 5.20s/it, bpd=5.44, g_l=5.44, gn=7.17, l=5.12, p_l=1.85e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 69% 54/78 [04:40<02:04, 5.20s/it, bpd=5.37, g_l=5.37, gn=4.02, l=5.06, p_l=1.76e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 71% 55/78 [04:46<01:59, 5.20s/it, bpd=4.9, g_l=4.9, gn=4.74, l=4.61, p_l=1.73e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 72% 56/78 [04:51<01:54, 5.20s/it, bpd=4.85, g_l=4.85, gn=11.2, l=4.57, p_l=1.77e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 73% 57/78 [04:56<01:49, 
5.20s/it, bpd=5.41, g_l=5.41, gn=3.12, l=5.09, p_l=1.8e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 74% 58/78 [05:01<01:44, 5.21s/it, bpd=5.39, g_l=5.39, gn=4.36, l=5.08, p_l=1.9e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 76% 59/78 [05:06<01:38, 5.21s/it, bpd=6.35, g_l=6.35, gn=3.99, l=5.98, p_l=1.99e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 77% 60/78 [05:12<01:33, 5.21s/it, bpd=4.9, g_l=4.9, gn=3.02, l=4.61, p_l=2.18e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 78% 61/78 [05:17<01:28, 5.21s/it, bpd=5.42, g_l=5.42, gn=3.52, l=5.1, p_l=2.33e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 79% 62/78 [05:22<01:23, 5.20s/it, bpd=6.66, g_l=6.66, gn=3.07, l=6.27, p_l=2.46e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 81% 63/78 [05:27<01:17, 5.20s/it, bpd=5.89, g_l=5.89, gn=3.74, l=5.54, p_l=2.55e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 82% 64/78 [05:32<01:12, 5.20s/it, bpd=4.38, g_l=4.38, gn=5.08, l=4.12, p_l=2.53e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 83% 65/78 [05:38<01:07, 5.20s/it, bpd=5.72, g_l=5.72, gn=3.7, l=5.39, p_l=2.71e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 85% 66/78 [05:43<01:02, 5.20s/it, bpd=3.6, g_l=3.6, gn=4.19, l=3.39, p_l=2.76e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 86% 67/78 [05:48<00:57, 5.20s/it, bpd=5.81, g_l=5.81, gn=3.17, l=5.47, p_l=2.91e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 87% 68/78 [05:53<00:52, 5.20s/it, bpd=4.92, g_l=4.92, gn=3.4, l=4.63, p_l=2.93e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 88% 69/78 [05:58<00:46, 5.20s/it, bpd=4.7, g_l=4.7, gn=3.6, l=4.42, p_l=2.97e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 90% 70/78 [06:04<00:41, 5.20s/it, bpd=5.74, g_l=5.74, gn=3.43, l=5.41, p_l=2.86e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 91% 71/78 [06:09<00:36, 5.19s/it, bpd=5.45, g_l=5.45, gn=3.41, l=5.13, p_l=2.84e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 92% 72/78 [06:14<00:31, 5.20s/it, bpd=6.21, g_l=6.21, gn=3.41, l=5.84, 
p_l=2.79e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 94% 73/78 [06:19<00:25, 5.20s/it, bpd=4.9, g_l=4.9, gn=4.51, l=4.61, p_l=2.91e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 95% 74/78 [06:24<00:20, 5.19s/it, bpd=5.81, g_l=5.81, gn=3.2, l=5.47, p_l=2.85e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 96% 75/78 [06:30<00:15, 5.19s/it, bpd=4.97, g_l=4.97, gn=3.43, l=4.68, p_l=2.69e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n","100% 78/78 [06:45<00:00, 5.20s/it, bpd=6.51, g_l=6.51, gn=3.3, l=6.13, p_l=2.2e-6]\n","Train bpd: 5.4786 prime_loss: 0.0000 gen_loss: 5.4786 loss: 5.1563 gn: 4.9503 lr: 0.0003 lg_loss_scale: 13.3860 epoch: 3.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:386\u001b[0m\n"," 11% 1/9 [00:01<00:13, 1.74s/it, bpd=5.69, l=5.36]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:11, 1.65s/it, bpd=4.96, l=4.67]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 33% 3/9 [00:04<00:09, 1.60s/it, bpd=5.4, l=5.08]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 44% 4/9 [00:06<00:07, 1.54s/it, bpd=4.1, l=3.86]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:05, 1.49s/it, bpd=4.93, l=4.64]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:08<00:04, 1.46s/it, bpd=5.08, l=4.78]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.46s/it, bpd=4.62, l=4.35]\n","Ema bpd: 5.0602 prime_loss: 0.0200 gen_loss: 5.0602 loss: 4.7630 epoch: 3.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (27).txt\n","/content/gdrive/MyDrive/slon/slon (17).txt\n","/content/gdrive/MyDrive/slon/slon (16).txt\n"," 1% 1/78 [00:05<06:49, 5.32s/it, bpd=5.56, g_l=5.56, gn=4.55, l=5.24, p_l=2.06e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 3% 2/78 [00:10<06:42, 5.29s/it, bpd=5.02, g_l=5.02, gn=4.99, l=4.73, 
p_l=2.1e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 4% 3/78 [00:15<06:36, 5.28s/it, bpd=5.38, g_l=5.38, gn=4.24, l=5.07, p_l=2.18e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 5% 4/78 [00:21<06:31, 5.29s/it, bpd=4.99, g_l=4.99, gn=3.33, l=4.69, p_l=2.19e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 6% 5/78 [00:26<06:26, 5.29s/it, bpd=5.47, g_l=5.47, gn=4.5, l=5.15, p_l=2.15e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 8% 6/78 [00:31<06:20, 5.29s/it, bpd=5.16, g_l=5.16, gn=3.99, l=4.85, p_l=2.19e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 9% 7/78 [00:37<06:18, 5.33s/it, bpd=4.68, g_l=4.68, gn=4.34, l=4.4, p_l=2.31e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 10% 8/78 [00:42<06:10, 5.30s/it, bpd=6.18, g_l=6.18, gn=6.88, l=5.81, p_l=2.43e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 12% 9/78 [00:47<06:04, 5.28s/it, bpd=5.97, g_l=5.97, gn=3.47, l=5.62, p_l=2.74e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 13% 10/78 [00:52<05:56, 5.25s/it, bpd=6.47, g_l=6.47, gn=4.66, l=6.09, p_l=3.15e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 14% 11/78 [00:57<05:49, 5.22s/it, bpd=4.95, g_l=4.95, gn=3.61, l=4.66, p_l=3.42e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 15% 12/78 [01:03<05:43, 5.21s/it, bpd=6.11, g_l=6.11, gn=5.53, l=5.75, p_l=3.6e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 17% 13/78 [01:08<05:36, 5.18s/it, bpd=5.78, g_l=5.78, gn=3.66, l=5.44, p_l=3.58e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 18% 14/78 [01:18<07:03, 6.62s/it, bpd=5.5, g_l=5.5, gn=3.71, l=5.18, p_l=3.51e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 19% 15/78 [01:23<06:28, 6.17s/it, bpd=6.31, g_l=6.31, gn=5.41, l=5.94, p_l=3.48e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 21% 16/78 [01:28<06:03, 5.86s/it, bpd=4.59, g_l=4.59, gn=4.73, l=4.32, p_l=3.56e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 22% 17/78 [01:33<05:44, 5.65s/it, bpd=5.06, g_l=5.06, gn=6.22, l=4.76, p_l=3.6e-6]/content/gdrive/MyDrive/slon/slon 
(12).txt\n"," 23% 18/78 [01:38<05:32, 5.53s/it, bpd=4.61, g_l=4.61, gn=5.22, l=4.34, p_l=3.62e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 24% 19/78 [01:44<05:21, 5.46s/it, bpd=5.52, g_l=5.52, gn=3.53, l=5.19, p_l=3.76e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 26% 20/78 [01:49<05:14, 5.42s/it, bpd=5.37, g_l=5.37, gn=4.17, l=5.05, p_l=3.76e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 27% 21/78 [01:54<05:06, 5.37s/it, bpd=4.93, g_l=4.93, gn=6.86, l=4.64, p_l=3.9e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 28% 22/78 [01:59<04:58, 5.33s/it, bpd=6.55, g_l=6.55, gn=3.96, l=6.17, p_l=4.19e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 29% 23/78 [02:05<04:51, 5.30s/it, bpd=5.75, g_l=5.75, gn=4.55, l=5.42, p_l=4.58e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 31% 24/78 [02:10<04:44, 5.26s/it, bpd=5.61, g_l=5.61, gn=3.87, l=5.28, p_l=5.28e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 32% 25/78 [02:15<04:38, 5.25s/it, bpd=6.01, g_l=6.01, gn=4.85, l=5.66, p_l=6.07e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 33% 26/78 [02:20<04:31, 5.22s/it, bpd=5.53, g_l=5.53, gn=4.07, l=5.2, p_l=6.76e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 35% 27/78 [02:25<04:25, 5.21s/it, bpd=5.54, g_l=5.54, gn=3.9, l=5.21, p_l=7.15e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 36% 28/78 [02:31<04:19, 5.19s/it, bpd=5.25, g_l=5.25, gn=3.78, l=4.94, p_l=7.75e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 37% 29/78 [02:36<04:13, 5.18s/it, bpd=5.36, g_l=5.36, gn=3.63, l=5.04, p_l=7.9e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 38% 30/78 [02:41<04:08, 5.17s/it, bpd=6, g_l=6, gn=7.02, l=5.65, p_l=7.23e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 40% 31/78 [02:46<04:02, 5.16s/it, bpd=5.62, g_l=5.62, gn=3.52, l=5.29, p_l=7.03e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 41% 32/78 [02:51<03:58, 5.18s/it, bpd=5.05, g_l=5.05, gn=4.16, l=4.76, p_l=6.83e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 42% 33/78 [02:56<03:52, 5.18s/it, 
bpd=5.95, g_l=5.95, gn=3.51, l=5.6, p_l=7.25e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 44% 34/78 [03:02<03:47, 5.17s/it, bpd=5.23, g_l=5.23, gn=4.74, l=4.92, p_l=7.78e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 45% 35/78 [03:07<03:42, 5.17s/it, bpd=4.77, g_l=4.77, gn=3.9, l=4.49, p_l=8.27e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 46% 36/78 [03:12<03:37, 5.17s/it, bpd=6.36, g_l=6.36, gn=3.54, l=5.98, p_l=8.83e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 47% 37/78 [03:17<03:32, 5.18s/it, bpd=5.09, g_l=5.09, gn=4.34, l=4.79, p_l=9.4e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 49% 38/78 [03:22<03:27, 5.19s/it, bpd=6.97, g_l=6.97, gn=4.56, l=6.56, p_l=9.64e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 50% 39/78 [03:28<03:22, 5.20s/it, bpd=4.78, g_l=4.78, gn=5.11, l=4.5, p_l=9.19e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 51% 40/78 [03:33<03:17, 5.20s/it, bpd=6.42, g_l=6.42, gn=3.14, l=6.04, p_l=8.47e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 53% 41/78 [03:38<03:12, 5.19s/it, bpd=4.89, g_l=4.89, gn=8.72, l=4.6, p_l=8.6e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 54% 42/78 [03:43<03:06, 5.19s/it, bpd=5.36, g_l=5.36, gn=4.31, l=5.05, p_l=9.32e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 55% 43/78 [03:48<03:01, 5.19s/it, bpd=6.76, g_l=6.76, gn=3.38, l=6.36, p_l=1.01e-5]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 56% 44/78 [03:54<02:56, 5.20s/it, bpd=5.35, g_l=5.35, gn=5.7, l=5.03, p_l=1.12e-5]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 58% 45/78 [03:59<02:51, 5.20s/it, bpd=6.37, g_l=6.37, gn=3.49, l=6, p_l=1.24e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 59% 46/78 [04:04<02:46, 5.20s/it, bpd=4.62, g_l=4.62, gn=3.76, l=4.34, p_l=1.34e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 60% 47/78 [04:09<02:41, 5.21s/it, bpd=5.93, g_l=5.93, gn=4.07, l=5.59, p_l=1.37e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 62% 48/78 [04:14<02:36, 5.21s/it, bpd=5.13, g_l=5.13, gn=4.93, l=4.83, 
p_l=1.28e-5]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 63% 49/78 [04:20<02:31, 5.21s/it, bpd=4.65, g_l=4.65, gn=4.65, l=4.38, p_l=1.21e-5]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 64% 50/78 [04:25<02:25, 5.21s/it, bpd=6.25, g_l=6.25, gn=3.84, l=5.88, p_l=1.16e-5]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 65% 51/78 [04:30<02:20, 5.22s/it, bpd=4.24, g_l=4.24, gn=3.99, l=3.99, p_l=1.06e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 67% 52/78 [04:35<02:15, 5.21s/it, bpd=5.26, g_l=5.26, gn=3.81, l=4.95, p_l=9.62e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 68% 53/78 [04:40<02:10, 5.21s/it, bpd=4.78, g_l=4.78, gn=4.28, l=4.5, p_l=9.32e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 69% 54/78 [04:46<02:04, 5.21s/it, bpd=5.15, g_l=5.15, gn=4.48, l=4.84, p_l=9.29e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 71% 55/78 [04:51<01:59, 5.20s/it, bpd=5.4, g_l=5.4, gn=3.78, l=5.08, p_l=9.6e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 72% 56/78 [04:56<01:54, 5.22s/it, bpd=4.85, g_l=4.85, gn=3.5, l=4.56, p_l=9.68e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 73% 57/78 [05:01<01:49, 5.21s/it, bpd=6.58, g_l=6.58, gn=3.89, l=6.19, p_l=9.89e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 74% 58/78 [05:07<01:44, 5.22s/it, bpd=4.99, g_l=4.99, gn=5.03, l=4.69, p_l=9.85e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 76% 59/78 [05:12<01:39, 5.22s/it, bpd=6.59, g_l=6.59, gn=3.09, l=6.2, p_l=1e-5]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 77% 60/78 [05:17<01:33, 5.21s/it, bpd=5.81, g_l=5.81, gn=4.2, l=5.46, p_l=9.83e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 78% 61/78 [05:22<01:28, 5.21s/it, bpd=5.18, g_l=5.18, gn=4.48, l=4.88, p_l=9.57e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 79% 62/78 [05:27<01:23, 5.20s/it, bpd=5.16, g_l=5.16, gn=5.03, l=4.86, p_l=9.47e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 81% 63/78 [05:33<01:18, 5.21s/it, bpd=4.02, g_l=4.02, gn=4.31, l=3.78, p_l=9.18e-6]/content/gdrive/MyDrive/slon/slon 
(11).txt\n"," 82% 64/78 [05:38<01:12, 5.21s/it, bpd=5.79, g_l=5.79, gn=3.63, l=5.45, p_l=9.06e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 83% 65/78 [05:43<01:07, 5.22s/it, bpd=5, g_l=5, gn=3.63, l=4.71, p_l=8.84e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 85% 66/78 [05:48<01:02, 5.21s/it, bpd=6.06, g_l=6.06, gn=3.34, l=5.7, p_l=8.91e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 86% 67/78 [05:53<00:57, 5.20s/it, bpd=5.15, g_l=5.15, gn=4.29, l=4.85, p_l=9.3e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 87% 68/78 [05:59<00:51, 5.20s/it, bpd=4.91, g_l=4.91, gn=3.45, l=4.62, p_l=9.28e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 88% 69/78 [06:04<00:46, 5.19s/it, bpd=4.38, g_l=4.38, gn=3.5, l=4.12, p_l=9.24e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 90% 70/78 [06:09<00:41, 5.20s/it, bpd=5.52, g_l=5.52, gn=3.77, l=5.19, p_l=8.92e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 91% 71/78 [06:14<00:36, 5.20s/it, bpd=5.25, g_l=5.25, gn=4.31, l=4.94, p_l=9.22e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 92% 72/78 [06:19<00:31, 5.20s/it, bpd=4.94, g_l=4.94, gn=3.11, l=4.65, p_l=9.41e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 94% 73/78 [06:25<00:25, 5.19s/it, bpd=5.84, g_l=5.84, gn=5.32, l=5.5, p_l=9.33e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 95% 74/78 [06:30<00:20, 5.19s/it, bpd=4.97, g_l=4.97, gn=3.88, l=4.67, p_l=8.8e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 96% 75/78 [06:35<00:15, 5.19s/it, bpd=3.72, g_l=3.72, gn=5.84, l=3.5, p_l=8.44e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n","100% 78/78 [06:51<00:00, 5.27s/it, bpd=4.78, g_l=4.78, gn=3.98, l=4.5, p_l=7.31e-6]\n","Train bpd: 5.4036 prime_loss: 0.0000 gen_loss: 5.4036 loss: 5.0857 gn: 4.3406 lr: 0.0003 lg_loss_scale: 13.6980 epoch: 4.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","Logging train 
inputs/ouputs\n","\u001b[35msteps:464\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.06s/it, bpd=5.78, l=5.44]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:13, 1.87s/it, bpd=5.2, l=4.9]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 33% 3/9 [00:04<00:10, 1.73s/it, bpd=4.87, l=4.59]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 44% 4/9 [00:06<00:08, 1.63s/it, bpd=5.21, l=4.9]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 56% 5/9 [00:07<00:06, 1.56s/it, bpd=5.83, l=5.49]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 67% 6/9 [00:09<00:04, 1.51s/it, bpd=5.5, l=5.18]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.49s/it, bpd=4.57, l=4.3]\n","Ema bpd: 5.2432 prime_loss: 0.0189 gen_loss: 5.2432 loss: 4.9352 epoch: 4.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (25).txt\n","/content/gdrive/MyDrive/slon/slon (26).txt\n","/content/gdrive/MyDrive/slon/slon (19).txt\n"," 1% 1/78 [00:05<06:53, 5.37s/it, bpd=5.27, g_l=5.27, gn=3.61, l=4.96, p_l=7.19e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 3% 2/78 [00:10<06:45, 5.33s/it, bpd=5.76, g_l=5.76, gn=4.21, l=5.42, p_l=6.91e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 4% 3/78 [00:15<06:38, 5.31s/it, bpd=6.42, g_l=6.42, gn=4.15, l=6.05, p_l=6.52e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 5% 4/78 [00:21<06:32, 5.30s/it, bpd=5.59, g_l=5.59, gn=4.36, l=5.26, p_l=6.49e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 6% 5/78 [00:26<06:26, 5.30s/it, bpd=6.41, g_l=6.41, gn=3.29, l=6.03, p_l=6.47e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 8% 6/78 [00:31<06:20, 5.29s/it, bpd=4.68, g_l=4.68, gn=3.74, l=4.41, p_l=6.51e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 9% 7/78 [00:37<06:15, 5.29s/it, bpd=5.43, g_l=5.43, gn=5.07, l=5.11, p_l=6.12e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 10% 8/78 [00:42<06:08, 5.27s/it, bpd=4.84, g_l=4.84, gn=4.75, l=4.55, p_l=5.6e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 12% 9/78 [00:47<06:03, 5.26s/it, bpd=5.26, 
g_l=5.26, gn=4.62, l=4.95, p_l=5.09e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 13% 10/78 [00:52<05:56, 5.24s/it, bpd=5.36, g_l=5.36, gn=4.9, l=5.05, p_l=4.63e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 14% 11/78 [00:57<05:48, 5.21s/it, bpd=5.16, g_l=5.16, gn=3.94, l=4.85, p_l=4.47e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 15% 12/78 [01:02<05:42, 5.19s/it, bpd=5.16, g_l=5.16, gn=3.81, l=4.86, p_l=4.41e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:477\u001b[0m\n"," 17% 13/78 [01:43<17:09, 15.84s/it, bpd=4.19, g_l=4.19, gn=4.87, l=3.94, p_l=4.66e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 18% 14/78 [01:49<13:32, 12.70s/it, bpd=4.43, g_l=4.43, gn=3.28, l=4.17, p_l=5.23e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 19% 15/78 [01:54<10:58, 10.46s/it, bpd=6.35, g_l=6.35, gn=3.95, l=5.98, p_l=5.68e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 21% 16/78 [01:59<09:12, 8.90s/it, bpd=6.43, g_l=6.43, gn=4.53, l=6.05, p_l=5.74e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 22% 17/78 [02:05<08:00, 7.88s/it, bpd=6.15, g_l=6.15, gn=3, l=5.79, p_l=5.77e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 23% 18/78 [02:10<07:09, 7.16s/it, bpd=4.97, g_l=4.97, gn=4.56, l=4.68, p_l=6.04e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 24% 19/78 [02:16<06:33, 6.68s/it, bpd=6.68, g_l=6.68, gn=3.38, l=6.29, p_l=6.47e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 26% 20/78 [02:21<06:05, 6.30s/it, bpd=6.44, g_l=6.44, gn=3.91, l=6.06, p_l=7.36e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 27% 21/78 [02:26<05:43, 6.03s/it, bpd=6.04, g_l=6.04, gn=3.61, l=5.69, p_l=8e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 28% 22/78 [02:32<05:25, 5.81s/it, bpd=5.91, g_l=5.91, gn=3.69, l=5.57, p_l=8.43e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 29% 23/78 [02:37<05:09, 5.63s/it, bpd=4.94, g_l=4.94, gn=3.64, l=4.65, p_l=8.77e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 31% 24/78 
[02:42<04:57, 5.51s/it, bpd=4.63, g_l=4.63, gn=4.02, l=4.36, p_l=8.97e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 32% 25/78 [02:47<04:45, 5.39s/it, bpd=6.3, g_l=6.3, gn=5.76, l=5.93, p_l=9.43e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 33% 26/78 [02:52<04:36, 5.32s/it, bpd=5.05, g_l=5.05, gn=6.35, l=4.75, p_l=1.01e-5]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 35% 27/78 [02:57<04:28, 5.26s/it, bpd=5.36, g_l=5.36, gn=3.95, l=5.05, p_l=1.08e-5]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 36% 28/78 [03:03<04:21, 5.23s/it, bpd=5.11, g_l=5.11, gn=4.06, l=4.81, p_l=1.12e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 37% 29/78 [03:08<04:14, 5.20s/it, bpd=5.4, g_l=5.4, gn=4.23, l=5.08, p_l=1.15e-5]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 38% 30/78 [03:13<04:08, 5.18s/it, bpd=5.34, g_l=5.34, gn=5.85, l=5.03, p_l=1.13e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 40% 31/78 [03:18<04:05, 5.22s/it, bpd=5.76, g_l=5.76, gn=3.82, l=5.42, p_l=1.1e-5]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 41% 32/78 [03:23<04:00, 5.22s/it, bpd=6.5, g_l=6.5, gn=4.05, l=6.12, p_l=1.1e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 42% 33/78 [03:29<03:56, 5.26s/it, bpd=4.31, g_l=4.31, gn=5.2, l=4.06, p_l=1.08e-5]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 44% 34/78 [03:34<03:51, 5.26s/it, bpd=5.38, g_l=5.38, gn=3.38, l=5.06, p_l=1.08e-5]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 45% 35/78 [03:39<03:47, 5.29s/it, bpd=5.08, g_l=5.08, gn=3.7, l=4.78, p_l=1.08e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 46% 36/78 [03:47<04:14, 6.05s/it, bpd=5.86, g_l=5.86, gn=5.29, l=5.52, p_l=1.05e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 47% 37/78 [03:53<03:59, 5.83s/it, bpd=4.93, g_l=4.93, gn=3.82, l=4.64, p_l=1.03e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 49% 38/78 [03:58<03:46, 5.66s/it, bpd=5.61, g_l=5.61, gn=4.23, l=5.28, p_l=9.74e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 50% 39/78 [04:03<03:35, 5.53s/it, bpd=5.11, g_l=5.11, 
gn=4.78, l=4.81, p_l=8.92e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 51% 40/78 [04:08<03:28, 5.48s/it, bpd=6.11, g_l=6.11, gn=3.44, l=5.75, p_l=7.79e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 53% 41/78 [04:14<03:19, 5.40s/it, bpd=4.76, g_l=4.76, gn=3.49, l=4.48, p_l=6.92e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 54% 42/78 [04:19<03:14, 5.39s/it, bpd=5.5, g_l=5.5, gn=3.62, l=5.17, p_l=6.29e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 55% 43/78 [04:24<03:07, 5.35s/it, bpd=4.08, g_l=4.08, gn=3.91, l=3.84, p_l=6.76e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 56% 44/78 [04:30<03:01, 5.32s/it, bpd=5.42, g_l=5.42, gn=4.07, l=5.11, p_l=7.59e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 58% 45/78 [04:35<02:54, 5.30s/it, bpd=4.88, g_l=4.88, gn=4.15, l=4.59, p_l=8.19e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 59% 46/78 [04:40<02:49, 5.28s/it, bpd=5.51, g_l=5.51, gn=3.56, l=5.18, p_l=8.48e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 60% 47/78 [04:45<02:43, 5.27s/it, bpd=6.72, g_l=6.72, gn=3.16, l=6.33, p_l=7.99e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 62% 48/78 [04:50<02:37, 5.25s/it, bpd=5.16, g_l=5.16, gn=3.97, l=4.86, p_l=7.3e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 63% 49/78 [04:56<02:32, 5.24s/it, bpd=6.77, g_l=6.77, gn=3.44, l=6.37, p_l=6.95e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 64% 50/78 [05:01<02:26, 5.23s/it, bpd=4.88, g_l=4.88, gn=3.58, l=4.6, p_l=6.65e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 65% 51/78 [05:06<02:21, 5.23s/it, bpd=6.01, g_l=6.01, gn=3.44, l=5.65, p_l=6.23e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 67% 52/78 [05:11<02:15, 5.22s/it, bpd=5.27, g_l=5.27, gn=3.8, l=4.96, p_l=5.72e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 68% 53/78 [05:16<02:10, 5.21s/it, bpd=4.75, g_l=4.75, gn=3.44, l=4.47, p_l=5.45e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 69% 54/78 [05:22<02:05, 5.21s/it, bpd=4.96, g_l=4.96, gn=3.57, l=4.66, 
p_l=5.06e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 71% 55/78 [05:27<01:59, 5.20s/it, bpd=4.86, g_l=4.86, gn=3.01, l=4.57, p_l=4.65e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 72% 56/78 [05:32<01:54, 5.21s/it, bpd=5.53, g_l=5.53, gn=3.15, l=5.21, p_l=4.27e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 73% 57/78 [05:37<01:49, 5.21s/it, bpd=4.62, g_l=4.62, gn=3.69, l=4.35, p_l=4.02e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 74% 58/78 [05:43<01:44, 5.21s/it, bpd=4.55, g_l=4.55, gn=4.38, l=4.28, p_l=3.73e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 76% 59/78 [05:48<01:38, 5.20s/it, bpd=5.86, g_l=5.86, gn=4.49, l=5.51, p_l=3.7e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 77% 60/78 [05:53<01:33, 5.20s/it, bpd=5.16, g_l=5.16, gn=3.39, l=4.86, p_l=3.82e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 78% 61/78 [05:58<01:28, 5.21s/it, bpd=5.56, g_l=5.56, gn=3.17, l=5.24, p_l=3.79e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 79% 62/78 [06:03<01:23, 5.20s/it, bpd=5.3, g_l=5.3, gn=3.5, l=4.99, p_l=3.87e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 81% 63/78 [06:09<01:18, 5.21s/it, bpd=5.07, g_l=5.07, gn=4.56, l=4.77, p_l=3.96e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 82% 64/78 [06:14<01:12, 5.20s/it, bpd=5.57, g_l=5.57, gn=4.23, l=5.25, p_l=4.26e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 83% 65/78 [06:19<01:07, 5.20s/it, bpd=4.69, g_l=4.69, gn=4.96, l=4.42, p_l=4.7e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 85% 66/78 [06:24<01:02, 5.19s/it, bpd=4.9, g_l=4.9, gn=4.42, l=4.62, p_l=5.11e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 86% 67/78 [06:29<00:57, 5.18s/it, bpd=5.3, g_l=5.3, gn=4.38, l=4.99, p_l=5.62e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 87% 68/78 [06:34<00:51, 5.20s/it, bpd=5.13, g_l=5.13, gn=3.63, l=4.83, p_l=6.29e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 88% 69/78 [06:40<00:46, 5.19s/it, bpd=6.82, g_l=6.82, gn=3.55, l=6.42, 
p_l=6.44e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 90% 70/78 [06:45<00:41, 5.20s/it, bpd=4.87, g_l=4.87, gn=3.74, l=4.58, p_l=5.81e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 91% 71/78 [06:50<00:36, 5.20s/it, bpd=4.79, g_l=4.79, gn=3.16, l=4.51, p_l=5.26e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 92% 72/78 [06:55<00:31, 5.19s/it, bpd=5.17, g_l=5.17, gn=4.67, l=4.87, p_l=4.92e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 94% 73/78 [07:00<00:25, 5.19s/it, bpd=5.07, g_l=5.07, gn=4.13, l=4.77, p_l=4.99e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 95% 74/78 [07:06<00:20, 5.19s/it, bpd=5.59, g_l=5.59, gn=3.95, l=5.26, p_l=5.27e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 96% 75/78 [07:11<00:15, 5.20s/it, bpd=5.12, g_l=5.12, gn=3.3, l=4.82, p_l=5.97e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n","100% 78/78 [07:27<00:00, 5.73s/it, bpd=6.83, g_l=6.83, gn=3.41, l=6.43, p_l=8.52e-6]\n","Train bpd: 5.4053 prime_loss: 0.0000 gen_loss: 5.4053 loss: 5.0873 gn: 4.0194 lr: 0.0003 lg_loss_scale: 14.0100 epoch: 5.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:542\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.00s/it, bpd=5.06, l=4.76]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:13, 1.88s/it, bpd=5.02, l=4.73]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 33% 3/9 [00:05<00:10, 1.74s/it, bpd=5.69, l=5.36]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 4/9 [00:06<00:08, 1.64s/it, bpd=4.3, l=4.05]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 56% 5/9 [00:07<00:06, 1.56s/it, bpd=4.96, l=4.67]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 67% 6/9 [00:09<00:04, 1.51s/it, bpd=4.88, l=4.6]/content/gdrive/MyDrive/slon/slon (6).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=5.15, l=4.85]\n","Ema bpd: 5.0150 prime_loss: 0.0183 gen_loss: 5.0150 loss: 4.7205 epoch: 5.0000\n"," 
0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (17).txt\n","/content/gdrive/MyDrive/slon/slon (3).txt\n","/content/gdrive/MyDrive/slon/slon (16).txt\n"," 1% 1/78 [00:05<07:02, 5.49s/it, bpd=4.72, g_l=4.72, gn=3.49, l=4.44, p_l=9.5e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 3% 2/78 [00:10<06:50, 5.41s/it, bpd=5.79, g_l=5.79, gn=3.48, l=5.45, p_l=9.13e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 4% 3/78 [00:15<06:42, 5.36s/it, bpd=5.27, g_l=5.27, gn=3.41, l=4.96, p_l=8.55e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 5% 4/78 [00:21<06:36, 5.35s/it, bpd=5.51, g_l=5.51, gn=3.17, l=5.18, p_l=8.13e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 6% 5/78 [00:26<06:30, 5.35s/it, bpd=4.9, g_l=4.9, gn=3.4, l=4.61, p_l=8.05e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 8% 6/78 [00:31<06:24, 5.33s/it, bpd=5.94, g_l=5.94, gn=4.71, l=5.59, p_l=8.26e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 9% 7/78 [00:37<06:17, 5.32s/it, bpd=4.8, g_l=4.8, gn=4.47, l=4.52, p_l=8.73e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 10% 8/78 [00:42<06:10, 5.30s/it, bpd=6.57, g_l=6.57, gn=3.97, l=6.18, p_l=9.74e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 12% 9/78 [00:47<06:04, 5.28s/it, bpd=5.38, g_l=5.38, gn=4.6, l=5.06, p_l=1.07e-5]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 13% 10/78 [00:52<05:56, 5.25s/it, bpd=5.38, g_l=5.38, gn=5.45, l=5.06, p_l=1.12e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 14% 11/78 [00:58<05:49, 5.22s/it, bpd=5.52, g_l=5.52, gn=4.44, l=5.19, p_l=1.18e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 15% 12/78 [01:03<05:43, 5.20s/it, bpd=4.66, g_l=4.66, gn=3.74, l=4.39, p_l=1.14e-5]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 17% 13/78 [01:08<05:36, 5.18s/it, bpd=6.13, g_l=6.13, gn=3.43, l=5.77, p_l=1.08e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 18% 14/78 [01:13<05:31, 5.17s/it, bpd=5.1, g_l=5.1, gn=3.62, l=4.8, p_l=1.05e-5]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 19% 15/78 [01:18<05:25, 
5.17s/it, bpd=4.7, g_l=4.7, gn=3.35, l=4.42, p_l=1.05e-5]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 21% 16/78 [01:23<05:20, 5.17s/it, bpd=4.98, g_l=4.98, gn=4.11, l=4.69, p_l=9.89e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 22% 17/78 [01:28<05:15, 5.17s/it, bpd=6.48, g_l=6.48, gn=3.26, l=6.1, p_l=9.86e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 23% 18/78 [01:34<05:10, 5.17s/it, bpd=5.46, g_l=5.46, gn=3.15, l=5.14, p_l=9.15e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 24% 19/78 [01:39<05:06, 5.20s/it, bpd=5.58, g_l=5.58, gn=3.8, l=5.25, p_l=8.95e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 26% 20/78 [01:44<05:01, 5.20s/it, bpd=5.04, g_l=5.04, gn=4, l=4.75, p_l=8.78e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 27% 21/78 [01:49<04:56, 5.21s/it, bpd=3.91, g_l=3.91, gn=4.4, l=3.68, p_l=8.66e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 28% 22/78 [01:55<04:51, 5.21s/it, bpd=4.62, g_l=4.62, gn=3.78, l=4.35, p_l=8.68e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 29% 23/78 [02:00<04:46, 5.21s/it, bpd=5.75, g_l=5.75, gn=4, l=5.41, p_l=8.61e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 31% 24/78 [02:05<04:40, 5.20s/it, bpd=4.41, g_l=4.41, gn=3.88, l=4.15, p_l=8.65e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 32% 25/78 [02:10<04:35, 5.20s/it, bpd=5.66, g_l=5.66, gn=7.46, l=5.33, p_l=9.18e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 33% 26/78 [02:15<04:30, 5.21s/it, bpd=4.81, g_l=4.81, gn=4.18, l=4.53, p_l=9.34e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 35% 27/78 [02:21<04:25, 5.20s/it, bpd=4.52, g_l=4.52, gn=6.08, l=4.26, p_l=9.26e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 36% 28/78 [02:26<04:20, 5.20s/it, bpd=4.43, g_l=4.43, gn=4.19, l=4.17, p_l=8.96e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 37% 29/78 [02:31<04:14, 5.20s/it, bpd=5.19, g_l=5.19, gn=3.96, l=4.89, p_l=8.15e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 38% 30/78 [02:36<04:09, 5.19s/it, bpd=5.2, g_l=5.2, gn=4.18, l=4.89, 
p_l=7.69e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 40% 31/78 [02:41<04:03, 5.18s/it, bpd=4.7, g_l=4.7, gn=3.36, l=4.42, p_l=7.41e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 41% 32/78 [02:46<03:58, 5.18s/it, bpd=5.24, g_l=5.24, gn=3.91, l=4.93, p_l=7.41e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 42% 33/78 [02:52<03:53, 5.18s/it, bpd=3.76, g_l=3.76, gn=5.22, l=3.54, p_l=7.39e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 44% 34/78 [02:57<03:48, 5.19s/it, bpd=4.89, g_l=4.89, gn=5.16, l=4.6, p_l=7.33e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 45% 35/78 [03:02<03:43, 5.19s/it, bpd=5.22, g_l=5.22, gn=3.6, l=4.91, p_l=7.12e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 46% 36/78 [03:07<03:37, 5.19s/it, bpd=5.11, g_l=5.11, gn=3.28, l=4.81, p_l=7.43e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 47% 37/78 [03:12<03:32, 5.18s/it, bpd=6.45, g_l=6.45, gn=3.41, l=6.07, p_l=7.83e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 49% 38/78 [03:18<03:27, 5.18s/it, bpd=7.36, g_l=7.36, gn=3.12, l=6.93, p_l=8.02e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 50% 39/78 [03:23<03:21, 5.17s/it, bpd=5.22, g_l=5.22, gn=3.66, l=4.91, p_l=8.06e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 51% 40/78 [03:28<03:17, 5.19s/it, bpd=5.52, g_l=5.52, gn=3.52, l=5.2, p_l=8.14e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 53% 41/78 [03:33<03:11, 5.18s/it, bpd=5.45, g_l=5.45, gn=3.2, l=5.13, p_l=8.05e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 54% 42/78 [03:38<03:07, 5.19s/it, bpd=5.19, g_l=5.19, gn=4.98, l=4.88, p_l=8.8e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 55% 43/78 [03:44<03:01, 5.19s/it, bpd=5.52, g_l=5.52, gn=3.29, l=5.19, p_l=1.03e-5]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 56% 44/78 [03:49<02:56, 5.19s/it, bpd=3.97, g_l=3.97, gn=4.02, l=3.74, p_l=1.33e-5]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 58% 45/78 [03:54<02:51, 5.19s/it, bpd=5.75, g_l=5.75, gn=4.59, l=5.41, 
p_l=1.7e-5]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 59% 46/78 [03:59<02:45, 5.19s/it, bpd=6.35, g_l=6.35, gn=4.5, l=5.97, p_l=2.21e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 60% 47/78 [04:04<02:41, 5.20s/it, bpd=5.53, g_l=5.53, gn=3.57, l=5.21, p_l=2.71e-5]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 62% 48/78 [04:09<02:35, 5.19s/it, bpd=4.62, g_l=4.62, gn=6.22, l=4.35, p_l=3.05e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 63% 49/78 [04:15<02:30, 5.20s/it, bpd=6.57, g_l=6.57, gn=4.01, l=6.18, p_l=3.31e-5]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 64% 50/78 [04:20<02:25, 5.20s/it, bpd=6.37, g_l=6.37, gn=4.28, l=6, p_l=3.24e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 65% 51/78 [04:25<02:20, 5.19s/it, bpd=4.92, g_l=4.92, gn=3.86, l=4.63, p_l=3.01e-5]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 67% 52/78 [04:30<02:15, 5.20s/it, bpd=4.93, g_l=4.93, gn=3.61, l=4.64, p_l=2.83e-5]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 68% 53/78 [04:35<02:09, 5.19s/it, bpd=5.03, g_l=5.03, gn=3.57, l=4.73, p_l=2.59e-5]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 69% 54/78 [04:41<02:04, 5.20s/it, bpd=4.65, g_l=4.65, gn=3.48, l=4.38, p_l=2.42e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 71% 55/78 [04:46<01:59, 5.20s/it, bpd=5.25, g_l=5.25, gn=3.51, l=4.94, p_l=2.33e-5]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 72% 56/78 [04:51<01:54, 5.20s/it, bpd=5, g_l=5, gn=5.08, l=4.71, p_l=2.31e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 73% 57/78 [04:56<01:49, 5.20s/it, bpd=5.01, g_l=5.01, gn=4.7, l=4.72, p_l=2.21e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 74% 58/78 [05:07<02:14, 6.73s/it, bpd=5.74, g_l=5.74, gn=4.34, l=5.4, p_l=2.21e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 76% 59/78 [05:12<01:58, 6.24s/it, bpd=4.98, g_l=4.98, gn=4.3, l=4.68, p_l=2.25e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 77% 60/78 [05:17<01:46, 5.93s/it, bpd=4.68, g_l=4.68, gn=3.66, l=4.41, p_l=2.41e-5]/content/gdrive/MyDrive/slon/slon 
(17).txt\n"," 78% 61/78 [05:22<01:36, 5.71s/it, bpd=5.13, g_l=5.13, gn=4.1, l=4.83, p_l=2.52e-5]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 79% 62/78 [05:27<01:28, 5.56s/it, bpd=4.64, g_l=4.64, gn=3.35, l=4.37, p_l=2.45e-5]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 81% 63/78 [05:33<01:21, 5.47s/it, bpd=4.81, g_l=4.81, gn=4.62, l=4.53, p_l=2.33e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 82% 64/78 [05:38<01:15, 5.40s/it, bpd=4.73, g_l=4.73, gn=4.64, l=4.45, p_l=2.49e-5]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 83% 65/78 [05:43<01:09, 5.36s/it, bpd=4.23, g_l=4.23, gn=4.93, l=3.98, p_l=2.81e-5]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 85% 66/78 [05:48<01:03, 5.32s/it, bpd=4.45, g_l=4.45, gn=4.73, l=4.19, p_l=3.25e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 86% 67/78 [05:53<00:58, 5.30s/it, bpd=5.64, g_l=5.64, gn=4.08, l=5.31, p_l=3.56e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 87% 68/78 [05:59<00:52, 5.27s/it, bpd=5.68, g_l=5.68, gn=7.82, l=5.34, p_l=3.86e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 88% 69/78 [06:04<00:47, 5.24s/it, bpd=5.01, g_l=5.01, gn=4.49, l=4.72, p_l=4.13e-5]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 90% 70/78 [06:09<00:41, 5.22s/it, bpd=4.42, g_l=4.42, gn=4.43, l=4.16, p_l=4.22e-5]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 91% 71/78 [06:14<00:36, 5.20s/it, bpd=5.28, g_l=5.28, gn=3.53, l=4.97, p_l=4.33e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 92% 72/78 [06:19<00:31, 5.20s/it, bpd=6.59, g_l=6.59, gn=4.29, l=6.21, p_l=3.98e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 94% 73/78 [06:25<00:25, 5.19s/it, bpd=5.87, g_l=5.87, gn=3.99, l=5.52, p_l=3.88e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 95% 74/78 [06:30<00:20, 5.19s/it, bpd=6.66, g_l=6.66, gn=3.16, l=6.27, p_l=4e-5]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 96% 75/78 [06:35<00:15, 5.18s/it, bpd=4.48, g_l=4.48, gn=4.47, l=4.22, p_l=4.46e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n","100% 78/78 [06:51<00:00, 
5.27s/it, bpd=5.82, g_l=5.82, gn=3.34, l=5.48, p_l=4.32e-5]\n","Train bpd: 5.2512 prime_loss: 0.0000 gen_loss: 5.2512 loss: 4.9423 gn: 4.1350 lr: 0.0003 lg_loss_scale: 14.3220 epoch: 6.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (6).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:620\u001b[0m\n"," 11% 1/9 [00:01<00:15, 1.90s/it, bpd=4.94, l=4.65]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 22% 2/9 [00:03<00:12, 1.78s/it, bpd=5.4, l=5.08]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 33% 3/9 [00:04<00:10, 1.72s/it, bpd=5, l=4.71]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 44% 4/9 [00:06<00:08, 1.63s/it, bpd=5.32, l=5.01]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.56s/it, bpd=5.43, l=5.11]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.51s/it, bpd=4.25, l=4]/content/gdrive/MyDrive/slon/slon (6).txt\n","100% 9/9 [00:13<00:00, 1.51s/it, bpd=4.91, l=4.62]\n","Ema bpd: 5.1065 prime_loss: 0.0179 gen_loss: 5.1065 loss: 4.8066 epoch: 6.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (22).txt\n","/content/gdrive/MyDrive/slon/slon (33).txt\n","/content/gdrive/MyDrive/slon/slon (17).txt\n"," 1% 1/78 [00:05<06:51, 5.34s/it, bpd=4.16, g_l=4.16, gn=4.26, l=3.92, p_l=3.79e-5]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 3% 2/78 [00:10<06:43, 5.31s/it, bpd=5.21, g_l=5.21, gn=3.3, l=4.91, p_l=3.17e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 4% 3/78 [00:15<06:36, 5.29s/it, bpd=4.89, g_l=4.89, gn=3.71, l=4.6, p_l=2.71e-5]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 5% 4/78 [00:21<06:31, 5.30s/it, bpd=4.84, g_l=4.84, gn=4.08, l=4.55, p_l=2.37e-5]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 6% 5/78 [00:26<06:26, 5.29s/it, bpd=6.48, g_l=6.48, gn=3.61, l=6.1, p_l=2.18e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 8% 6/78 [00:31<06:20, 5.29s/it, bpd=6.13, g_l=6.13, gn=3.5, l=5.77, 
p_l=1.92e-5]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 9% 7/78 [00:36<06:13, 5.27s/it, bpd=5.69, g_l=5.69, gn=4.17, l=5.36, p_l=1.67e-5]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 10% 8/78 [00:42<06:06, 5.24s/it, bpd=5.27, g_l=5.27, gn=3.58, l=4.96, p_l=1.43e-5]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 12% 9/78 [00:47<06:00, 5.23s/it, bpd=5.86, g_l=5.86, gn=3.39, l=5.51, p_l=1.16e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 13% 10/78 [00:52<05:54, 5.21s/it, bpd=5.05, g_l=5.05, gn=3.42, l=4.75, p_l=9.54e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 14% 11/78 [00:57<05:48, 5.20s/it, bpd=5.69, g_l=5.69, gn=4.25, l=5.36, p_l=7.75e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 15% 12/78 [01:02<05:42, 5.19s/it, bpd=4.65, g_l=4.65, gn=4.09, l=4.38, p_l=6.76e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 17% 13/78 [01:07<05:36, 5.18s/it, bpd=6.26, g_l=6.26, gn=3.58, l=5.89, p_l=6.23e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 18% 14/78 [01:13<05:31, 5.17s/it, bpd=5.9, g_l=5.9, gn=3.78, l=5.55, p_l=5.73e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 19% 15/78 [01:18<05:25, 5.17s/it, bpd=3.93, g_l=3.93, gn=3.72, l=3.7, p_l=5.15e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 21% 16/78 [01:23<05:21, 5.18s/it, bpd=6.77, g_l=6.77, gn=3.72, l=6.37, p_l=4.87e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 22% 17/78 [01:28<05:16, 5.18s/it, bpd=5.64, g_l=5.64, gn=3.18, l=5.3, p_l=5e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 23% 18/78 [01:33<05:11, 5.20s/it, bpd=4.84, g_l=4.84, gn=3.66, l=4.55, p_l=5.05e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 24% 19/78 [01:39<05:06, 5.20s/it, bpd=5.73, g_l=5.73, gn=3.17, l=5.39, p_l=5.11e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 26% 20/78 [01:44<05:01, 5.20s/it, bpd=4.78, g_l=4.78, gn=3.09, l=4.5, p_l=5.12e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 27% 21/78 [01:49<04:56, 5.20s/it, bpd=4.09, g_l=4.09, gn=3.36, l=3.85, p_l=5.22e-6]/content/gdrive/MyDrive/slon/slon 
(35).txt\n"," 28% 22/78 [01:54<04:51, 5.20s/it, bpd=5.04, g_l=5.04, gn=3.97, l=4.74, p_l=5.3e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 29% 23/78 [01:59<04:46, 5.21s/it, bpd=4.96, g_l=4.96, gn=4.17, l=4.67, p_l=4.9e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 31% 24/78 [02:05<04:41, 5.21s/it, bpd=5.75, g_l=5.75, gn=3.23, l=5.41, p_l=4.54e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 32% 25/78 [02:10<04:36, 5.22s/it, bpd=5.29, g_l=5.29, gn=3.74, l=4.98, p_l=4.06e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 33% 26/78 [02:15<04:31, 5.21s/it, bpd=4.94, g_l=4.94, gn=4.52, l=4.65, p_l=3.56e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 35% 27/78 [02:20<04:25, 5.21s/it, bpd=5.93, g_l=5.93, gn=3.71, l=5.58, p_l=3.3e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 36% 28/78 [02:25<04:20, 5.20s/it, bpd=5.23, g_l=5.23, gn=3.94, l=4.92, p_l=3.26e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 37% 29/78 [02:31<04:15, 5.21s/it, bpd=4.64, g_l=4.64, gn=3.07, l=4.37, p_l=3.51e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 38% 30/78 [02:36<04:10, 5.21s/it, bpd=4.82, g_l=4.82, gn=3.83, l=4.54, p_l=3.91e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 40% 31/78 [02:41<04:04, 5.20s/it, bpd=4.71, g_l=4.71, gn=3.39, l=4.43, p_l=4.1e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 41% 32/78 [02:46<03:59, 5.20s/it, bpd=5.2, g_l=5.2, gn=3.9, l=4.9, p_l=4.19e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 42% 33/78 [02:51<03:53, 5.19s/it, bpd=5.54, g_l=5.54, gn=4.57, l=5.21, p_l=4.2e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 44% 34/78 [02:57<03:47, 5.18s/it, bpd=5.34, g_l=5.34, gn=3.66, l=5.03, p_l=4.12e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 45% 35/78 [03:02<03:42, 5.17s/it, bpd=6.55, g_l=6.55, gn=3.69, l=6.16, p_l=3.91e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 46% 36/78 [03:07<03:36, 5.17s/it, bpd=5.73, g_l=5.73, gn=7.57, l=5.39, p_l=3.58e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 47% 37/78 [03:12<03:32, 
5.17s/it, bpd=5.5, g_l=5.5, gn=4.17, l=5.18, p_l=3.51e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 49% 38/78 [03:17<03:26, 5.17s/it, bpd=4.91, g_l=4.91, gn=4.96, l=4.62, p_l=3.41e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 50% 39/78 [03:23<03:22, 5.18s/it, bpd=4.5, g_l=4.5, gn=3.77, l=4.23, p_l=3.58e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 51% 40/78 [03:28<03:16, 5.18s/it, bpd=5.11, g_l=5.11, gn=3.94, l=4.81, p_l=3.89e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 53% 41/78 [03:33<03:11, 5.18s/it, bpd=6.08, g_l=6.08, gn=4.16, l=5.72, p_l=4.54e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 54% 42/78 [03:38<03:06, 5.18s/it, bpd=5.29, g_l=5.29, gn=4.6, l=4.98, p_l=5.05e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 55% 43/78 [03:43<03:01, 5.19s/it, bpd=4.72, g_l=4.72, gn=3.98, l=4.44, p_l=5.54e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 56% 44/78 [03:48<02:56, 5.19s/it, bpd=5.02, g_l=5.02, gn=3.89, l=4.72, p_l=5.72e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 58% 45/78 [03:54<02:51, 5.19s/it, bpd=5.14, g_l=5.14, gn=4.16, l=4.84, p_l=5.9e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 59% 46/78 [03:59<02:46, 5.21s/it, bpd=5.29, g_l=5.29, gn=3.73, l=4.98, p_l=6.26e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 60% 47/78 [04:04<02:41, 5.20s/it, bpd=5.93, g_l=5.93, gn=4.59, l=5.58, p_l=6.56e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 62% 48/78 [04:09<02:35, 5.20s/it, bpd=4.71, g_l=4.71, gn=4.07, l=4.44, p_l=6.58e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 63% 49/78 [04:14<02:30, 5.19s/it, bpd=5.31, g_l=5.31, gn=4.76, l=5, p_l=6.79e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 64% 50/78 [04:20<02:25, 5.19s/it, bpd=5.33, g_l=5.33, gn=3.86, l=5.01, p_l=7.03e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 65% 51/78 [04:25<02:20, 5.20s/it, bpd=5.72, g_l=5.72, gn=3.41, l=5.38, p_l=7.41e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 67% 52/78 [04:30<02:15, 5.20s/it, bpd=5.93, g_l=5.93, gn=3.13, 
l=5.58, p_l=7.94e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 68% 53/78 [04:35<02:10, 5.21s/it, bpd=5.04, g_l=5.04, gn=5.81, l=4.74, p_l=8.59e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 69% 54/78 [04:40<02:05, 5.21s/it, bpd=4.94, g_l=4.94, gn=4.06, l=4.65, p_l=9.11e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 71% 55/78 [04:46<01:59, 5.21s/it, bpd=5.79, g_l=5.79, gn=3.48, l=5.45, p_l=9.51e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 72% 56/78 [04:51<01:54, 5.21s/it, bpd=4.5, g_l=4.5, gn=4.63, l=4.24, p_l=9.6e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 73% 57/78 [04:56<01:49, 5.20s/it, bpd=6.03, g_l=6.03, gn=3.61, l=5.68, p_l=9.63e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 74% 58/78 [05:01<01:44, 5.21s/it, bpd=5.22, g_l=5.22, gn=3.46, l=4.91, p_l=1.02e-5]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 76% 59/78 [05:07<01:38, 5.21s/it, bpd=5.02, g_l=5.02, gn=3.88, l=4.73, p_l=1.07e-5]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 77% 60/78 [05:12<01:33, 5.21s/it, bpd=3.65, g_l=3.65, gn=4.78, l=3.44, p_l=1.16e-5]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 78% 61/78 [05:17<01:28, 5.21s/it, bpd=4.1, g_l=4.1, gn=3.65, l=3.86, p_l=1.25e-5]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 79% 62/78 [05:22<01:23, 5.20s/it, bpd=6.57, g_l=6.57, gn=4.71, l=6.18, p_l=1.23e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 81% 63/78 [05:27<01:18, 5.20s/it, bpd=4.81, g_l=4.81, gn=4.31, l=4.52, p_l=1.19e-5]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 82% 64/78 [05:32<01:12, 5.19s/it, bpd=6.99, g_l=6.99, gn=3.48, l=6.58, p_l=1.06e-5]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 83% 65/78 [05:38<01:07, 5.20s/it, bpd=4.71, g_l=4.71, gn=3.89, l=4.44, p_l=9.74e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 85% 66/78 [05:43<01:02, 5.19s/it, bpd=4.83, g_l=4.83, gn=6, l=4.55, p_l=9.49e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 86% 67/78 [05:48<00:57, 5.19s/it, bpd=5.39, g_l=5.39, gn=3.79, l=5.08, 
p_l=9.44e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 87% 68/78 [05:53<00:51, 5.18s/it, bpd=4.71, g_l=4.71, gn=3.15, l=4.44, p_l=9.63e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 88% 69/78 [05:58<00:46, 5.18s/it, bpd=5.37, g_l=5.37, gn=3.6, l=5.05, p_l=9.65e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 90% 70/78 [06:04<00:41, 5.19s/it, bpd=4.46, g_l=4.46, gn=3.68, l=4.19, p_l=9.79e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 91% 71/78 [06:09<00:36, 5.19s/it, bpd=6.23, g_l=6.23, gn=2.98, l=5.87, p_l=1.07e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 92% 72/78 [06:14<00:31, 5.20s/it, bpd=4.22, g_l=4.22, gn=3.8, l=3.97, p_l=1.17e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 94% 73/78 [06:19<00:26, 5.20s/it, bpd=4.67, g_l=4.67, gn=3.91, l=4.39, p_l=1.33e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 95% 74/78 [06:24<00:20, 5.20s/it, bpd=4.75, g_l=4.75, gn=3.86, l=4.47, p_l=1.52e-5]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 96% 75/78 [06:30<00:15, 5.19s/it, bpd=5.45, g_l=5.45, gn=3.8, l=5.13, p_l=1.68e-5]/content/gdrive/MyDrive/slon/slon (12).txt\n","100% 78/78 [06:45<00:00, 5.20s/it, bpd=5.06, g_l=5.06, gn=3.38, l=4.76, p_l=1.77e-5]\n","Train bpd: 5.2482 prime_loss: 0.0000 gen_loss: 5.2482 loss: 4.9395 gn: 3.9364 lr: 0.0003 lg_loss_scale: 14.6340 epoch: 7.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:698\u001b[0m\n"," 11% 1/9 [00:01<00:15, 1.89s/it, bpd=4.99, l=4.7]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 22% 2/9 [00:03<00:12, 1.79s/it, bpd=5.18, l=4.88]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:04<00:10, 1.67s/it, bpd=4.91, l=4.62]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 44% 4/9 [00:06<00:07, 1.59s/it, bpd=5.35, l=5.03]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.53s/it, bpd=4.76, 
l=4.48]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.49s/it, bpd=5.17, l=4.86]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.49s/it, bpd=5.88, l=5.54]\n","Ema bpd: 5.1673 prime_loss: 0.0179 gen_loss: 5.1673 loss: 4.8638 epoch: 7.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (11).txt\n","/content/gdrive/MyDrive/slon/slon (4).txt\n","/content/gdrive/MyDrive/slon/slon (28).txt\n"," 1% 1/78 [00:05<06:53, 5.37s/it, bpd=4.55, g_l=4.55, gn=4.13, l=4.28, p_l=1.7e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 3% 2/78 [00:15<08:40, 6.85s/it, bpd=5.03, g_l=5.03, gn=4.33, l=4.74, p_l=1.59e-5]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 4% 3/78 [00:20<07:57, 6.37s/it, bpd=3.86, g_l=3.86, gn=3.56, l=3.63, p_l=1.61e-5]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 5% 4/78 [00:26<07:26, 6.04s/it, bpd=5, g_l=5, gn=4.01, l=4.71, p_l=1.63e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 6% 5/78 [00:31<07:04, 5.82s/it, bpd=4.77, g_l=4.77, gn=3.95, l=4.49, p_l=1.63e-5]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 8% 6/78 [00:36<06:47, 5.66s/it, bpd=5.84, g_l=5.84, gn=6.02, l=5.5, p_l=1.6e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 9% 7/78 [00:42<06:33, 5.54s/it, bpd=4.79, g_l=4.79, gn=3.95, l=4.51, p_l=1.57e-5]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 10% 8/78 [00:47<06:22, 5.47s/it, bpd=4.66, g_l=4.66, gn=5.68, l=4.38, p_l=1.5e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 12% 9/78 [00:52<06:12, 5.39s/it, bpd=4.85, g_l=4.85, gn=3.76, l=4.56, p_l=1.39e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 13% 10/78 [00:57<06:03, 5.35s/it, bpd=5.77, g_l=5.77, gn=7.14, l=5.43, p_l=1.19e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 14% 11/78 [01:03<05:55, 5.31s/it, bpd=5.96, g_l=5.96, gn=3.44, l=5.61, p_l=1.01e-5]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 15% 12/78 [01:08<05:47, 5.27s/it, bpd=5.04, g_l=5.04, gn=3.81, l=4.74, p_l=8.25e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 17% 
13/78 [01:13<05:40, 5.24s/it, bpd=5.63, g_l=5.63, gn=4.27, l=5.3, p_l=6.75e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 18% 14/78 [01:18<05:32, 5.20s/it, bpd=6.23, g_l=6.23, gn=3.66, l=5.86, p_l=5.63e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 19% 15/78 [01:23<05:26, 5.19s/it, bpd=5.48, g_l=5.48, gn=4.08, l=5.16, p_l=4.96e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 21% 16/78 [01:28<05:20, 5.17s/it, bpd=5.43, g_l=5.43, gn=3.45, l=5.11, p_l=4.67e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:715\u001b[0m\n"," 22% 17/78 [02:07<15:21, 15.11s/it, bpd=4.71, g_l=4.71, gn=3.73, l=4.43, p_l=4.38e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 23% 18/78 [02:12<12:10, 12.18s/it, bpd=5.25, g_l=5.25, gn=3.33, l=4.94, p_l=4.54e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 24% 19/78 [02:17<09:55, 10.10s/it, bpd=4.79, g_l=4.79, gn=3.35, l=4.51, p_l=4.48e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 26% 20/78 [02:23<08:24, 8.70s/it, bpd=4.78, g_l=4.78, gn=3.51, l=4.5, p_l=4.33e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 27% 21/78 [02:28<07:19, 7.72s/it, bpd=4.75, g_l=4.75, gn=4.61, l=4.47, p_l=4.15e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 28% 22/78 [02:34<06:35, 7.07s/it, bpd=4.57, g_l=4.57, gn=3.22, l=4.3, p_l=4.09e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 29% 23/78 [02:39<06:02, 6.59s/it, bpd=4.38, g_l=4.38, gn=3.94, l=4.12, p_l=3.92e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 31% 24/78 [02:44<05:36, 6.24s/it, bpd=6.53, g_l=6.53, gn=3.14, l=6.15, p_l=3.84e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 32% 25/78 [02:50<05:16, 5.98s/it, bpd=5.37, g_l=5.37, gn=3.65, l=5.06, p_l=3.88e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 33% 26/78 [02:55<04:59, 5.76s/it, bpd=4.72, g_l=4.72, gn=3.62, l=4.44, p_l=3.99e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 35% 27/78 [03:00<04:47, 5.63s/it, bpd=6.4, g_l=6.4, gn=4.18, l=6.03, 
p_l=4.37e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 36% 28/78 [03:06<04:34, 5.48s/it, bpd=5.11, g_l=5.11, gn=3.84, l=4.81, p_l=4.76e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 37% 29/78 [03:11<04:24, 5.40s/it, bpd=6.41, g_l=6.41, gn=6.97, l=6.04, p_l=5.13e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 38% 30/78 [03:16<04:14, 5.31s/it, bpd=4.71, g_l=4.71, gn=4.13, l=4.43, p_l=5.61e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 40% 31/78 [03:21<04:06, 5.25s/it, bpd=4.79, g_l=4.79, gn=3.79, l=4.51, p_l=6.05e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 41% 32/78 [03:26<04:00, 5.23s/it, bpd=5.01, g_l=5.01, gn=6.41, l=4.71, p_l=6.57e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 42% 33/78 [03:31<03:53, 5.20s/it, bpd=4.59, g_l=4.59, gn=4.46, l=4.32, p_l=6.87e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 44% 34/78 [03:37<03:50, 5.23s/it, bpd=4.69, g_l=4.69, gn=3.51, l=4.42, p_l=7.22e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 45% 35/78 [03:42<03:44, 5.23s/it, bpd=4.93, g_l=4.93, gn=4.95, l=4.64, p_l=7.93e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 46% 36/78 [03:47<03:40, 5.26s/it, bpd=5.26, g_l=5.26, gn=3.41, l=4.95, p_l=9.04e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 47% 37/78 [03:52<03:35, 5.26s/it, bpd=5.32, g_l=5.32, gn=4.37, l=5.01, p_l=9.75e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 49% 38/78 [03:58<03:30, 5.27s/it, bpd=6.72, g_l=6.72, gn=3.59, l=6.33, p_l=1.03e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 50% 39/78 [04:03<03:26, 5.30s/it, bpd=5.22, g_l=5.22, gn=3.85, l=4.91, p_l=1.03e-5]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 51% 40/78 [04:08<03:21, 5.29s/it, bpd=4.79, g_l=4.79, gn=4.05, l=4.51, p_l=1.04e-5]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 53% 41/78 [04:14<03:16, 5.31s/it, bpd=3.9, g_l=3.9, gn=4.53, l=3.67, p_l=1.06e-5]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 54% 42/78 [04:19<03:10, 5.29s/it, bpd=6.06, g_l=6.06, gn=4.25, l=5.71, 
p_l=1.13e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 55% 43/78 [04:24<03:07, 5.37s/it, bpd=5.46, g_l=5.46, gn=3.52, l=5.14, p_l=1.22e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 56% 44/78 [04:30<03:00, 5.32s/it, bpd=4.86, g_l=4.86, gn=5.25, l=4.57, p_l=1.31e-5]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 58% 45/78 [04:35<02:54, 5.30s/it, bpd=6.16, g_l=6.16, gn=4.81, l=5.8, p_l=1.4e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 59% 46/78 [04:40<02:49, 5.29s/it, bpd=6.25, g_l=6.25, gn=4.33, l=5.89, p_l=1.5e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 60% 47/78 [04:45<02:43, 5.26s/it, bpd=4.42, g_l=4.42, gn=4.05, l=4.16, p_l=1.46e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 62% 48/78 [04:51<02:38, 5.27s/it, bpd=4.24, g_l=4.24, gn=5.4, l=3.99, p_l=1.39e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 63% 49/78 [04:56<02:31, 5.24s/it, bpd=4.91, g_l=4.91, gn=3.49, l=4.62, p_l=1.35e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 64% 50/78 [05:01<02:26, 5.23s/it, bpd=4.59, g_l=4.59, gn=3.64, l=4.32, p_l=1.27e-5]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 65% 51/78 [05:06<02:20, 5.22s/it, bpd=6.39, g_l=6.39, gn=4.14, l=6.02, p_l=1.18e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 67% 52/78 [05:11<02:15, 5.20s/it, bpd=4.82, g_l=4.82, gn=3.83, l=4.54, p_l=1.19e-5]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 68% 53/78 [05:17<02:09, 5.20s/it, bpd=5.18, g_l=5.18, gn=3.51, l=4.88, p_l=1.26e-5]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 69% 54/78 [05:22<02:04, 5.19s/it, bpd=4.97, g_l=4.97, gn=3.13, l=4.68, p_l=1.29e-5]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 71% 55/78 [05:27<01:59, 5.20s/it, bpd=6.02, g_l=6.02, gn=3.45, l=5.66, p_l=1.38e-5]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 72% 56/78 [05:32<01:54, 5.20s/it, bpd=4.62, g_l=4.62, gn=4.25, l=4.35, p_l=1.46e-5]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 73% 57/78 [05:37<01:49, 5.21s/it, bpd=4.71, g_l=4.71, gn=3.27, l=4.44, 
p_l=1.51e-5]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 74% 58/78 [05:43<01:44, 5.21s/it, bpd=5.38, g_l=5.38, gn=3.32, l=5.06, p_l=1.47e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 76% 59/78 [05:48<01:38, 5.20s/it, bpd=5.23, g_l=5.23, gn=3.93, l=4.92, p_l=1.39e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 77% 60/78 [05:53<01:33, 5.20s/it, bpd=4.92, g_l=4.92, gn=3.66, l=4.63, p_l=1.34e-5]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 78% 61/78 [05:58<01:28, 5.20s/it, bpd=5.66, g_l=5.66, gn=2.98, l=5.33, p_l=1.31e-5]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 79% 62/78 [06:03<01:23, 5.21s/it, bpd=4.65, g_l=4.65, gn=3.87, l=4.37, p_l=1.32e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 81% 63/78 [06:09<01:18, 5.21s/it, bpd=5.12, g_l=5.12, gn=3.4, l=4.82, p_l=1.37e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 82% 64/78 [06:14<01:13, 5.22s/it, bpd=4.36, g_l=4.36, gn=3.67, l=4.1, p_l=1.33e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 83% 65/78 [06:19<01:07, 5.21s/it, bpd=4.41, g_l=4.41, gn=3.42, l=4.15, p_l=1.31e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 85% 66/78 [06:24<01:02, 5.20s/it, bpd=6.59, g_l=6.59, gn=3.15, l=6.2, p_l=1.35e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 86% 67/78 [06:29<00:57, 5.20s/it, bpd=4.71, g_l=4.71, gn=4.24, l=4.43, p_l=1.41e-5]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 87% 68/78 [06:35<00:51, 5.20s/it, bpd=5.79, g_l=5.79, gn=2.92, l=5.45, p_l=1.49e-5]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 88% 69/78 [06:40<00:46, 5.21s/it, bpd=4.82, g_l=4.82, gn=4.05, l=4.53, p_l=1.57e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 90% 70/78 [06:45<00:41, 5.20s/it, bpd=5.07, g_l=5.07, gn=5.64, l=4.77, p_l=1.64e-5]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 91% 71/78 [06:50<00:36, 5.21s/it, bpd=5.29, g_l=5.29, gn=4.88, l=4.98, p_l=1.74e-5]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 92% 72/78 [06:56<00:31, 5.21s/it, bpd=5.2, g_l=5.2, gn=3.61, l=4.89, 
p_l=1.87e-5]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 94% 73/78 [07:01<00:25, 5.19s/it, bpd=5, g_l=5, gn=4.28, l=4.7, p_l=1.93e-5]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 95% 74/78 [07:06<00:20, 5.18s/it, bpd=4.63, g_l=4.63, gn=4.49, l=4.36, p_l=1.91e-5]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 96% 75/78 [07:11<00:15, 5.18s/it, bpd=5.43, g_l=5.43, gn=3.41, l=5.11, p_l=1.84e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n","100% 78/78 [07:27<00:00, 5.74s/it, bpd=4.65, g_l=4.65, gn=3.31, l=4.38, p_l=1.61e-5]\n","Train bpd: 5.1628 prime_loss: 0.0000 gen_loss: 5.1628 loss: 4.8591 gn: 4.0365 lr: 0.0003 lg_loss_scale: 14.9460 epoch: 8.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (6).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:776\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.05s/it, bpd=5.07, l=4.77]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:13, 1.90s/it, bpd=5.68, l=5.35]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 33% 3/9 [00:05<00:10, 1.75s/it, bpd=5.37, l=5.05]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 44% 4/9 [00:06<00:08, 1.64s/it, bpd=4.64, l=4.37]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=4.89, l=4.6]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=4.55, l=4.29]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=5.73, l=5.4]\n","Ema bpd: 5.1396 prime_loss: 0.0173 gen_loss: 5.1396 loss: 4.8377 epoch: 8.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (17).txt\n","/content/gdrive/MyDrive/slon/slon (16).txt\n","/content/gdrive/MyDrive/slon/slon (17).txt\n"," 1% 1/78 [00:05<06:54, 5.39s/it, bpd=4.56, g_l=4.56, gn=2.98, l=4.29, p_l=1.48e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 3% 2/78 [00:10<06:44, 5.33s/it, bpd=5.77, g_l=5.77, gn=3.31, l=5.43, 
p_l=1.32e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 4% 3/78 [00:15<06:38, 5.31s/it, bpd=4.51, g_l=4.51, gn=3.02, l=4.25, p_l=1.23e-5]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 5% 4/78 [00:21<06:32, 5.30s/it, bpd=5.93, g_l=5.93, gn=3.11, l=5.58, p_l=1.24e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 6% 5/78 [00:26<06:26, 5.30s/it, bpd=6, g_l=6, gn=3.18, l=5.65, p_l=1.31e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 8% 6/78 [00:31<06:20, 5.29s/it, bpd=5.37, g_l=5.37, gn=3.62, l=5.05, p_l=1.5e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 9% 7/78 [00:36<06:14, 5.27s/it, bpd=5.94, g_l=5.94, gn=3.27, l=5.59, p_l=1.66e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 10% 8/78 [00:42<06:08, 5.27s/it, bpd=4.82, g_l=4.82, gn=4.19, l=4.54, p_l=1.7e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 12% 9/78 [00:47<06:01, 5.25s/it, bpd=4.89, g_l=4.89, gn=2.93, l=4.6, p_l=1.55e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 13% 10/78 [00:52<05:55, 5.23s/it, bpd=4.25, g_l=4.25, gn=5.36, l=4, p_l=1.33e-5]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 14% 11/78 [00:57<05:49, 5.21s/it, bpd=4.82, g_l=4.82, gn=4.35, l=4.54, p_l=1.21e-5]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 15% 12/78 [01:02<05:42, 5.20s/it, bpd=4.05, g_l=4.05, gn=4.44, l=3.81, p_l=1.13e-5]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 17% 13/78 [01:08<05:37, 5.19s/it, bpd=5.33, g_l=5.33, gn=4.29, l=5.02, p_l=1.08e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 18% 14/78 [01:13<05:31, 5.18s/it, bpd=5.13, g_l=5.13, gn=2.97, l=4.83, p_l=1.09e-5]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 19% 15/78 [01:18<05:26, 5.19s/it, bpd=5.2, g_l=5.2, gn=3.78, l=4.9, p_l=1.17e-5]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 21% 16/78 [01:23<05:21, 5.19s/it, bpd=5.01, g_l=5.01, gn=5.43, l=4.72, p_l=1.24e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 22% 17/78 [01:28<05:16, 5.18s/it, bpd=6.57, g_l=6.57, gn=3.37, l=6.18, p_l=1.34e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 23% 
18/78 [01:33<05:10, 5.18s/it, bpd=5.09, g_l=5.09, gn=3.78, l=4.79, p_l=1.31e-5]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 24% 19/78 [01:39<05:05, 5.18s/it, bpd=4.63, g_l=4.63, gn=3.63, l=4.36, p_l=1.15e-5]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 26% 20/78 [01:44<05:01, 5.19s/it, bpd=5.07, g_l=5.07, gn=5.04, l=4.77, p_l=9.49e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 27% 21/78 [01:49<04:56, 5.19s/it, bpd=6.44, g_l=6.44, gn=3.63, l=6.06, p_l=8.31e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 28% 22/78 [01:54<04:51, 5.21s/it, bpd=5.03, g_l=5.03, gn=5.13, l=4.74, p_l=8.02e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 29% 23/78 [02:00<04:46, 5.22s/it, bpd=6.41, g_l=6.41, gn=3.28, l=6.03, p_l=7.44e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 31% 24/78 [02:10<06:06, 6.78s/it, bpd=4.69, g_l=4.69, gn=3.63, l=4.42, p_l=7.21e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 32% 25/78 [02:15<05:32, 6.28s/it, bpd=4.84, g_l=4.84, gn=3.47, l=4.55, p_l=7.09e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 33% 26/78 [02:20<05:09, 5.95s/it, bpd=4.49, g_l=4.49, gn=5.29, l=4.23, p_l=6.82e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 35% 27/78 [02:25<04:52, 5.73s/it, bpd=4.47, g_l=4.47, gn=4.04, l=4.21, p_l=6.47e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 36% 28/78 [02:31<04:39, 5.59s/it, bpd=5.65, g_l=5.65, gn=3.14, l=5.32, p_l=6.08e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 37% 29/78 [02:36<04:28, 5.49s/it, bpd=4.96, g_l=4.96, gn=3.77, l=4.67, p_l=6.07e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 38% 30/78 [02:41<04:19, 5.40s/it, bpd=4.57, g_l=4.57, gn=4.5, l=4.31, p_l=6.48e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 40% 31/78 [02:46<04:11, 5.35s/it, bpd=6.37, g_l=6.37, gn=5.37, l=6, p_l=6.99e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 41% 32/78 [02:52<04:04, 5.31s/it, bpd=5.23, g_l=5.23, gn=3.45, l=4.92, p_l=8.06e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 42% 33/78 [02:57<03:58, 5.29s/it, bpd=4.65, 
g_l=4.65, gn=3.56, l=4.38, p_l=9.14e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 44% 34/78 [03:02<03:51, 5.27s/it, bpd=6.31, g_l=6.31, gn=3.56, l=5.94, p_l=1.02e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 45% 35/78 [03:07<03:45, 5.25s/it, bpd=4.77, g_l=4.77, gn=3.65, l=4.49, p_l=1e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 46% 36/78 [03:12<03:39, 5.23s/it, bpd=4.72, g_l=4.72, gn=3.23, l=4.45, p_l=9.32e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 47% 37/78 [03:18<03:33, 5.21s/it, bpd=4.59, g_l=4.59, gn=3.02, l=4.32, p_l=8.5e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 49% 38/78 [03:23<03:28, 5.20s/it, bpd=6.91, g_l=6.91, gn=3.98, l=6.5, p_l=7.97e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 50% 39/78 [03:28<03:22, 5.19s/it, bpd=5.25, g_l=5.25, gn=5.1, l=4.94, p_l=7.54e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 51% 40/78 [03:33<03:17, 5.19s/it, bpd=4.12, g_l=4.12, gn=6.46, l=3.88, p_l=7.02e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 53% 41/78 [03:38<03:11, 5.19s/it, bpd=4.46, g_l=4.46, gn=3.17, l=4.2, p_l=6.34e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 54% 42/78 [03:44<03:06, 5.19s/it, bpd=5.63, g_l=5.63, gn=4.26, l=5.3, p_l=5.64e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 55% 43/78 [03:49<03:01, 5.20s/it, bpd=4.47, g_l=4.47, gn=4.22, l=4.21, p_l=4.74e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 56% 44/78 [03:54<02:56, 5.19s/it, bpd=5.97, g_l=5.97, gn=4.2, l=5.62, p_l=3.98e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 58% 45/78 [03:59<02:51, 5.20s/it, bpd=4.46, g_l=4.46, gn=3.86, l=4.2, p_l=3.53e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 59% 46/78 [04:04<02:46, 5.20s/it, bpd=5.59, g_l=5.59, gn=3.45, l=5.26, p_l=3.45e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 60% 47/78 [04:10<02:41, 5.21s/it, bpd=5.04, g_l=5.04, gn=5.64, l=4.74, p_l=3.42e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 62% 48/78 [04:15<02:36, 5.20s/it, bpd=4.54, g_l=4.54, gn=3.14, l=4.27, 
p_l=3.68e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 63% 49/78 [04:20<02:30, 5.20s/it, bpd=6.63, g_l=6.63, gn=3.45, l=6.24, p_l=3.98e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 64% 50/78 [04:25<02:25, 5.21s/it, bpd=3.8, g_l=3.8, gn=3.72, l=3.58, p_l=4.98e-6]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 65% 51/78 [04:30<02:20, 5.20s/it, bpd=4.77, g_l=4.77, gn=5.02, l=4.49, p_l=6.04e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 67% 52/78 [04:36<02:15, 5.21s/it, bpd=4.76, g_l=4.76, gn=3.95, l=4.48, p_l=6.87e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 68% 53/78 [04:41<02:10, 5.21s/it, bpd=5.6, g_l=5.6, gn=3.37, l=5.27, p_l=7.52e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 69% 54/78 [04:46<02:05, 5.22s/it, bpd=4.76, g_l=4.76, gn=3.94, l=4.48, p_l=7.63e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 71% 55/78 [04:51<02:00, 5.22s/it, bpd=5.92, g_l=5.92, gn=3.16, l=5.57, p_l=7.35e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 72% 56/78 [04:56<01:54, 5.21s/it, bpd=4.21, g_l=4.21, gn=6.62, l=3.96, p_l=7.58e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 73% 57/78 [05:02<01:49, 5.20s/it, bpd=5.59, g_l=5.59, gn=5.63, l=5.26, p_l=7.95e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 74% 58/78 [05:07<01:43, 5.19s/it, bpd=4.59, g_l=4.59, gn=4.25, l=4.32, p_l=8.53e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 76% 59/78 [05:12<01:38, 5.19s/it, bpd=5.36, g_l=5.36, gn=3.95, l=5.05, p_l=9.15e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 77% 60/78 [05:17<01:33, 5.19s/it, bpd=4.08, g_l=4.08, gn=3.83, l=3.84, p_l=9.7e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 78% 61/78 [05:22<01:28, 5.18s/it, bpd=3.93, g_l=3.93, gn=3.53, l=3.7, p_l=9.2e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 79% 62/78 [05:28<01:23, 5.19s/it, bpd=4.65, g_l=4.65, gn=4.37, l=4.38, p_l=8.92e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 81% 63/78 [05:33<01:17, 5.19s/it, bpd=4.68, g_l=4.68, gn=3.87, l=4.4, p_l=8.52e-6]/content/gdrive/MyDrive/slon/slon 
(35).txt\n"," 82% 64/78 [05:38<01:12, 5.20s/it, bpd=5.38, g_l=5.38, gn=3.8, l=5.06, p_l=8.23e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 83% 65/78 [05:43<01:07, 5.21s/it, bpd=5.23, g_l=5.23, gn=3.13, l=4.93, p_l=8.2e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 85% 66/78 [05:48<01:02, 5.22s/it, bpd=5.44, g_l=5.44, gn=4.3, l=5.12, p_l=8.65e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 86% 67/78 [05:54<00:57, 5.23s/it, bpd=5.23, g_l=5.23, gn=3.94, l=4.93, p_l=9.1e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 87% 68/78 [05:59<00:52, 5.24s/it, bpd=6.48, g_l=6.48, gn=3.68, l=6.1, p_l=9.85e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 88% 69/78 [06:04<00:47, 5.23s/it, bpd=5.18, g_l=5.18, gn=4.57, l=4.88, p_l=1.15e-5]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 90% 70/78 [06:09<00:41, 5.22s/it, bpd=5.56, g_l=5.56, gn=4.89, l=5.23, p_l=1.2e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 91% 71/78 [06:15<00:36, 5.21s/it, bpd=5.44, g_l=5.44, gn=4.37, l=5.12, p_l=1.2e-5]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 92% 72/78 [06:20<00:31, 5.19s/it, bpd=6.27, g_l=6.27, gn=4.08, l=5.9, p_l=1.22e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 94% 73/78 [06:25<00:26, 5.20s/it, bpd=6, g_l=6, gn=4.28, l=5.65, p_l=1.24e-5]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 95% 74/78 [06:30<00:20, 5.20s/it, bpd=4.61, g_l=4.61, gn=3.43, l=4.34, p_l=1.19e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 96% 75/78 [06:35<00:15, 5.20s/it, bpd=5.03, g_l=5.03, gn=3.39, l=4.74, p_l=1.05e-5]/content/gdrive/MyDrive/slon/slon (4).txt\n","100% 78/78 [06:51<00:00, 5.28s/it, bpd=4.85, g_l=4.85, gn=3.81, l=4.57, p_l=6.97e-6]\n","Train bpd: 5.1455 prime_loss: 0.0000 gen_loss: 5.1455 loss: 4.8428 gn: 3.9816 lr: 0.0003 lg_loss_scale: 15.2580 epoch: 9.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train 
inputs/ouputs\n","\u001b[35msteps:854\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.04s/it, bpd=4.84, l=4.56]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:13, 1.92s/it, bpd=4.67, l=4.4]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:05<00:10, 1.76s/it, bpd=5.04, l=4.75]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 4/9 [00:06<00:08, 1.65s/it, bpd=5.13, l=4.83]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=4.05, l=3.81]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=4.93, l=4.64]/content/gdrive/MyDrive/slon/slon (6).txt\n","100% 9/9 [00:13<00:00, 1.51s/it, bpd=5.06, l=4.77]\n","Ema bpd: 4.9103 prime_loss: 0.0171 gen_loss: 4.9103 loss: 4.6218 epoch: 9.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (23).txt\n","/content/gdrive/MyDrive/slon/slon (27).txt\n","/content/gdrive/MyDrive/slon/slon (13).txt\n"," 1% 1/78 [00:05<07:00, 5.46s/it, bpd=5.01, g_l=5.01, gn=2.98, l=4.71, p_l=6.27e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 3% 2/78 [00:10<06:48, 5.38s/it, bpd=4.84, g_l=4.84, gn=4.18, l=4.56, p_l=5.81e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 4% 3/78 [00:15<06:41, 5.35s/it, bpd=6.47, g_l=6.47, gn=3.33, l=6.09, p_l=5.63e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 5% 4/78 [00:21<06:34, 5.33s/it, bpd=5.16, g_l=5.16, gn=3.03, l=4.86, p_l=5.7e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 6% 5/78 [00:26<06:29, 5.33s/it, bpd=5.81, g_l=5.81, gn=3.18, l=5.46, p_l=6.2e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 8% 6/78 [00:31<06:22, 5.31s/it, bpd=4.91, g_l=4.91, gn=4.01, l=4.62, p_l=6.63e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 9% 7/78 [00:37<06:16, 5.30s/it, bpd=4.97, g_l=4.97, gn=3.74, l=4.68, p_l=7.1e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 10% 8/78 [00:42<06:08, 5.27s/it, bpd=5.28, g_l=5.28, gn=4.02, l=4.97, p_l=7.26e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 12% 9/78 [00:47<06:02, 5.25s/it, bpd=5.45, 
g_l=5.45, gn=3.69, l=5.13, p_l=6.85e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 13% 10/78 [00:52<05:55, 5.23s/it, bpd=4.41, g_l=4.41, gn=4.34, l=4.16, p_l=6.08e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 14% 11/78 [00:57<05:48, 5.20s/it, bpd=5.53, g_l=5.53, gn=4.01, l=5.2, p_l=5.6e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 15% 12/78 [01:03<05:43, 5.20s/it, bpd=5.74, g_l=5.74, gn=4.14, l=5.4, p_l=5.33e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 17% 13/78 [01:08<05:37, 5.19s/it, bpd=4.88, g_l=4.88, gn=3.82, l=4.59, p_l=5.2e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 18% 14/78 [01:13<05:31, 5.18s/it, bpd=4.81, g_l=4.81, gn=3.92, l=4.53, p_l=5.32e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 19% 15/78 [01:18<05:25, 5.17s/it, bpd=4.32, g_l=4.32, gn=4.61, l=4.07, p_l=5.42e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 21% 16/78 [01:23<05:20, 5.17s/it, bpd=4.68, g_l=4.68, gn=4.06, l=4.4, p_l=5.63e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 22% 17/78 [01:28<05:15, 5.18s/it, bpd=4.78, g_l=4.78, gn=5, l=4.5, p_l=5.79e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 23% 18/78 [01:34<05:11, 5.18s/it, bpd=4.87, g_l=4.87, gn=3.79, l=4.58, p_l=5.7e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 24% 19/78 [01:39<05:06, 5.20s/it, bpd=4.63, g_l=4.63, gn=3.73, l=4.35, p_l=5.64e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 26% 20/78 [01:44<05:02, 5.21s/it, bpd=4.44, g_l=4.44, gn=4.74, l=4.18, p_l=5.85e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 27% 21/78 [01:49<04:56, 5.21s/it, bpd=4.99, g_l=4.99, gn=4.12, l=4.7, p_l=5.88e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 28% 22/78 [01:54<04:51, 5.21s/it, bpd=4.55, g_l=4.55, gn=3.89, l=4.28, p_l=5.91e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 29% 23/78 [02:00<04:46, 5.21s/it, bpd=4.82, g_l=4.82, gn=4.01, l=4.54, p_l=5.97e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 31% 24/78 [02:05<04:41, 5.22s/it, bpd=5.99, g_l=5.99, gn=3.49, l=5.63, 
p_l=5.82e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 32% 25/78 [02:10<04:36, 5.21s/it, bpd=4.33, g_l=4.33, gn=3.43, l=4.08, p_l=5.77e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 33% 26/78 [02:15<04:31, 5.22s/it, bpd=5.97, g_l=5.97, gn=3.54, l=5.62, p_l=5.84e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 35% 27/78 [02:21<04:26, 5.22s/it, bpd=5.96, g_l=5.96, gn=3.24, l=5.61, p_l=5.97e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 36% 28/78 [02:26<04:20, 5.21s/it, bpd=5.85, g_l=5.85, gn=3.68, l=5.51, p_l=6.01e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 37% 29/78 [02:31<04:15, 5.21s/it, bpd=4.85, g_l=4.85, gn=4.05, l=4.56, p_l=6.07e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 38% 30/78 [02:36<04:09, 5.21s/it, bpd=6.14, g_l=6.14, gn=3.68, l=5.78, p_l=6.26e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 40% 31/78 [02:41<04:05, 5.21s/it, bpd=4.53, g_l=4.53, gn=3.7, l=4.26, p_l=6.27e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 41% 32/78 [02:47<03:59, 5.21s/it, bpd=5.63, g_l=5.63, gn=3.16, l=5.3, p_l=6.79e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 42% 33/78 [02:52<03:54, 5.22s/it, bpd=4.08, g_l=4.08, gn=3.42, l=3.84, p_l=7.25e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 44% 34/78 [02:57<03:49, 5.21s/it, bpd=4.57, g_l=4.57, gn=6.34, l=4.3, p_l=7.75e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 45% 35/78 [03:02<03:43, 5.20s/it, bpd=4.87, g_l=4.87, gn=4.11, l=4.58, p_l=8.26e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 46% 36/78 [03:07<03:38, 5.20s/it, bpd=6.59, g_l=6.59, gn=3.15, l=6.2, p_l=9.57e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 47% 37/78 [03:13<03:32, 5.19s/it, bpd=5.94, g_l=5.94, gn=3.28, l=5.59, p_l=1.12e-5]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 49% 38/78 [03:18<03:28, 5.20s/it, bpd=4.6, g_l=4.6, gn=3.2, l=4.33, p_l=1.42e-5]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 50% 39/78 [03:23<03:23, 5.21s/it, bpd=4.44, g_l=4.44, gn=5.05, l=4.18, 
p_l=1.86e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 51% 40/78 [03:28<03:18, 5.21s/it, bpd=4.99, g_l=4.99, gn=3.6, l=4.69, p_l=2.32e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 53% 41/78 [03:33<03:12, 5.20s/it, bpd=5.89, g_l=5.89, gn=3.67, l=5.55, p_l=2.72e-5]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 54% 42/78 [03:39<03:07, 5.20s/it, bpd=4.35, g_l=4.35, gn=4.11, l=4.1, p_l=3e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 55% 43/78 [03:44<03:01, 5.19s/it, bpd=3.43, g_l=3.43, gn=4.99, l=3.23, p_l=3.21e-5]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 56% 44/78 [03:49<02:56, 5.19s/it, bpd=4.9, g_l=4.9, gn=3.75, l=4.61, p_l=3.26e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 58% 45/78 [03:54<02:51, 5.19s/it, bpd=6.53, g_l=6.53, gn=3.08, l=6.15, p_l=3.17e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 59% 46/78 [04:05<03:36, 6.77s/it, bpd=4.66, g_l=4.66, gn=4.26, l=4.39, p_l=2.75e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 60% 47/78 [04:10<03:14, 6.27s/it, bpd=4.37, g_l=4.37, gn=3.22, l=4.11, p_l=2.39e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 62% 48/78 [04:15<02:58, 5.94s/it, bpd=4.49, g_l=4.49, gn=3.88, l=4.23, p_l=2.14e-5]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 63% 49/78 [04:20<02:45, 5.71s/it, bpd=4.95, g_l=4.95, gn=3.62, l=4.66, p_l=1.98e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 64% 50/78 [04:25<02:36, 5.57s/it, bpd=4.58, g_l=4.58, gn=3.84, l=4.31, p_l=1.97e-5]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 65% 51/78 [04:31<02:28, 5.49s/it, bpd=5.36, g_l=5.36, gn=3.36, l=5.04, p_l=1.95e-5]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 67% 52/78 [04:36<02:20, 5.42s/it, bpd=5.59, g_l=5.59, gn=3.08, l=5.26, p_l=1.69e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 68% 53/78 [04:41<02:14, 5.38s/it, bpd=5.69, g_l=5.69, gn=4.98, l=5.35, p_l=1.51e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 69% 54/78 [04:46<02:07, 5.33s/it, bpd=4.36, g_l=4.36, gn=4.17, l=4.11, 
p_l=1.37e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 71% 55/78 [04:52<02:01, 5.30s/it, bpd=4.32, g_l=4.32, gn=3.87, l=4.07, p_l=1.3e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 72% 56/78 [04:57<01:55, 5.27s/it, bpd=4.93, g_l=4.93, gn=4.26, l=4.64, p_l=1.11e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 73% 57/78 [05:02<01:50, 5.24s/it, bpd=4.64, g_l=4.64, gn=3.49, l=4.36, p_l=9e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 74% 58/78 [05:07<01:44, 5.22s/it, bpd=6.3, g_l=6.3, gn=3.68, l=5.93, p_l=7.4e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 76% 59/78 [05:12<01:38, 5.20s/it, bpd=5.15, g_l=5.15, gn=3.03, l=4.84, p_l=6.38e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 77% 60/78 [05:17<01:33, 5.20s/it, bpd=6.39, g_l=6.39, gn=3.16, l=6.01, p_l=5.95e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 78% 61/78 [05:23<01:28, 5.19s/it, bpd=4.78, g_l=4.78, gn=4.75, l=4.5, p_l=5.61e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 79% 62/78 [05:28<01:23, 5.19s/it, bpd=5.8, g_l=5.8, gn=3.38, l=5.46, p_l=5.34e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 81% 63/78 [05:33<01:17, 5.19s/it, bpd=5.03, g_l=5.03, gn=3.5, l=4.74, p_l=4.82e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 82% 64/78 [05:38<01:12, 5.19s/it, bpd=5.35, g_l=5.35, gn=3.4, l=5.04, p_l=4.7e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 83% 65/78 [05:43<01:07, 5.19s/it, bpd=4.84, g_l=4.84, gn=4.87, l=4.56, p_l=4.44e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 85% 66/78 [05:49<01:02, 5.19s/it, bpd=4.36, g_l=4.36, gn=3.68, l=4.1, p_l=3.91e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 86% 67/78 [05:54<00:57, 5.21s/it, bpd=5.65, g_l=5.65, gn=3.04, l=5.31, p_l=3.56e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 87% 68/78 [05:59<00:52, 5.21s/it, bpd=6.1, g_l=6.1, gn=3.41, l=5.74, p_l=3.3e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 88% 69/78 [06:04<00:46, 5.21s/it, bpd=5.1, g_l=5.1, gn=3.85, l=4.8, p_l=2.92e-6]/content/gdrive/MyDrive/slon/slon 
(3).txt\n"," 90% 70/78 [06:09<00:41, 5.21s/it, bpd=5.05, g_l=5.05, gn=3.28, l=4.76, p_l=2.72e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 91% 71/78 [06:15<00:36, 5.21s/it, bpd=5.71, g_l=5.71, gn=3.9, l=5.38, p_l=2.38e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 92% 72/78 [06:20<00:31, 5.21s/it, bpd=4.87, g_l=4.87, gn=4.83, l=4.58, p_l=2.33e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 94% 73/78 [06:25<00:26, 5.20s/it, bpd=4.8, g_l=4.8, gn=3.76, l=4.52, p_l=2.34e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 95% 74/78 [06:30<00:20, 5.22s/it, bpd=4.87, g_l=4.87, gn=3.51, l=4.59, p_l=2.42e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 96% 75/78 [06:35<00:15, 5.21s/it, bpd=4.32, g_l=4.32, gn=3.03, l=4.06, p_l=2.66e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n","100% 78/78 [06:51<00:00, 5.28s/it, bpd=4.83, g_l=4.83, gn=4.33, l=4.55, p_l=2.73e-6]\n","Train bpd: 5.0783 prime_loss: 0.0000 gen_loss: 5.0783 loss: 4.7796 gn: 3.8088 lr: 0.0003 lg_loss_scale: 15.5700 epoch: 10.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:932\u001b[0m\n"," 11% 1/9 [00:01<00:15, 1.91s/it, bpd=4.69, l=4.41]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 22% 2/9 [00:03<00:12, 1.84s/it, bpd=4.52, l=4.25]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 33% 3/9 [00:04<00:10, 1.71s/it, bpd=4.97, l=4.68]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 44% 4/9 [00:06<00:08, 1.61s/it, bpd=5.33, l=5.02]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:07<00:06, 1.55s/it, bpd=4.55, l=4.29]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.50s/it, bpd=4.69, l=4.41]/content/gdrive/MyDrive/slon/slon (5).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=4.91, l=4.62]\n","Ema bpd: 4.7768 prime_loss: 0.0166 gen_loss: 4.7768 loss: 4.4962 epoch: 10.0000\n"," 0% 0/78 [00:00, 
?it/s]/content/gdrive/MyDrive/slon/slon (17).txt\n","/content/gdrive/MyDrive/slon/slon (28).txt\n","/content/gdrive/MyDrive/slon/slon (35).txt\n"," 1% 1/78 [00:05<06:58, 5.44s/it, bpd=4.39, g_l=4.39, gn=3.29, l=4.13, p_l=2.68e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 3% 2/78 [00:10<06:47, 5.37s/it, bpd=3.35, g_l=3.35, gn=4.37, l=3.15, p_l=2.72e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 4% 3/78 [00:15<06:40, 5.33s/it, bpd=5.5, g_l=5.5, gn=3.61, l=5.17, p_l=2.92e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 5% 4/78 [00:21<06:33, 5.32s/it, bpd=4.91, g_l=4.91, gn=3.95, l=4.62, p_l=3.28e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 6% 5/78 [00:26<06:28, 5.32s/it, bpd=6.24, g_l=6.24, gn=3.32, l=5.88, p_l=3.37e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 8% 6/78 [00:31<06:22, 5.31s/it, bpd=4.4, g_l=4.4, gn=3.51, l=4.15, p_l=3.35e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 9% 7/78 [00:37<06:15, 5.29s/it, bpd=4.13, g_l=4.13, gn=4.42, l=3.89, p_l=3.15e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 10% 8/78 [00:42<06:09, 5.28s/it, bpd=4.48, g_l=4.48, gn=3.27, l=4.21, p_l=3.07e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 12% 9/78 [00:47<06:03, 5.26s/it, bpd=4.22, g_l=4.22, gn=3.18, l=3.97, p_l=3.2e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 13% 10/78 [00:52<05:56, 5.24s/it, bpd=6, g_l=6, gn=3.46, l=5.65, p_l=3.33e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 14% 11/78 [00:57<05:49, 5.22s/it, bpd=5.57, g_l=5.57, gn=3.56, l=5.24, p_l=3.41e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 15% 12/78 [01:03<05:43, 5.21s/it, bpd=4.68, g_l=4.68, gn=7.25, l=4.41, p_l=3.46e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 17% 13/78 [01:08<05:37, 5.19s/it, bpd=4.9, g_l=4.9, gn=3.58, l=4.61, p_l=3.61e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 18% 14/78 [01:13<05:31, 5.17s/it, bpd=4.64, g_l=4.64, gn=3.28, l=4.36, p_l=3.71e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 19% 15/78 [01:18<05:26, 5.18s/it, bpd=6.19, 
g_l=6.19, gn=3.38, l=5.83, p_l=3.54e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 21% 16/78 [01:23<05:20, 5.17s/it, bpd=4.44, g_l=4.44, gn=4.1, l=4.18, p_l=3.24e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 22% 17/78 [01:28<05:16, 5.18s/it, bpd=4.96, g_l=4.96, gn=4.42, l=4.66, p_l=3.09e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 23% 18/78 [01:34<05:11, 5.19s/it, bpd=4.9, g_l=4.9, gn=3.97, l=4.61, p_l=2.99e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 24% 19/78 [01:39<05:07, 5.21s/it, bpd=4.81, g_l=4.81, gn=3.73, l=4.53, p_l=2.87e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 26% 20/78 [01:44<05:01, 5.20s/it, bpd=4.16, g_l=4.16, gn=3.93, l=3.91, p_l=2.7e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:953\u001b[0m\n"," 27% 21/78 [02:25<15:06, 15.90s/it, bpd=5.32, g_l=5.32, gn=4.14, l=5.01, p_l=2.57e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 28% 22/78 [02:30<11:56, 12.80s/it, bpd=6.47, g_l=6.47, gn=4.64, l=6.09, p_l=2.43e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 29% 23/78 [02:36<09:39, 10.53s/it, bpd=6.29, g_l=6.29, gn=3.26, l=5.92, p_l=2.22e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 31% 24/78 [02:41<08:07, 9.02s/it, bpd=5.48, g_l=5.48, gn=3.05, l=5.16, p_l=2.14e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 32% 25/78 [02:47<07:01, 7.94s/it, bpd=5.24, g_l=5.24, gn=3.36, l=4.93, p_l=2.03e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 33% 26/78 [02:52<06:17, 7.25s/it, bpd=6.3, g_l=6.3, gn=4.06, l=5.93, p_l=1.99e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 35% 27/78 [02:58<05:42, 6.73s/it, bpd=4.56, g_l=4.56, gn=4.17, l=4.29, p_l=1.94e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 36% 28/78 [03:03<05:17, 6.34s/it, bpd=5.7, g_l=5.7, gn=3.98, l=5.36, p_l=1.95e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 37% 29/78 [03:09<04:55, 6.04s/it, bpd=4.45, g_l=4.45, gn=3.14, l=4.18, p_l=2.07e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 38% 30/78 
[03:14<04:39, 5.83s/it, bpd=4.65, g_l=4.65, gn=4.8, l=4.37, p_l=2.13e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 40% 31/78 [03:19<04:25, 5.65s/it, bpd=5.08, g_l=5.08, gn=3.59, l=4.78, p_l=2.1e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 41% 32/78 [03:24<04:12, 5.50s/it, bpd=4.74, g_l=4.74, gn=3.35, l=4.46, p_l=2.12e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 42% 33/78 [03:29<04:03, 5.41s/it, bpd=4.68, g_l=4.68, gn=2.9, l=4.41, p_l=2.18e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 44% 34/78 [03:35<03:54, 5.33s/it, bpd=4.8, g_l=4.8, gn=3.58, l=4.52, p_l=2.22e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 45% 35/78 [03:40<03:48, 5.30s/it, bpd=4.8, g_l=4.8, gn=3.65, l=4.52, p_l=2.34e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 46% 36/78 [03:45<03:41, 5.26s/it, bpd=4.76, g_l=4.76, gn=4, l=4.48, p_l=2.39e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 47% 37/78 [03:50<03:35, 5.25s/it, bpd=5.76, g_l=5.76, gn=3.75, l=5.42, p_l=2.4e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 49% 38/78 [03:55<03:29, 5.24s/it, bpd=6.06, g_l=6.06, gn=4.08, l=5.71, p_l=2.5e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 50% 39/78 [04:01<03:25, 5.27s/it, bpd=4.8, g_l=4.8, gn=3.85, l=4.52, p_l=2.51e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 51% 40/78 [04:06<03:20, 5.27s/it, bpd=4.41, g_l=4.41, gn=3.74, l=4.15, p_l=2.62e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 53% 41/78 [04:11<03:15, 5.27s/it, bpd=5.5, g_l=5.5, gn=3.19, l=5.18, p_l=2.85e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 54% 42/78 [04:17<03:10, 5.29s/it, bpd=5.69, g_l=5.69, gn=3.35, l=5.36, p_l=2.94e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 55% 43/78 [04:22<03:04, 5.28s/it, bpd=4.84, g_l=4.84, gn=3.57, l=4.56, p_l=3.1e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 56% 44/78 [04:27<03:01, 5.33s/it, bpd=6.16, g_l=6.16, gn=3.37, l=5.8, p_l=3.49e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 58% 45/78 [04:33<02:55, 5.32s/it, bpd=5.82, g_l=5.82, gn=3.61, 
l=5.48, p_l=3.86e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 59% 46/78 [04:38<02:50, 5.33s/it, bpd=7.1, g_l=7.1, gn=3.36, l=6.68, p_l=4.23e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 60% 47/78 [04:43<02:44, 5.31s/it, bpd=4.51, g_l=4.51, gn=3.78, l=4.24, p_l=4.67e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 62% 48/78 [04:49<02:39, 5.32s/it, bpd=5.47, g_l=5.47, gn=3.4, l=5.15, p_l=5.12e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 63% 49/78 [04:54<02:33, 5.29s/it, bpd=6.08, g_l=6.08, gn=3.33, l=5.73, p_l=5.75e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 64% 50/78 [04:59<02:27, 5.26s/it, bpd=4.66, g_l=4.66, gn=3.33, l=4.39, p_l=6.02e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 65% 51/78 [05:04<02:21, 5.23s/it, bpd=4.9, g_l=4.9, gn=3.51, l=4.61, p_l=6.13e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 67% 52/78 [05:09<02:15, 5.20s/it, bpd=4.46, g_l=4.46, gn=3.9, l=4.2, p_l=5.79e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 68% 53/78 [05:14<02:09, 5.19s/it, bpd=5.02, g_l=5.02, gn=4.97, l=4.72, p_l=5.53e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 69% 54/78 [05:20<02:04, 5.17s/it, bpd=5.27, g_l=5.27, gn=3.11, l=4.96, p_l=5.36e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 71% 55/78 [05:25<01:59, 5.18s/it, bpd=5.19, g_l=5.19, gn=4.78, l=4.89, p_l=4.97e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 72% 56/78 [05:30<01:54, 5.18s/it, bpd=4.78, g_l=4.78, gn=4.01, l=4.49, p_l=4.65e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 73% 57/78 [05:35<01:49, 5.20s/it, bpd=4.62, g_l=4.62, gn=3.64, l=4.35, p_l=4.58e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 74% 58/78 [05:40<01:44, 5.20s/it, bpd=4.5, g_l=4.5, gn=3.32, l=4.23, p_l=4.7e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 76% 59/78 [05:46<01:38, 5.20s/it, bpd=5.08, g_l=5.08, gn=3.9, l=4.78, p_l=5.04e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 77% 60/78 [05:51<01:33, 5.20s/it, bpd=5.22, g_l=5.22, gn=4.92, l=4.92, 
p_l=5.51e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 78% 61/78 [05:56<01:28, 5.21s/it, bpd=4.59, g_l=4.59, gn=3.94, l=4.32, p_l=5.94e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 79% 62/78 [06:01<01:23, 5.22s/it, bpd=4.96, g_l=4.96, gn=3.56, l=4.67, p_l=6.14e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 81% 63/78 [06:07<01:18, 5.21s/it, bpd=3.82, g_l=3.82, gn=4.44, l=3.6, p_l=6.16e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 82% 64/78 [06:12<01:13, 5.23s/it, bpd=4.28, g_l=4.28, gn=4.87, l=4.03, p_l=5.93e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 83% 65/78 [06:17<01:07, 5.23s/it, bpd=4.44, g_l=4.44, gn=3.89, l=4.18, p_l=5.78e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 85% 66/78 [06:22<01:02, 5.23s/it, bpd=4.28, g_l=4.28, gn=4.16, l=4.03, p_l=5.69e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 86% 67/78 [06:27<00:57, 5.22s/it, bpd=4.77, g_l=4.77, gn=3.38, l=4.49, p_l=5.78e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 87% 68/78 [06:35<01:00, 6.02s/it, bpd=4.82, g_l=4.82, gn=3.17, l=4.54, p_l=5.63e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 88% 69/78 [06:40<00:51, 5.76s/it, bpd=5.42, g_l=5.42, gn=3.84, l=5.1, p_l=5.25e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 90% 70/78 [06:46<00:44, 5.59s/it, bpd=4.93, g_l=4.93, gn=3.85, l=4.64, p_l=4.94e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 91% 71/78 [06:51<00:38, 5.47s/it, bpd=5.19, g_l=5.19, gn=3.27, l=4.88, p_l=4.92e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 92% 72/78 [06:56<00:32, 5.38s/it, bpd=5.55, g_l=5.55, gn=4.16, l=5.22, p_l=5.22e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 94% 73/78 [07:01<00:26, 5.32s/it, bpd=5.76, g_l=5.76, gn=3.46, l=5.42, p_l=5.87e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 95% 74/78 [07:06<00:21, 5.28s/it, bpd=4.81, g_l=4.81, gn=3.91, l=4.52, p_l=6.3e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 96% 75/78 [07:12<00:15, 5.27s/it, bpd=6.31, g_l=6.31, gn=3.28, l=5.94, 
p_l=6.39e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n","100% 78/78 [07:27<00:00, 5.74s/it, bpd=4.95, g_l=4.95, gn=3.79, l=4.66, p_l=4.46e-6]\n","Train bpd: 5.0579 prime_loss: 0.0000 gen_loss: 5.0579 loss: 4.7604 gn: 3.8687 lr: 0.0003 lg_loss_scale: 15.8820 epoch: 11.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (6).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1010\u001b[0m\n"," 11% 1/9 [00:01<00:14, 1.78s/it, bpd=4.85, l=4.57]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 22% 2/9 [00:03<00:11, 1.69s/it, bpd=5.39, l=5.07]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:04<00:09, 1.62s/it, bpd=5.08, l=4.78]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 44% 4/9 [00:06<00:07, 1.56s/it, bpd=5.06, l=4.76]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.51s/it, bpd=4.93, l=4.64]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 67% 6/9 [00:08<00:04, 1.48s/it, bpd=4.11, l=3.86]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.47s/it, bpd=4.29, l=4.03]\n","Ema bpd: 4.8407 prime_loss: 0.0164 gen_loss: 4.8407 loss: 4.5563 epoch: 11.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (32).txt\n","/content/gdrive/MyDrive/slon/slon (27).txt\n","/content/gdrive/MyDrive/slon/slon (23).txt\n"," 1% 1/78 [00:05<06:52, 5.36s/it, bpd=5.96, g_l=5.96, gn=6.41, l=5.61, p_l=3.85e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 3% 2/78 [00:10<06:44, 5.32s/it, bpd=4.41, g_l=4.41, gn=6.3, l=4.15, p_l=3.24e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 4% 3/78 [00:15<06:37, 5.29s/it, bpd=5.27, g_l=5.27, gn=4.05, l=4.96, p_l=2.73e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 5% 4/78 [00:21<06:32, 5.30s/it, bpd=4.66, g_l=4.66, gn=3.56, l=4.39, p_l=2.27e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 6% 5/78 [00:26<06:25, 5.29s/it, bpd=6.18, g_l=6.18, gn=3.47, l=5.81, 
p_l=2e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 8% 6/78 [00:31<06:20, 5.28s/it, bpd=4.74, g_l=4.74, gn=3.69, l=4.46, p_l=1.82e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 9% 7/78 [00:36<06:13, 5.26s/it, bpd=4.45, g_l=4.45, gn=3.25, l=4.19, p_l=1.83e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 10% 8/78 [00:42<06:06, 5.23s/it, bpd=6.25, g_l=6.25, gn=3.16, l=5.88, p_l=1.8e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 12% 9/78 [00:47<06:00, 5.22s/it, bpd=4.48, g_l=4.48, gn=3.75, l=4.22, p_l=1.88e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 13% 10/78 [00:52<05:53, 5.20s/it, bpd=5.75, g_l=5.75, gn=3.98, l=5.41, p_l=1.98e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [00:57<05:48, 5.20s/it, bpd=6.45, g_l=6.45, gn=3.39, l=6.07, p_l=2.13e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 15% 12/78 [01:02<05:42, 5.19s/it, bpd=5.06, g_l=5.06, gn=4.32, l=4.76, p_l=2.23e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 17% 13/78 [01:07<05:37, 5.19s/it, bpd=4.7, g_l=4.7, gn=5.13, l=4.42, p_l=2.44e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 18% 14/78 [01:13<05:32, 5.19s/it, bpd=4.91, g_l=4.91, gn=3.11, l=4.62, p_l=2.66e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 19% 15/78 [01:18<05:27, 5.20s/it, bpd=4.35, g_l=4.35, gn=3.32, l=4.09, p_l=2.76e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 21% 16/78 [01:23<05:21, 5.19s/it, bpd=5.73, g_l=5.73, gn=3.46, l=5.39, p_l=2.89e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 22% 17/78 [01:28<05:15, 5.18s/it, bpd=4.58, g_l=4.58, gn=4.36, l=4.31, p_l=2.99e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 23% 18/78 [01:33<05:10, 5.18s/it, bpd=4.76, g_l=4.76, gn=3.52, l=4.48, p_l=3.11e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 24% 19/78 [01:39<05:05, 5.18s/it, bpd=4.67, g_l=4.67, gn=6.99, l=4.39, p_l=3.52e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 26% 20/78 [01:44<05:00, 5.18s/it, bpd=4.63, g_l=4.63, gn=4.41, l=4.36, p_l=3.91e-6]/content/gdrive/MyDrive/slon/slon 
(19).txt\n"," 27% 21/78 [01:49<04:55, 5.19s/it, bpd=4.95, g_l=4.95, gn=3.53, l=4.66, p_l=4.35e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 28% 22/78 [01:54<04:50, 5.19s/it, bpd=4.7, g_l=4.7, gn=4.26, l=4.42, p_l=4.98e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 29% 23/78 [01:59<04:45, 5.19s/it, bpd=5.46, g_l=5.46, gn=3.86, l=5.14, p_l=5.61e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 31% 24/78 [02:05<04:40, 5.20s/it, bpd=5.37, g_l=5.37, gn=3.15, l=5.06, p_l=6.24e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 32% 25/78 [02:10<04:35, 5.19s/it, bpd=5.06, g_l=5.06, gn=3.27, l=4.76, p_l=7.06e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 33% 26/78 [02:15<04:29, 5.18s/it, bpd=4.49, g_l=4.49, gn=3.36, l=4.22, p_l=8.36e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 35% 27/78 [02:20<04:24, 5.18s/it, bpd=5.72, g_l=5.72, gn=3.07, l=5.38, p_l=1.12e-5]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 36% 28/78 [02:25<04:18, 5.17s/it, bpd=4.28, g_l=4.28, gn=2.97, l=4.02, p_l=1.43e-5]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 37% 29/78 [02:30<04:14, 5.19s/it, bpd=5.89, g_l=5.89, gn=4.94, l=5.55, p_l=1.67e-5]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 38% 30/78 [02:36<04:09, 5.20s/it, bpd=3.84, g_l=3.84, gn=6.01, l=3.61, p_l=1.74e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 40% 31/78 [02:41<04:04, 5.21s/it, bpd=5.97, g_l=5.97, gn=3.7, l=5.62, p_l=1.75e-5]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 41% 32/78 [02:46<03:59, 5.20s/it, bpd=4.86, g_l=4.86, gn=3.47, l=4.58, p_l=1.77e-5]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 42% 33/78 [02:51<03:53, 5.20s/it, bpd=5.65, g_l=5.65, gn=3.25, l=5.32, p_l=1.71e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 44% 34/78 [02:56<03:48, 5.19s/it, bpd=4.99, g_l=4.99, gn=6.6, l=4.69, p_l=1.84e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 45% 35/78 [03:02<03:43, 5.19s/it, bpd=4.4, g_l=4.4, gn=3.39, l=4.14, p_l=1.94e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 46% 36/78 [03:07<03:37, 
5.19s/it, bpd=4.2, g_l=4.2, gn=3.23, l=3.95, p_l=2.13e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 47% 37/78 [03:12<03:32, 5.19s/it, bpd=4.53, g_l=4.53, gn=3.28, l=4.27, p_l=2.24e-5]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 49% 38/78 [03:17<03:28, 5.20s/it, bpd=4.22, g_l=4.22, gn=3.18, l=3.97, p_l=2.11e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 50% 39/78 [03:22<03:23, 5.21s/it, bpd=4.07, g_l=4.07, gn=3.78, l=3.83, p_l=2e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 51% 40/78 [03:28<03:17, 5.21s/it, bpd=4.64, g_l=4.64, gn=4.3, l=4.37, p_l=1.89e-5]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 53% 41/78 [03:33<03:12, 5.20s/it, bpd=4.38, g_l=4.38, gn=3.16, l=4.12, p_l=1.67e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 54% 42/78 [03:38<03:07, 5.21s/it, bpd=5.51, g_l=5.51, gn=2.98, l=5.18, p_l=1.53e-5]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 55% 43/78 [03:43<03:01, 5.20s/it, bpd=6.14, g_l=6.14, gn=3.17, l=5.78, p_l=1.43e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 56% 44/78 [03:48<02:56, 5.20s/it, bpd=5.52, g_l=5.52, gn=2.98, l=5.19, p_l=1.34e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 58% 45/78 [03:54<02:51, 5.19s/it, bpd=4.89, g_l=4.89, gn=5.27, l=4.6, p_l=1.24e-5]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 59% 46/78 [03:59<02:45, 5.19s/it, bpd=5.59, g_l=5.59, gn=3.2, l=5.26, p_l=1.2e-5]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 60% 47/78 [04:04<02:41, 5.19s/it, bpd=4.22, g_l=4.22, gn=5.87, l=3.98, p_l=1.21e-5]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 62% 48/78 [04:09<02:35, 5.19s/it, bpd=4.93, g_l=4.93, gn=4.36, l=4.64, p_l=1.2e-5]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 63% 49/78 [04:14<02:30, 5.20s/it, bpd=5.96, g_l=5.96, gn=3.83, l=5.61, p_l=1.17e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 64% 50/78 [04:20<02:25, 5.20s/it, bpd=5.1, g_l=5.1, gn=4.05, l=4.8, p_l=1.14e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 65% 51/78 [04:25<02:20, 5.19s/it, bpd=5.24, g_l=5.24, gn=3.58, l=4.93, 
p_l=1.14e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 67% 52/78 [04:30<02:15, 5.19s/it, bpd=4.93, g_l=4.93, gn=4.02, l=4.64, p_l=1.12e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 68% 53/78 [04:35<02:09, 5.19s/it, bpd=4.91, g_l=4.91, gn=3.97, l=4.63, p_l=1.16e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 69% 54/78 [04:40<02:04, 5.19s/it, bpd=4.5, g_l=4.5, gn=3.93, l=4.23, p_l=1.15e-5]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 71% 55/78 [04:46<01:59, 5.19s/it, bpd=4.25, g_l=4.25, gn=3.79, l=4, p_l=1.07e-5]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 72% 56/78 [04:51<01:54, 5.21s/it, bpd=4.96, g_l=4.96, gn=4.61, l=4.67, p_l=1.07e-5]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 73% 57/78 [04:56<01:49, 5.21s/it, bpd=5.48, g_l=5.48, gn=3.34, l=5.16, p_l=1.07e-5]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 74% 58/78 [05:01<01:44, 5.23s/it, bpd=5.17, g_l=5.17, gn=3.14, l=4.86, p_l=1.06e-5]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 76% 59/78 [05:06<01:39, 5.22s/it, bpd=4.74, g_l=4.74, gn=4.58, l=4.46, p_l=1e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 77% 60/78 [05:12<01:33, 5.22s/it, bpd=3.92, g_l=3.92, gn=3.33, l=3.69, p_l=8.97e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 78% 61/78 [05:17<01:28, 5.21s/it, bpd=6.09, g_l=6.09, gn=3.64, l=5.73, p_l=8.03e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 79% 62/78 [05:22<01:23, 5.20s/it, bpd=4.91, g_l=4.91, gn=4.6, l=4.62, p_l=7.28e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 81% 63/78 [05:27<01:17, 5.20s/it, bpd=5.33, g_l=5.33, gn=3.35, l=5.02, p_l=6.93e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 82% 64/78 [05:32<01:12, 5.19s/it, bpd=5.4, g_l=5.4, gn=3.85, l=5.08, p_l=6.8e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 83% 65/78 [05:38<01:07, 5.19s/it, bpd=5.7, g_l=5.7, gn=3.72, l=5.37, p_l=7.04e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 85% 66/78 [05:43<01:02, 5.19s/it, bpd=4.84, g_l=4.84, gn=3.03, l=4.55, p_l=7.77e-6]/content/gdrive/MyDrive/slon/slon 
(23).txt\n"," 86% 67/78 [05:48<00:57, 5.19s/it, bpd=6.13, g_l=6.13, gn=3.16, l=5.77, p_l=8.33e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 87% 68/78 [05:53<00:51, 5.19s/it, bpd=6.13, g_l=6.13, gn=3.39, l=5.77, p_l=8.5e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 88% 69/78 [05:58<00:46, 5.19s/it, bpd=5.28, g_l=5.28, gn=3.18, l=4.97, p_l=7.61e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 90% 70/78 [06:04<00:41, 5.18s/it, bpd=5.97, g_l=5.97, gn=3.41, l=5.62, p_l=6.99e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 91% 71/78 [06:09<00:36, 5.17s/it, bpd=5.54, g_l=5.54, gn=4.46, l=5.21, p_l=6.39e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 92% 72/78 [06:14<00:31, 5.18s/it, bpd=4.23, g_l=4.23, gn=4.01, l=3.98, p_l=5.75e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 94% 73/78 [06:19<00:25, 5.17s/it, bpd=6.1, g_l=6.1, gn=3.09, l=5.74, p_l=5.3e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 95% 74/78 [06:24<00:20, 5.19s/it, bpd=3.78, g_l=3.78, gn=3.85, l=3.56, p_l=4.95e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 96% 75/78 [06:29<00:15, 5.19s/it, bpd=4.69, g_l=4.69, gn=3.53, l=4.41, p_l=4.5e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n","100% 78/78 [06:45<00:00, 5.20s/it, bpd=3.29, g_l=3.29, gn=3.77, l=3.09, p_l=3.54e-6]\n","Train bpd: 5.0263 prime_loss: 0.0000 gen_loss: 5.0263 loss: 4.7306 gn: 3.8740 lr: 0.0003 lg_loss_scale: 16.1940 epoch: 12.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1088\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.01s/it, bpd=4.67, l=4.4]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 22% 2/9 [00:03<00:13, 1.87s/it, bpd=5.77, l=5.43]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:04<00:10, 1.73s/it, bpd=4.6, l=4.33]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 44% 4/9 [00:06<00:08, 1.62s/it, bpd=4.97, 
l=4.68]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 56% 5/9 [00:07<00:06, 1.55s/it, bpd=4.55, l=4.28]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 67% 6/9 [00:09<00:04, 1.51s/it, bpd=5.42, l=5.1]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.49s/it, bpd=5.15, l=4.85]\n","Ema bpd: 5.0360 prime_loss: 0.0164 gen_loss: 5.0360 loss: 4.7401 epoch: 12.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (15).txt\n","/content/gdrive/MyDrive/slon/slon (16).txt\n","/content/gdrive/MyDrive/slon/slon (11).txt\n"," 1% 1/78 [00:05<06:57, 5.42s/it, bpd=4.68, g_l=4.68, gn=3.4, l=4.41, p_l=3.34e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 3% 2/78 [00:10<06:47, 5.36s/it, bpd=4.28, g_l=4.28, gn=3.95, l=4.03, p_l=3.22e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 4% 3/78 [00:15<06:40, 5.34s/it, bpd=4.36, g_l=4.36, gn=4.19, l=4.1, p_l=3.25e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 5% 4/78 [00:21<06:33, 5.32s/it, bpd=4.5, g_l=4.5, gn=4.3, l=4.23, p_l=3.2e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 6% 5/78 [00:26<06:29, 5.33s/it, bpd=5.32, g_l=5.32, gn=3.69, l=5.01, p_l=3.27e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 8% 6/78 [00:31<06:23, 5.32s/it, bpd=5.53, g_l=5.53, gn=3.99, l=5.21, p_l=3.45e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 9% 7/78 [00:37<06:16, 5.30s/it, bpd=5.65, g_l=5.65, gn=3.3, l=5.32, p_l=3.44e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 10% 8/78 [00:42<06:09, 5.28s/it, bpd=4.28, g_l=4.28, gn=3.51, l=4.03, p_l=3.5e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 12% 9/78 [00:47<06:02, 5.26s/it, bpd=5.13, g_l=5.13, gn=3.35, l=4.83, p_l=3.5e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 13% 10/78 [00:52<05:56, 5.24s/it, bpd=4.36, g_l=4.36, gn=3, l=4.1, p_l=3.58e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 14% 11/78 [00:57<05:49, 5.21s/it, bpd=4.21, g_l=4.21, gn=4.65, l=3.96, p_l=3.57e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 15% 12/78 [01:07<07:20, 6.67s/it, 
bpd=5.05, g_l=5.05, gn=3.96, l=4.76, p_l=3.55e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 17% 13/78 [01:13<06:43, 6.20s/it, bpd=6.74, g_l=6.74, gn=3.76, l=6.34, p_l=3.63e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 18% 14/78 [01:18<06:15, 5.86s/it, bpd=4.5, g_l=4.5, gn=4.29, l=4.23, p_l=3.86e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 19% 15/78 [01:23<05:55, 5.64s/it, bpd=4.11, g_l=4.11, gn=3.51, l=3.87, p_l=3.96e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 21% 16/78 [01:28<05:40, 5.50s/it, bpd=4.28, g_l=4.28, gn=4, l=4.03, p_l=3.63e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 22% 17/78 [01:33<05:30, 5.41s/it, bpd=4.47, g_l=4.47, gn=3.57, l=4.2, p_l=3.03e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 23% 18/78 [01:39<05:23, 5.39s/it, bpd=5.54, g_l=5.54, gn=4.4, l=5.21, p_l=2.66e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 24% 19/78 [01:44<05:16, 5.36s/it, bpd=4.59, g_l=4.59, gn=4.21, l=4.32, p_l=2.42e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 26% 20/78 [01:49<05:09, 5.34s/it, bpd=4.67, g_l=4.67, gn=4.36, l=4.39, p_l=2.2e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 27% 21/78 [01:54<05:02, 5.30s/it, bpd=5.08, g_l=5.08, gn=3.86, l=4.78, p_l=2.12e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 28% 22/78 [02:00<04:56, 5.29s/it, bpd=4.35, g_l=4.35, gn=3.89, l=4.09, p_l=2.02e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 29% 23/78 [02:05<04:49, 5.27s/it, bpd=4.51, g_l=4.51, gn=4.09, l=4.25, p_l=1.91e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 31% 24/78 [02:10<04:42, 5.24s/it, bpd=4.6, g_l=4.6, gn=4.61, l=4.33, p_l=2.09e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 32% 25/78 [02:15<04:36, 5.22s/it, bpd=6.19, g_l=6.19, gn=3.41, l=5.83, p_l=2.33e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 33% 26/78 [02:20<04:30, 5.20s/it, bpd=5.72, g_l=5.72, gn=3.49, l=5.38, p_l=2.38e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 35% 27/78 [02:25<04:24, 5.19s/it, bpd=5.07, g_l=5.07, gn=3.32, l=4.77, 
p_l=2.38e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 36% 28/78 [02:31<04:19, 5.18s/it, bpd=4.76, g_l=4.76, gn=4.74, l=4.48, p_l=2.36e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 37% 29/78 [02:36<04:14, 5.18s/it, bpd=6.14, g_l=6.14, gn=3.85, l=5.78, p_l=2.4e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 38% 30/78 [02:41<04:08, 5.17s/it, bpd=4.57, g_l=4.57, gn=3.21, l=4.31, p_l=2.43e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 40% 31/78 [02:46<04:03, 5.18s/it, bpd=4.32, g_l=4.32, gn=3.48, l=4.06, p_l=2.52e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 41% 32/78 [02:51<03:58, 5.18s/it, bpd=5.87, g_l=5.87, gn=3.5, l=5.52, p_l=2.39e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 42% 33/78 [02:56<03:52, 5.17s/it, bpd=5.21, g_l=5.21, gn=3.6, l=4.91, p_l=2.3e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 44% 34/78 [03:02<03:47, 5.16s/it, bpd=4.82, g_l=4.82, gn=3.75, l=4.54, p_l=2.25e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 45% 35/78 [03:07<03:42, 5.17s/it, bpd=5.67, g_l=5.67, gn=3.61, l=5.34, p_l=2.23e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 46% 36/78 [03:12<03:37, 5.18s/it, bpd=5.58, g_l=5.58, gn=2.99, l=5.25, p_l=2.28e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 47% 37/78 [03:17<03:32, 5.19s/it, bpd=4.88, g_l=4.88, gn=3.29, l=4.59, p_l=2.34e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 49% 38/78 [03:22<03:27, 5.20s/it, bpd=4.88, g_l=4.88, gn=3.22, l=4.59, p_l=2.36e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 50% 39/78 [03:28<03:22, 5.20s/it, bpd=4.33, g_l=4.33, gn=3.4, l=4.07, p_l=2.24e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 51% 40/78 [03:33<03:17, 5.21s/it, bpd=4.48, g_l=4.48, gn=3.54, l=4.22, p_l=2.13e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 53% 41/78 [03:38<03:12, 5.21s/it, bpd=4.77, g_l=4.77, gn=3.9, l=4.49, p_l=2.12e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 54% 42/78 [03:43<03:07, 5.20s/it, bpd=5.19, g_l=5.19, gn=6.71, l=4.88, 
p_l=2.26e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 55% 43/78 [03:48<03:01, 5.20s/it, bpd=4.74, g_l=4.74, gn=4.52, l=4.46, p_l=2.32e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 56% 44/78 [03:54<02:56, 5.19s/it, bpd=5.4, g_l=5.4, gn=4.35, l=5.08, p_l=2.42e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 58% 45/78 [03:59<02:51, 5.21s/it, bpd=4.76, g_l=4.76, gn=3.98, l=4.48, p_l=2.61e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 59% 46/78 [04:04<02:46, 5.21s/it, bpd=4.43, g_l=4.43, gn=3.15, l=4.17, p_l=2.74e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 60% 47/78 [04:09<02:41, 5.22s/it, bpd=6.22, g_l=6.22, gn=3.87, l=5.86, p_l=2.73e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 62% 48/78 [04:15<02:36, 5.22s/it, bpd=6.75, g_l=6.75, gn=3.16, l=6.35, p_l=2.77e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 63% 49/78 [04:20<02:31, 5.22s/it, bpd=5.14, g_l=5.14, gn=3.62, l=4.84, p_l=2.7e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 64% 50/78 [04:25<02:26, 5.22s/it, bpd=5.03, g_l=5.03, gn=4.15, l=4.73, p_l=2.64e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 65% 51/78 [04:30<02:21, 5.22s/it, bpd=5.01, g_l=5.01, gn=3.39, l=4.72, p_l=2.63e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 67% 52/78 [04:35<02:15, 5.22s/it, bpd=3.51, g_l=3.51, gn=2.94, l=3.3, p_l=2.57e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 68% 53/78 [04:41<02:10, 5.21s/it, bpd=3.91, g_l=3.91, gn=3.25, l=3.68, p_l=2.57e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 69% 54/78 [04:46<02:05, 5.21s/it, bpd=4.74, g_l=4.74, gn=5.51, l=4.46, p_l=2.74e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 71% 55/78 [04:51<01:59, 5.21s/it, bpd=4.39, g_l=4.39, gn=4.55, l=4.14, p_l=2.81e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 72% 56/78 [04:56<01:54, 5.21s/it, bpd=5.76, g_l=5.76, gn=3.73, l=5.42, p_l=2.97e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 73% 57/78 [05:01<01:49, 5.20s/it, bpd=5.48, g_l=5.48, gn=2.88, l=5.16, 
p_l=3.09e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 74% 58/78 [05:07<01:44, 5.20s/it, bpd=4.64, g_l=4.64, gn=4.01, l=4.37, p_l=3.02e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 76% 59/78 [05:12<01:38, 5.19s/it, bpd=4, g_l=4, gn=3.65, l=3.77, p_l=2.91e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 77% 60/78 [05:17<01:33, 5.18s/it, bpd=5.51, g_l=5.51, gn=3.97, l=5.19, p_l=2.94e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 78% 61/78 [05:22<01:28, 5.19s/it, bpd=6.39, g_l=6.39, gn=3.85, l=6.01, p_l=2.71e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 79% 62/78 [05:27<01:22, 5.18s/it, bpd=4.27, g_l=4.27, gn=3.97, l=4.02, p_l=2.55e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 81% 63/78 [05:33<01:17, 5.18s/it, bpd=4.11, g_l=4.11, gn=5.56, l=3.87, p_l=2.34e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 82% 64/78 [05:38<01:12, 5.17s/it, bpd=4.16, g_l=4.16, gn=5.24, l=3.92, p_l=2.2e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 83% 65/78 [05:43<01:07, 5.18s/it, bpd=5.01, g_l=5.01, gn=4.18, l=4.71, p_l=2.17e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 85% 66/78 [05:48<01:02, 5.17s/it, bpd=4.62, g_l=4.62, gn=4.42, l=4.35, p_l=1.98e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 86% 67/78 [05:53<00:56, 5.18s/it, bpd=4.62, g_l=4.62, gn=3.88, l=4.35, p_l=1.82e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 87% 68/78 [05:58<00:51, 5.18s/it, bpd=4.87, g_l=4.87, gn=12.3, l=4.59, p_l=1.78e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 88% 69/78 [06:04<00:46, 5.18s/it, bpd=4.17, g_l=4.17, gn=3.97, l=3.92, p_l=1.74e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 90% 70/78 [06:09<00:41, 5.17s/it, bpd=4.72, g_l=4.72, gn=3.4, l=4.44, p_l=1.69e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 91% 71/78 [06:14<00:36, 5.17s/it, bpd=4.26, g_l=4.26, gn=3.84, l=4.01, p_l=1.66e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 92% 72/78 [06:19<00:30, 5.16s/it, bpd=4.29, g_l=4.29, gn=3.51, l=4.04, 
p_l=1.54e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 94% 73/78 [06:24<00:25, 5.16s/it, bpd=5.86, g_l=5.86, gn=4.96, l=5.51, p_l=1.43e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 95% 74/78 [06:29<00:20, 5.16s/it, bpd=5.12, g_l=5.12, gn=4.37, l=4.82, p_l=1.33e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 96% 75/78 [06:35<00:15, 5.16s/it, bpd=4.92, g_l=4.92, gn=4.48, l=4.63, p_l=1.22e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n","100% 78/78 [06:50<00:00, 5.27s/it, bpd=5.59, g_l=5.59, gn=3.87, l=5.26, p_l=1.06e-6]\n","Train bpd: 4.9423 prime_loss: 0.0000 gen_loss: 4.9423 loss: 4.6516 gn: 4.0006 lr: 0.0003 lg_loss_scale: 16.5060 epoch: 13.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1166\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.03s/it, bpd=5.69, l=5.35]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 22% 2/9 [00:03<00:13, 1.90s/it, bpd=4.91, l=4.62]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:05<00:10, 1.75s/it, bpd=5.15, l=4.84]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 4/9 [00:06<00:08, 1.64s/it, bpd=5.16, l=4.85]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=4.85, l=4.57]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=5.19, l=4.89]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.51s/it, bpd=5.64, l=5.31]\n","Ema bpd: 5.1223 prime_loss: 0.0161 gen_loss: 5.1223 loss: 4.8214 epoch: 13.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (16).txt\n","/content/gdrive/MyDrive/slon/slon (11).txt\n","/content/gdrive/MyDrive/slon/slon (30).txt\n"," 1% 1/78 [00:05<07:00, 5.46s/it, bpd=5.36, g_l=5.36, gn=3.36, l=5.05, p_l=1.06e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 3% 2/78 [00:10<06:49, 5.39s/it, bpd=5.36, g_l=5.36, gn=3.42, l=5.04, 
p_l=1.09e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 4% 3/78 [00:15<06:41, 5.35s/it, bpd=5.56, g_l=5.56, gn=3.45, l=5.24, p_l=1.16e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 5% 4/78 [00:21<06:37, 5.37s/it, bpd=4.45, g_l=4.45, gn=3.65, l=4.19, p_l=1.2e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 6% 5/78 [00:26<06:30, 5.34s/it, bpd=5.16, g_l=5.16, gn=3.62, l=4.85, p_l=1.29e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 8% 6/78 [00:31<06:22, 5.31s/it, bpd=6.08, g_l=6.08, gn=3.6, l=5.73, p_l=1.37e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 9% 7/78 [00:37<06:15, 5.29s/it, bpd=5.75, g_l=5.75, gn=3.29, l=5.41, p_l=1.54e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 10% 8/78 [00:42<06:08, 5.26s/it, bpd=5.18, g_l=5.18, gn=3.06, l=4.88, p_l=1.69e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 12% 9/78 [00:47<06:00, 5.23s/it, bpd=5.93, g_l=5.93, gn=3.53, l=5.58, p_l=1.86e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 13% 10/78 [00:52<05:54, 5.21s/it, bpd=4.45, g_l=4.45, gn=3.62, l=4.19, p_l=1.94e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 14% 11/78 [00:57<05:47, 5.19s/it, bpd=5.32, g_l=5.32, gn=3.37, l=5, p_l=2.04e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n","\n","Overflow in backward. 
Loss 4.393082618713379, grad norm inf, lgscale 16.708000000000172, new lgscale 15.708000000000174\n"," 15% 12/78 [01:02<05:26, 4.95s/it, bpd=5.32, g_l=5.32, gn=3.37, l=5, p_l=2.04e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 17% 13/78 [01:07<05:25, 5.01s/it, bpd=5.42, g_l=5.42, gn=3.19, l=5.1, p_l=2.17e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 18% 14/78 [01:12<05:23, 5.06s/it, bpd=4.99, g_l=4.99, gn=3.5, l=4.7, p_l=2.37e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 19% 15/78 [01:17<05:21, 5.10s/it, bpd=4.59, g_l=4.59, gn=3.52, l=4.32, p_l=2.64e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 21% 16/78 [01:22<05:17, 5.12s/it, bpd=4.31, g_l=4.31, gn=3.17, l=4.06, p_l=2.83e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 22% 17/78 [01:28<05:13, 5.14s/it, bpd=5.04, g_l=5.04, gn=3.51, l=4.74, p_l=2.91e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 23% 18/78 [01:33<05:09, 5.16s/it, bpd=5.07, g_l=5.07, gn=3.7, l=4.78, p_l=2.98e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 24% 19/78 [01:38<05:05, 5.18s/it, bpd=5.92, g_l=5.92, gn=3.41, l=5.57, p_l=2.91e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 26% 20/78 [01:43<05:01, 5.19s/it, bpd=4.52, g_l=4.52, gn=4.25, l=4.25, p_l=2.7e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 27% 21/78 [01:48<04:56, 5.21s/it, bpd=4.41, g_l=4.41, gn=4.07, l=4.15, p_l=2.79e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 28% 22/78 [01:54<04:51, 5.20s/it, bpd=4.52, g_l=4.52, gn=4.02, l=4.25, p_l=2.99e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 29% 23/78 [01:59<04:46, 5.20s/it, bpd=3.73, g_l=3.73, gn=3.41, l=3.51, p_l=3.31e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 31% 24/78 [02:04<04:40, 5.19s/it, bpd=4.74, g_l=4.74, gn=3.58, l=4.46, p_l=3.64e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 32% 25/78 [02:09<04:34, 5.18s/it, bpd=6.41, g_l=6.41, gn=3.33, l=6.03, p_l=4.34e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1191\u001b[0m\n"," 33% 
26/78 [02:50<13:48, 15.94s/it, bpd=3.68, g_l=3.68, gn=4.5, l=3.47, p_l=4.61e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 35% 27/78 [02:55<10:49, 12.73s/it, bpd=5.48, g_l=5.48, gn=4.22, l=5.15, p_l=4.69e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 36% 28/78 [03:01<08:43, 10.47s/it, bpd=4.77, g_l=4.77, gn=4.71, l=4.49, p_l=4.72e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 37% 29/78 [03:06<07:16, 8.91s/it, bpd=4.35, g_l=4.35, gn=3.61, l=4.1, p_l=4.87e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 38% 30/78 [03:11<06:16, 7.85s/it, bpd=4.25, g_l=4.25, gn=3.66, l=4, p_l=5.01e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 40% 31/78 [03:17<05:33, 7.10s/it, bpd=4.45, g_l=4.45, gn=3.27, l=4.18, p_l=5.3e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 41% 32/78 [03:22<05:04, 6.63s/it, bpd=4.63, g_l=4.63, gn=3.71, l=4.36, p_l=5.56e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 42% 33/78 [03:27<04:40, 6.24s/it, bpd=4.97, g_l=4.97, gn=4.45, l=4.67, p_l=5.88e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 44% 34/78 [03:33<04:23, 6.00s/it, bpd=4.58, g_l=4.58, gn=4.19, l=4.31, p_l=6.74e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 45% 35/78 [03:41<04:40, 6.53s/it, bpd=4.49, g_l=4.49, gn=3.36, l=4.23, p_l=7.65e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 46% 36/78 [03:46<04:18, 6.16s/it, bpd=5.21, g_l=5.21, gn=4.68, l=4.91, p_l=8.24e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 47% 37/78 [03:51<04:00, 5.87s/it, bpd=4.29, g_l=4.29, gn=3.18, l=4.04, p_l=9.3e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 49% 38/78 [03:57<03:48, 5.72s/it, bpd=5.02, g_l=5.02, gn=4.06, l=4.72, p_l=9.76e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 50% 39/78 [04:02<03:36, 5.55s/it, bpd=5.17, g_l=5.17, gn=3.35, l=4.86, p_l=1e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 51% 40/78 [04:07<03:27, 5.46s/it, bpd=4.86, g_l=4.86, gn=4.02, l=4.58, p_l=9.84e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 53% 41/78 [04:12<03:18, 5.37s/it, bpd=5.08, 
g_l=5.08, gn=3.92, l=4.78, p_l=9.34e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 54% 42/78 [04:17<03:11, 5.32s/it, bpd=4.67, g_l=4.67, gn=3.73, l=4.4, p_l=9.02e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 55% 43/78 [04:23<03:06, 5.32s/it, bpd=4.76, g_l=4.76, gn=5.98, l=4.48, p_l=8.41e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 56% 44/78 [04:28<02:59, 5.29s/it, bpd=6.91, g_l=6.91, gn=3.25, l=6.5, p_l=7.59e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 58% 45/78 [04:33<02:54, 5.29s/it, bpd=4.6, g_l=4.6, gn=4.32, l=4.33, p_l=6.33e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 59% 46/78 [04:38<02:48, 5.28s/it, bpd=5.8, g_l=5.8, gn=2.99, l=5.46, p_l=5.39e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 60% 47/78 [04:44<02:43, 5.29s/it, bpd=4.29, g_l=4.29, gn=6.6, l=4.03, p_l=4.63e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 62% 48/78 [04:49<02:38, 5.28s/it, bpd=4.48, g_l=4.48, gn=3.83, l=4.22, p_l=4.01e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 63% 49/78 [04:54<02:33, 5.29s/it, bpd=4.45, g_l=4.45, gn=3.33, l=4.19, p_l=3.86e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 64% 50/78 [05:00<02:27, 5.28s/it, bpd=5.84, g_l=5.84, gn=3.08, l=5.5, p_l=3.8e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 65% 51/78 [05:05<02:22, 5.27s/it, bpd=4.08, g_l=4.08, gn=4.38, l=3.84, p_l=3.54e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 67% 52/78 [05:10<02:16, 5.26s/it, bpd=4.51, g_l=4.51, gn=3.21, l=4.24, p_l=3.11e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 68% 53/78 [05:15<02:11, 5.26s/it, bpd=4.82, g_l=4.82, gn=3.51, l=4.54, p_l=2.56e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 69% 54/78 [05:21<02:06, 5.27s/it, bpd=5.45, g_l=5.45, gn=4.08, l=5.13, p_l=2.19e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 71% 55/78 [05:26<02:00, 5.26s/it, bpd=4.26, g_l=4.26, gn=3.45, l=4.01, p_l=1.89e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 72% 56/78 [05:31<01:56, 5.29s/it, bpd=4.1, g_l=4.1, gn=3.78, l=3.86, 
p_l=1.59e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 73% 57/78 [05:36<01:50, 5.27s/it, bpd=5.08, g_l=5.08, gn=3.58, l=4.78, p_l=1.4e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 74% 58/78 [05:42<01:45, 5.27s/it, bpd=4.4, g_l=4.4, gn=4.16, l=4.14, p_l=1.25e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 76% 59/78 [05:47<01:39, 5.25s/it, bpd=4.89, g_l=4.89, gn=3.79, l=4.61, p_l=1.11e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 77% 60/78 [05:52<01:34, 5.24s/it, bpd=5.39, g_l=5.39, gn=3.75, l=5.08, p_l=9.86e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 78% 61/78 [05:57<01:29, 5.24s/it, bpd=4.32, g_l=4.32, gn=3.66, l=4.07, p_l=8.93e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 79% 62/78 [06:02<01:23, 5.21s/it, bpd=4.88, g_l=4.88, gn=3.51, l=4.59, p_l=8.37e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 81% 63/78 [06:08<01:18, 5.20s/it, bpd=4.57, g_l=4.57, gn=4.09, l=4.3, p_l=8.22e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 82% 64/78 [06:13<01:12, 5.19s/it, bpd=4.73, g_l=4.73, gn=4.97, l=4.45, p_l=7.82e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 83% 65/78 [06:18<01:07, 5.19s/it, bpd=4.56, g_l=4.56, gn=3.42, l=4.29, p_l=7.64e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 85% 66/78 [06:23<01:02, 5.19s/it, bpd=4.03, g_l=4.03, gn=6.45, l=3.79, p_l=7.47e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 86% 67/78 [06:28<00:57, 5.20s/it, bpd=4.56, g_l=4.56, gn=3.24, l=4.29, p_l=7.41e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 87% 68/78 [06:34<00:51, 5.20s/it, bpd=4.44, g_l=4.44, gn=6.31, l=4.18, p_l=7.26e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 88% 69/78 [06:39<00:46, 5.20s/it, bpd=4.95, g_l=4.95, gn=3.22, l=4.66, p_l=7.1e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 90% 70/78 [06:44<00:41, 5.20s/it, bpd=4.7, g_l=4.7, gn=3.33, l=4.42, p_l=7.17e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 91% 71/78 [06:49<00:36, 5.20s/it, bpd=5.05, g_l=5.05, gn=3.35, l=4.75, 
p_l=6.93e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 92% 72/78 [06:54<00:31, 5.20s/it, bpd=4.54, g_l=4.54, gn=3.29, l=4.27, p_l=7.22e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 94% 73/78 [07:00<00:26, 5.21s/it, bpd=5.38, g_l=5.38, gn=3.44, l=5.06, p_l=7.56e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 95% 74/78 [07:05<00:20, 5.22s/it, bpd=5.08, g_l=5.08, gn=4.63, l=4.78, p_l=7.93e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 96% 75/78 [07:10<00:15, 5.22s/it, bpd=5.23, g_l=5.23, gn=4.34, l=4.92, p_l=7.87e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n","100% 78/78 [07:26<00:00, 5.73s/it, bpd=4.53, g_l=4.53, gn=4.45, l=4.26, p_l=7.32e-7]\n","Train bpd: 4.8717 prime_loss: 0.0000 gen_loss: 4.8717 loss: 4.5851 gn: 3.8270 lr: 0.0003 lg_loss_scale: 15.9589 epoch: 14.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (6).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1243\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.05s/it, bpd=4.92, l=4.63]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 22% 2/9 [00:03<00:13, 1.89s/it, bpd=4.98, l=4.68]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:04<00:10, 1.74s/it, bpd=4.82, l=4.54]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 44% 4/9 [00:06<00:08, 1.64s/it, bpd=5.09, l=4.79]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=5.18, l=4.87]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=3.9, l=3.67]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=5.62, l=5.29]\n","Ema bpd: 5.0660 prime_loss: 0.0158 gen_loss: 5.0660 loss: 4.7683 epoch: 14.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (23).txt\n","/content/gdrive/MyDrive/slon/slon (11).txt\n","/content/gdrive/MyDrive/slon/slon (22).txt\n"," 1% 1/78 [00:05<06:57, 5.42s/it, bpd=5.09, g_l=5.09, gn=3.49, l=4.79, 
p_l=7.68e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 3% 2/78 [00:10<06:48, 5.38s/it, bpd=4.31, g_l=4.31, gn=3.97, l=4.05, p_l=8.79e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 4% 3/78 [00:15<06:41, 5.35s/it, bpd=4.89, g_l=4.89, gn=3.3, l=4.6, p_l=9.82e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 5% 4/78 [00:21<06:34, 5.33s/it, bpd=5.98, g_l=5.98, gn=3.08, l=5.63, p_l=1.14e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 6% 5/78 [00:26<06:28, 5.32s/it, bpd=4.74, g_l=4.74, gn=3.6, l=4.46, p_l=1.35e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 8% 6/78 [00:31<06:21, 5.29s/it, bpd=4.75, g_l=4.75, gn=3.8, l=4.47, p_l=1.53e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 9% 7/78 [00:37<06:14, 5.28s/it, bpd=4.28, g_l=4.28, gn=2.98, l=4.03, p_l=1.71e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 10% 8/78 [00:42<06:07, 5.25s/it, bpd=4.27, g_l=4.27, gn=3.78, l=4.01, p_l=1.83e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 12% 9/78 [00:47<06:00, 5.23s/it, bpd=4.1, g_l=4.1, gn=3.54, l=3.85, p_l=1.87e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 13% 10/78 [00:52<05:53, 5.20s/it, bpd=4.5, g_l=4.5, gn=3.48, l=4.23, p_l=1.91e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 14% 11/78 [00:57<05:47, 5.19s/it, bpd=4.38, g_l=4.38, gn=4.61, l=4.12, p_l=2.15e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 15% 12/78 [01:02<05:42, 5.18s/it, bpd=4.49, g_l=4.49, gn=3.13, l=4.23, p_l=2.46e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 17% 13/78 [01:08<05:36, 5.17s/it, bpd=4.29, g_l=4.29, gn=3.62, l=4.03, p_l=2.64e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 18% 14/78 [01:13<05:31, 5.18s/it, bpd=3.24, g_l=3.24, gn=4.39, l=3.05, p_l=2.82e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 19% 15/78 [01:18<05:26, 5.18s/it, bpd=4.54, g_l=4.54, gn=3.36, l=4.28, p_l=2.97e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 21% 16/78 [01:23<05:21, 5.19s/it, bpd=5.5, g_l=5.5, gn=5.27, l=5.18, p_l=3.08e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 
22% 17/78 [01:28<05:16, 5.18s/it, bpd=3.96, g_l=3.96, gn=6.18, l=3.73, p_l=3.18e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 23% 18/78 [01:33<05:10, 5.18s/it, bpd=5.24, g_l=5.24, gn=3.18, l=4.93, p_l=3.46e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 24% 19/78 [01:39<05:05, 5.18s/it, bpd=4.83, g_l=4.83, gn=3.43, l=4.55, p_l=3.63e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 26% 20/78 [01:44<05:00, 5.18s/it, bpd=5, g_l=5, gn=3.11, l=4.7, p_l=3.4e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 27% 21/78 [01:49<04:56, 5.20s/it, bpd=4.22, g_l=4.22, gn=4.3, l=3.97, p_l=3.09e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 28% 22/78 [01:54<04:51, 5.20s/it, bpd=4.62, g_l=4.62, gn=3.87, l=4.34, p_l=2.8e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 29% 23/78 [02:00<04:47, 5.22s/it, bpd=4.82, g_l=4.82, gn=4.13, l=4.54, p_l=2.55e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 31% 24/78 [02:05<04:42, 5.22s/it, bpd=5.58, g_l=5.58, gn=3.35, l=5.25, p_l=2.29e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 32% 25/78 [02:10<04:37, 5.23s/it, bpd=5.52, g_l=5.52, gn=3.02, l=5.2, p_l=2.05e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 33% 26/78 [02:15<04:31, 5.22s/it, bpd=4.4, g_l=4.4, gn=3.44, l=4.14, p_l=1.77e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 35% 27/78 [02:20<04:26, 5.22s/it, bpd=4.37, g_l=4.37, gn=3.56, l=4.11, p_l=1.58e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 36% 28/78 [02:26<04:20, 5.21s/it, bpd=3.85, g_l=3.85, gn=5.43, l=3.63, p_l=1.47e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 37% 29/78 [02:31<04:14, 5.19s/it, bpd=3.63, g_l=3.63, gn=4.16, l=3.42, p_l=1.37e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 38% 30/78 [02:36<04:08, 5.18s/it, bpd=5.35, g_l=5.35, gn=3.26, l=5.03, p_l=1.39e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 40% 31/78 [02:41<04:02, 5.17s/it, bpd=5.4, g_l=5.4, gn=3.27, l=5.08, p_l=1.55e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 41% 32/78 [02:46<03:57, 5.17s/it, bpd=4.41, 
g_l=4.41, gn=3.24, l=4.15, p_l=1.92e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 42% 33/78 [02:51<03:52, 5.16s/it, bpd=4.57, g_l=4.57, gn=4.41, l=4.3, p_l=2.41e-6]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 34/78 [02:57<03:47, 5.17s/it, bpd=4.43, g_l=4.43, gn=2.95, l=4.16, p_l=2.87e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 45% 35/78 [03:02<03:42, 5.17s/it, bpd=5.41, g_l=5.41, gn=3.55, l=5.09, p_l=3.19e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 46% 36/78 [03:07<03:37, 5.18s/it, bpd=5.61, g_l=5.61, gn=3.09, l=5.28, p_l=3.18e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 47% 37/78 [03:12<03:32, 5.18s/it, bpd=4.27, g_l=4.27, gn=3.16, l=4.01, p_l=2.76e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 49% 38/78 [03:17<03:26, 5.17s/it, bpd=4.73, g_l=4.73, gn=3.38, l=4.45, p_l=2.4e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 50% 39/78 [03:22<03:21, 5.18s/it, bpd=4.4, g_l=4.4, gn=3.41, l=4.14, p_l=2.2e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 51% 40/78 [03:28<03:16, 5.18s/it, bpd=6.62, g_l=6.62, gn=3.32, l=6.23, p_l=2.16e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 53% 41/78 [03:33<03:11, 5.19s/it, bpd=4.52, g_l=4.52, gn=3.64, l=4.26, p_l=2.25e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 54% 42/78 [03:38<03:06, 5.19s/it, bpd=5, g_l=5, gn=3.45, l=4.7, p_l=2.5e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 55% 43/78 [03:43<03:02, 5.20s/it, bpd=5.61, g_l=5.61, gn=3.74, l=5.28, p_l=2.79e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 56% 44/78 [03:48<02:56, 5.19s/it, bpd=6.21, g_l=6.21, gn=3.88, l=5.84, p_l=2.97e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 58% 45/78 [03:54<02:51, 5.19s/it, bpd=4.76, g_l=4.76, gn=4.66, l=4.48, p_l=3.09e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 59% 46/78 [03:59<02:45, 5.18s/it, bpd=4.27, g_l=4.27, gn=3.51, l=4.02, p_l=2.92e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 60% 47/78 [04:04<02:40, 5.18s/it, bpd=5.47, g_l=5.47, gn=4.1, l=5.15, 
p_l=2.65e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 62% 48/78 [04:09<02:35, 5.17s/it, bpd=4.67, g_l=4.67, gn=4.16, l=4.4, p_l=2.55e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 63% 49/78 [04:14<02:29, 5.17s/it, bpd=4.28, g_l=4.28, gn=3.42, l=4.03, p_l=2.65e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 64% 50/78 [04:19<02:24, 5.17s/it, bpd=5.5, g_l=5.5, gn=3.23, l=5.18, p_l=2.62e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 65% 51/78 [04:25<02:19, 5.17s/it, bpd=4.6, g_l=4.6, gn=7.37, l=4.33, p_l=2.79e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 67% 52/78 [04:30<02:14, 5.17s/it, bpd=4.92, g_l=4.92, gn=5.12, l=4.64, p_l=3.07e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 68% 53/78 [04:35<02:09, 5.18s/it, bpd=5.72, g_l=5.72, gn=5.65, l=5.38, p_l=2.63e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 69% 54/78 [04:40<02:04, 5.19s/it, bpd=6.23, g_l=6.23, gn=3.25, l=5.86, p_l=2.13e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 71% 55/78 [04:45<01:59, 5.20s/it, bpd=5.8, g_l=5.8, gn=3.33, l=5.46, p_l=1.6e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 72% 56/78 [04:51<01:54, 5.21s/it, bpd=5.42, g_l=5.42, gn=4.5, l=5.11, p_l=1.26e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 73% 57/78 [05:01<02:20, 6.70s/it, bpd=4.35, g_l=4.35, gn=3.39, l=4.1, p_l=1.06e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 74% 58/78 [05:06<02:04, 6.23s/it, bpd=6.48, g_l=6.48, gn=3.14, l=6.1, p_l=9.25e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 76% 59/78 [05:11<01:52, 5.91s/it, bpd=4.37, g_l=4.37, gn=3.13, l=4.11, p_l=9.04e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 77% 60/78 [05:16<01:42, 5.71s/it, bpd=3.79, g_l=3.79, gn=4.17, l=3.56, p_l=9.1e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 78% 61/78 [05:22<01:34, 5.56s/it, bpd=4.44, g_l=4.44, gn=3.84, l=4.18, p_l=9.07e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 79% 62/78 [05:27<01:27, 5.47s/it, bpd=5.87, g_l=5.87, gn=3.16, l=5.52, p_l=9.14e-7]/content/gdrive/MyDrive/slon/slon 
(31).txt\n"," 81% 63/78 [05:32<01:20, 5.40s/it, bpd=5.2, g_l=5.2, gn=3.17, l=4.9, p_l=9.07e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 82% 64/78 [05:37<01:14, 5.35s/it, bpd=4.2, g_l=4.2, gn=3.65, l=3.95, p_l=8.76e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 83% 65/78 [05:42<01:08, 5.31s/it, bpd=4.36, g_l=4.36, gn=5.08, l=4.1, p_l=8.35e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 85% 66/78 [05:48<01:03, 5.28s/it, bpd=5.23, g_l=5.23, gn=3.67, l=4.92, p_l=8.09e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 86% 67/78 [05:53<00:57, 5.25s/it, bpd=4.48, g_l=4.48, gn=3.72, l=4.21, p_l=8.7e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 87% 68/78 [05:58<00:52, 5.22s/it, bpd=6.38, g_l=6.38, gn=3.91, l=6.01, p_l=1.02e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 88% 69/78 [06:03<00:46, 5.20s/it, bpd=4.85, g_l=4.85, gn=3.34, l=4.57, p_l=1.33e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 90% 70/78 [06:08<00:41, 5.19s/it, bpd=5.57, g_l=5.57, gn=4.12, l=5.24, p_l=1.74e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 91% 71/78 [06:14<00:36, 5.19s/it, bpd=6.49, g_l=6.49, gn=4.89, l=6.11, p_l=2.11e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 92% 72/78 [06:19<00:31, 5.18s/it, bpd=4.02, g_l=4.02, gn=3.92, l=3.78, p_l=2.32e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 94% 73/78 [06:24<00:25, 5.19s/it, bpd=4.96, g_l=4.96, gn=3.71, l=4.67, p_l=2.52e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 95% 74/78 [06:29<00:20, 5.18s/it, bpd=4.83, g_l=4.83, gn=3.53, l=4.55, p_l=2.34e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 96% 75/78 [06:34<00:15, 5.19s/it, bpd=4.02, g_l=4.02, gn=3.07, l=3.79, p_l=2.14e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n","100% 78/78 [06:50<00:00, 5.26s/it, bpd=3.61, g_l=3.61, gn=3.3, l=3.4, p_l=2.02e-6]\n","Train bpd: 4.8635 prime_loss: 0.0000 gen_loss: 4.8635 loss: 4.5775 gn: 3.8473 lr: 0.0003 lg_loss_scale: 16.1260 epoch: 15.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon 
(6).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1321\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.03s/it, bpd=4.11, l=3.87]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 22% 2/9 [00:03<00:13, 1.91s/it, bpd=4.54, l=4.28]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 33% 3/9 [00:05<00:10, 1.75s/it, bpd=4.8, l=4.51]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 44% 4/9 [00:06<00:08, 1.65s/it, bpd=5.59, l=5.26]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=4.92, l=4.63]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=5.39, l=5.07]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=5.39, l=5.07]\n","Ema bpd: 4.9701 prime_loss: 0.0154 gen_loss: 4.9701 loss: 4.6781 epoch: 15.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (16).txt\n","/content/gdrive/MyDrive/slon/slon (16).txt\n","/content/gdrive/MyDrive/slon/slon (27).txt\n"," 1% 1/78 [00:05<06:53, 5.37s/it, bpd=4.97, g_l=4.97, gn=3.27, l=4.67, p_l=2.27e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 3% 2/78 [00:10<06:45, 5.33s/it, bpd=5.13, g_l=5.13, gn=2.97, l=4.83, p_l=2.55e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 4% 3/78 [00:15<06:38, 5.31s/it, bpd=3.46, g_l=3.46, gn=5.11, l=3.26, p_l=2.7e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 5% 4/78 [00:21<06:33, 5.31s/it, bpd=4.86, g_l=4.86, gn=4.54, l=4.57, p_l=2.76e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 6% 5/78 [00:26<06:27, 5.31s/it, bpd=4.58, g_l=4.58, gn=3.31, l=4.31, p_l=2.89e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 8% 6/78 [00:31<06:22, 5.31s/it, bpd=5.02, g_l=5.02, gn=4.26, l=4.72, p_l=3.05e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 9% 7/78 [00:37<06:16, 5.30s/it, bpd=4.34, g_l=4.34, gn=3.31, l=4.08, p_l=3.07e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 10% 8/78 [00:42<06:09, 5.27s/it, bpd=4.48, 
g_l=4.48, gn=2.95, l=4.22, p_l=3.12e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 12% 9/78 [00:47<06:02, 5.25s/it, bpd=4.43, g_l=4.43, gn=3.07, l=4.17, p_l=3.16e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 13% 10/78 [00:52<05:55, 5.22s/it, bpd=4.29, g_l=4.29, gn=2.88, l=4.04, p_l=3.17e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 14% 11/78 [00:57<05:48, 5.21s/it, bpd=3.36, g_l=3.36, gn=3.36, l=3.16, p_l=3.12e-6]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 15% 12/78 [01:02<05:41, 5.18s/it, bpd=6.04, g_l=6.04, gn=3.69, l=5.69, p_l=3.09e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 17% 13/78 [01:08<05:35, 5.16s/it, bpd=4.18, g_l=4.18, gn=3.8, l=3.93, p_l=2.93e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 18% 14/78 [01:13<05:29, 5.15s/it, bpd=5.55, g_l=5.55, gn=3.29, l=5.22, p_l=2.72e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 19% 15/78 [01:18<05:23, 5.14s/it, bpd=5.64, g_l=5.64, gn=3.98, l=5.3, p_l=2.68e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 21% 16/78 [01:23<05:18, 5.13s/it, bpd=5.18, g_l=5.18, gn=3.62, l=4.88, p_l=2.71e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 22% 17/78 [01:28<05:13, 5.14s/it, bpd=4.31, g_l=4.31, gn=3.3, l=4.06, p_l=2.83e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 23% 18/78 [01:33<05:08, 5.15s/it, bpd=4.15, g_l=4.15, gn=3.15, l=3.91, p_l=2.98e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 24% 19/78 [01:38<05:04, 5.16s/it, bpd=5.58, g_l=5.58, gn=4.33, l=5.25, p_l=3.04e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 26% 20/78 [01:44<04:59, 5.17s/it, bpd=4.84, g_l=4.84, gn=3.45, l=4.55, p_l=3.2e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 27% 21/78 [01:49<04:55, 5.19s/it, bpd=3.59, g_l=3.59, gn=3.07, l=3.38, p_l=3.34e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 28% 22/78 [01:54<04:51, 5.20s/it, bpd=5.36, g_l=5.36, gn=3.54, l=5.05, p_l=3.34e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 29% 23/78 [01:59<04:46, 5.20s/it, bpd=4.13, g_l=4.13, gn=3.22, l=3.88, 
p_l=3.43e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 31% 24/78 [02:05<04:41, 5.21s/it, bpd=7.13, g_l=7.13, gn=3.16, l=6.71, p_l=3.76e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 32% 25/78 [02:10<04:36, 5.21s/it, bpd=5.95, g_l=5.95, gn=3.21, l=5.6, p_l=3.77e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 33% 26/78 [02:15<04:31, 5.21s/it, bpd=4.14, g_l=4.14, gn=8.61, l=3.89, p_l=3.61e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 35% 27/78 [02:20<04:25, 5.20s/it, bpd=4.86, g_l=4.86, gn=3.18, l=4.57, p_l=3.75e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 36% 28/78 [02:25<04:19, 5.19s/it, bpd=5.61, g_l=5.61, gn=3.17, l=5.28, p_l=4.1e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 37% 29/78 [02:30<04:13, 5.18s/it, bpd=6.09, g_l=6.09, gn=3.08, l=5.73, p_l=5.04e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 38% 30/78 [02:36<04:08, 5.17s/it, bpd=5.36, g_l=5.36, gn=3.58, l=5.04, p_l=6.13e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 40% 31/78 [02:41<04:02, 5.16s/it, bpd=4.48, g_l=4.48, gn=3.65, l=4.22, p_l=6.97e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 41% 32/78 [02:46<03:57, 5.16s/it, bpd=4.3, g_l=4.3, gn=4.78, l=4.05, p_l=7.62e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 42% 33/78 [02:51<03:52, 5.17s/it, bpd=4.87, g_l=4.87, gn=3.79, l=4.58, p_l=7.72e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 44% 34/78 [02:56<03:47, 5.17s/it, bpd=4.26, g_l=4.26, gn=4.25, l=4.01, p_l=7.69e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 45% 35/78 [03:01<03:43, 5.19s/it, bpd=4.48, g_l=4.48, gn=3.96, l=4.22, p_l=7.43e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 46% 36/78 [03:07<03:37, 5.19s/it, bpd=4.32, g_l=4.32, gn=3.69, l=4.06, p_l=6.96e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 47% 37/78 [03:12<03:33, 5.20s/it, bpd=4.59, g_l=4.59, gn=4.19, l=4.32, p_l=6.79e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 49% 38/78 [03:17<03:28, 5.20s/it, bpd=4.46, g_l=4.46, gn=3.65, l=4.2, 
p_l=6.6e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 50% 39/78 [03:22<03:22, 5.20s/it, bpd=4.21, g_l=4.21, gn=3.64, l=3.96, p_l=6.84e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 51% 40/78 [03:28<03:17, 5.21s/it, bpd=4.17, g_l=4.17, gn=3.46, l=3.92, p_l=7.25e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 53% 41/78 [03:33<03:12, 5.20s/it, bpd=6.03, g_l=6.03, gn=3.57, l=5.68, p_l=7.92e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 54% 42/78 [03:38<03:07, 5.20s/it, bpd=4.84, g_l=4.84, gn=4.1, l=4.56, p_l=8.35e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 55% 43/78 [03:43<03:01, 5.20s/it, bpd=4.55, g_l=4.55, gn=3.41, l=4.28, p_l=8.37e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 56% 44/78 [03:48<02:57, 5.21s/it, bpd=4.76, g_l=4.76, gn=5, l=4.48, p_l=7.61e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 58% 45/78 [03:54<02:51, 5.21s/it, bpd=4.77, g_l=4.77, gn=3.87, l=4.49, p_l=6.73e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 59% 46/78 [03:59<02:47, 5.22s/it, bpd=5.05, g_l=5.05, gn=3.97, l=4.76, p_l=5.69e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 60% 47/78 [04:04<02:41, 5.21s/it, bpd=4.12, g_l=4.12, gn=3.51, l=3.88, p_l=4.93e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 62% 48/78 [04:09<02:36, 5.22s/it, bpd=4.58, g_l=4.58, gn=4.12, l=4.31, p_l=4.55e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 63% 49/78 [04:14<02:30, 5.21s/it, bpd=3.94, g_l=3.94, gn=6.54, l=3.71, p_l=4.19e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 64% 50/78 [04:20<02:25, 5.21s/it, bpd=5.16, g_l=5.16, gn=3.37, l=4.86, p_l=3.85e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 65% 51/78 [04:25<02:20, 5.19s/it, bpd=3.96, g_l=3.96, gn=3.28, l=3.73, p_l=3.52e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 67% 52/78 [04:30<02:14, 5.18s/it, bpd=5.4, g_l=5.4, gn=3.08, l=5.08, p_l=3.45e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 68% 53/78 [04:35<02:09, 5.17s/it, bpd=4.76, g_l=4.76, gn=3.29, l=4.48, 
p_l=3.71e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 69% 54/78 [04:40<02:04, 5.17s/it, bpd=4.76, g_l=4.76, gn=3.62, l=4.48, p_l=4.06e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 71% 55/78 [04:45<01:59, 5.18s/it, bpd=5.74, g_l=5.74, gn=3.17, l=5.4, p_l=4.74e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 72% 56/78 [04:51<01:53, 5.17s/it, bpd=4.19, g_l=4.19, gn=4.19, l=3.94, p_l=5.38e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 73% 57/78 [04:56<01:48, 5.18s/it, bpd=6.25, g_l=6.25, gn=3.58, l=5.88, p_l=6.13e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 74% 58/78 [05:01<01:43, 5.17s/it, bpd=5.64, g_l=5.64, gn=3.36, l=5.31, p_l=6.96e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 76% 59/78 [05:06<01:38, 5.18s/it, bpd=5.52, g_l=5.52, gn=3.08, l=5.19, p_l=7.58e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 77% 60/78 [05:11<01:33, 5.18s/it, bpd=4.98, g_l=4.98, gn=3.7, l=4.69, p_l=8.23e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 78% 61/78 [05:17<01:28, 5.18s/it, bpd=6, g_l=6, gn=3.33, l=5.64, p_l=9.25e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 79% 62/78 [05:22<01:22, 5.19s/it, bpd=4.22, g_l=4.22, gn=4.43, l=3.97, p_l=1.03e-5]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 81% 63/78 [05:27<01:17, 5.18s/it, bpd=4.5, g_l=4.5, gn=4.24, l=4.24, p_l=1.09e-5]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 82% 64/78 [05:32<01:12, 5.19s/it, bpd=4.52, g_l=4.52, gn=3.5, l=4.25, p_l=1.15e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 83% 65/78 [05:37<01:07, 5.19s/it, bpd=5.74, g_l=5.74, gn=4.22, l=5.4, p_l=1.12e-5]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 85% 66/78 [05:43<01:02, 5.21s/it, bpd=5.19, g_l=5.19, gn=3.75, l=4.89, p_l=1.11e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 86% 67/78 [05:48<00:57, 5.20s/it, bpd=4.43, g_l=4.43, gn=3.61, l=4.17, p_l=1.08e-5]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 87% 68/78 [05:53<00:52, 5.21s/it, bpd=4.51, g_l=4.51, gn=3.21, l=4.24, p_l=9.75e-6]/content/gdrive/MyDrive/slon/slon 
(25).txt\n"," 88% 69/78 [05:58<00:46, 5.21s/it, bpd=4.18, g_l=4.18, gn=3.36, l=3.94, p_l=8.58e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 90% 70/78 [06:03<00:41, 5.21s/it, bpd=5.02, g_l=5.02, gn=4.21, l=4.72, p_l=8.28e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 91% 71/78 [06:09<00:36, 5.20s/it, bpd=5.28, g_l=5.28, gn=3.84, l=4.97, p_l=8.05e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 92% 72/78 [06:14<00:31, 5.22s/it, bpd=5.89, g_l=5.89, gn=3.93, l=5.55, p_l=8.42e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 94% 73/78 [06:19<00:26, 5.21s/it, bpd=4.7, g_l=4.7, gn=3.16, l=4.43, p_l=8.63e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 95% 74/78 [06:24<00:20, 5.20s/it, bpd=4.34, g_l=4.34, gn=3.41, l=4.08, p_l=8.56e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 96% 75/78 [06:29<00:15, 5.20s/it, bpd=5.58, g_l=5.58, gn=3.72, l=5.25, p_l=7.97e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n","100% 78/78 [06:45<00:00, 5.20s/it, bpd=4.68, g_l=4.68, gn=3.4, l=4.41, p_l=8.83e-6]\n","Train bpd: 4.8342 prime_loss: 0.0000 gen_loss: 4.8342 loss: 4.5499 gn: 3.7241 lr: 0.0003 lg_loss_scale: 16.4380 epoch: 16.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1399\u001b[0m\n"," 11% 1/9 [00:02<00:17, 2.17s/it, bpd=5.8, l=5.46]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 22% 2/9 [00:03<00:14, 2.01s/it, bpd=5.09, l=4.79]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:05<00:10, 1.82s/it, bpd=5.09, l=4.79]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 44% 4/9 [00:06<00:08, 1.69s/it, bpd=5.07, l=4.77]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.60s/it, bpd=4.39, l=4.13]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 67% 6/9 [00:09<00:04, 1.54s/it, bpd=5.71, l=5.37]/content/gdrive/MyDrive/slon/slon (6).txt\n","100% 9/9 [00:13<00:00, 1.52s/it, bpd=5.39, 
l=5.07]\n","Ema bpd: 5.1750 prime_loss: 0.0154 gen_loss: 5.1750 loss: 4.8710 epoch: 16.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (2).txt\n","/content/gdrive/MyDrive/slon/slon (16).txt\n","/content/gdrive/MyDrive/slon/slon (24).txt\n"," 1% 1/78 [00:10<13:45, 10.72s/it, bpd=4.26, g_l=4.26, gn=3.74, l=4.01, p_l=7.99e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 3% 2/78 [00:15<11:29, 9.07s/it, bpd=5.12, g_l=5.12, gn=3.57, l=4.82, p_l=7.41e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 4% 3/78 [00:21<09:54, 7.93s/it, bpd=5.5, g_l=5.5, gn=3.16, l=5.18, p_l=6.87e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 5% 4/78 [00:26<08:49, 7.16s/it, bpd=5.09, g_l=5.09, gn=3.23, l=4.79, p_l=6.55e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 6% 5/78 [00:31<08:02, 6.60s/it, bpd=4.37, g_l=4.37, gn=4.08, l=4.11, p_l=6.71e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 8% 6/78 [00:37<07:28, 6.22s/it, bpd=4.1, g_l=4.1, gn=9.79, l=3.86, p_l=6.99e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 9% 7/78 [00:42<07:01, 5.94s/it, bpd=5.25, g_l=5.25, gn=3.18, l=4.94, p_l=7.67e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 10% 8/78 [00:47<06:40, 5.72s/it, bpd=5.93, g_l=5.93, gn=3.36, l=5.58, p_l=7.48e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 12% 9/78 [00:52<06:23, 5.56s/it, bpd=3.55, g_l=3.55, gn=3.13, l=3.34, p_l=6.24e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 13% 10/78 [00:58<06:09, 5.43s/it, bpd=5.18, g_l=5.18, gn=3.27, l=4.88, p_l=4.73e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 14% 11/78 [01:03<05:58, 5.35s/it, bpd=5.77, g_l=5.77, gn=2.87, l=5.43, p_l=3.65e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 15% 12/78 [01:08<05:48, 5.28s/it, bpd=5.56, g_l=5.56, gn=3.31, l=5.23, p_l=2.83e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 17% 13/78 [01:13<05:40, 5.24s/it, bpd=6.22, g_l=6.22, gn=3.25, l=5.85, p_l=2.6e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 18% 14/78 [01:18<05:33, 5.21s/it, bpd=4.24, g_l=4.24, 
gn=3.27, l=3.99, p_l=2.64e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 19% 15/78 [01:23<05:27, 5.19s/it, bpd=4.82, g_l=4.82, gn=3.84, l=4.54, p_l=2.71e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 21% 16/78 [01:28<05:21, 5.18s/it, bpd=5.38, g_l=5.38, gn=3.47, l=5.06, p_l=2.95e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 22% 17/78 [01:34<05:15, 5.17s/it, bpd=3.89, g_l=3.89, gn=3.02, l=3.66, p_l=3.13e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 23% 18/78 [01:39<05:10, 5.17s/it, bpd=5.1, g_l=5.1, gn=3.57, l=4.8, p_l=3.26e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 24% 19/78 [01:44<05:05, 5.18s/it, bpd=4.7, g_l=4.7, gn=2.77, l=4.42, p_l=3.13e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 26% 20/78 [01:49<05:00, 5.19s/it, bpd=4.67, g_l=4.67, gn=3.74, l=4.39, p_l=2.98e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 27% 21/78 [01:54<04:56, 5.19s/it, bpd=5.17, g_l=5.17, gn=4.11, l=4.86, p_l=2.79e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 28% 22/78 [02:00<04:51, 5.21s/it, bpd=5.98, g_l=5.98, gn=2.94, l=5.63, p_l=2.79e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 29% 23/78 [02:05<04:46, 5.21s/it, bpd=4.33, g_l=4.33, gn=3.25, l=4.07, p_l=2.81e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 31% 24/78 [02:10<04:41, 5.22s/it, bpd=4.46, g_l=4.46, gn=3.97, l=4.2, p_l=2.94e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 32% 25/78 [02:15<04:36, 5.21s/it, bpd=4.24, g_l=4.24, gn=4.39, l=3.99, p_l=3.13e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 33% 26/78 [02:20<04:31, 5.22s/it, bpd=4.26, g_l=4.26, gn=3.16, l=4.01, p_l=3.35e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 35% 27/78 [02:26<04:25, 5.21s/it, bpd=4.77, g_l=4.77, gn=3.25, l=4.49, p_l=3.46e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 36% 28/78 [02:31<04:20, 5.21s/it, bpd=4.92, g_l=4.92, gn=3.56, l=4.63, p_l=3.68e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 37% 29/78 [02:36<04:15, 5.21s/it, bpd=4.38, g_l=4.38, gn=3.32, l=4.13, 
p_l=3.55e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1429\u001b[0m\n"," 38% 30/78 [03:15<12:09, 15.19s/it, bpd=4.43, g_l=4.43, gn=3.13, l=4.17, p_l=3.57e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 40% 31/78 [03:20<09:35, 12.26s/it, bpd=4.56, g_l=4.56, gn=3.82, l=4.29, p_l=3.42e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 41% 32/78 [03:25<07:46, 10.13s/it, bpd=4.79, g_l=4.79, gn=4.51, l=4.51, p_l=3.26e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 42% 33/78 [03:31<06:32, 8.72s/it, bpd=4.69, g_l=4.69, gn=3.33, l=4.41, p_l=3.2e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 44% 34/78 [03:36<05:38, 7.70s/it, bpd=4.32, g_l=4.32, gn=3.63, l=4.07, p_l=3.35e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 45% 35/78 [03:41<05:03, 7.05s/it, bpd=4.21, g_l=4.21, gn=3.54, l=3.96, p_l=3.51e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 46% 36/78 [03:47<04:36, 6.58s/it, bpd=4.4, g_l=4.4, gn=3.75, l=4.14, p_l=3.77e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 47% 37/78 [03:52<04:16, 6.26s/it, bpd=5.42, g_l=5.42, gn=3.12, l=5.1, p_l=3.81e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 49% 38/78 [03:58<03:59, 5.99s/it, bpd=4.45, g_l=4.45, gn=3.38, l=4.19, p_l=3.96e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 50% 39/78 [04:03<03:46, 5.80s/it, bpd=3.28, g_l=3.28, gn=3.25, l=3.09, p_l=4.26e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 51% 40/78 [04:08<03:33, 5.62s/it, bpd=4.38, g_l=4.38, gn=3.11, l=4.12, p_l=4.6e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 53% 41/78 [04:14<03:24, 5.51s/it, bpd=4.35, g_l=4.35, gn=3.3, l=4.09, p_l=4.89e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 54% 42/78 [04:19<03:13, 5.39s/it, bpd=3.82, g_l=3.82, gn=2.81, l=3.6, p_l=5.08e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 55% 43/78 [04:24<03:07, 5.35s/it, bpd=6.02, g_l=6.02, gn=3.68, l=5.67, p_l=4.95e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 56% 44/78 [04:29<02:59, 5.29s/it, bpd=5.01, 
g_l=5.01, gn=3.64, l=4.71, p_l=4.75e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 58% 45/78 [04:34<02:52, 5.24s/it, bpd=5.69, g_l=5.69, gn=3.19, l=5.35, p_l=4.77e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 59% 46/78 [04:39<02:46, 5.22s/it, bpd=4.69, g_l=4.69, gn=3.47, l=4.42, p_l=5.04e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 60% 47/78 [04:45<02:41, 5.19s/it, bpd=5.35, g_l=5.35, gn=3.36, l=5.04, p_l=5.26e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 62% 48/78 [04:50<02:36, 5.23s/it, bpd=4.69, g_l=4.69, gn=4.02, l=4.41, p_l=5.45e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 63% 49/78 [04:55<02:32, 5.24s/it, bpd=4.33, g_l=4.33, gn=3.08, l=4.08, p_l=5.33e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 64% 50/78 [05:01<02:30, 5.36s/it, bpd=4.43, g_l=4.43, gn=2.98, l=4.17, p_l=5.5e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 65% 51/78 [05:06<02:24, 5.36s/it, bpd=4.21, g_l=4.21, gn=3.47, l=3.96, p_l=5.93e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 67% 52/78 [05:12<02:20, 5.40s/it, bpd=6.39, g_l=6.39, gn=3.61, l=6.01, p_l=6.37e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 68% 53/78 [05:17<02:13, 5.36s/it, bpd=5.94, g_l=5.94, gn=3.63, l=5.59, p_l=6.41e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 69% 54/78 [05:22<02:08, 5.37s/it, bpd=4.46, g_l=4.46, gn=3.5, l=4.2, p_l=5.93e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 71% 55/78 [05:27<02:02, 5.33s/it, bpd=4.68, g_l=4.68, gn=3.66, l=4.41, p_l=4.9e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 72% 56/78 [05:33<01:57, 5.36s/it, bpd=5.14, g_l=5.14, gn=3.85, l=4.84, p_l=3.94e-6]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 73% 57/78 [05:38<01:51, 5.30s/it, bpd=4.03, g_l=4.03, gn=3, l=3.79, p_l=2.94e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 74% 58/78 [05:43<01:45, 5.27s/it, bpd=5.14, g_l=5.14, gn=3.7, l=4.84, p_l=2.29e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 76% 59/78 [05:48<01:39, 5.23s/it, bpd=5.6, g_l=5.6, gn=3.27, l=5.27, 
p_l=2.07e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 77% 60/78 [05:54<01:33, 5.21s/it, bpd=4.56, g_l=4.56, gn=3.87, l=4.29, p_l=1.84e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 78% 61/78 [05:59<01:28, 5.20s/it, bpd=4.97, g_l=4.97, gn=3.81, l=4.68, p_l=1.63e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 79% 62/78 [06:04<01:22, 5.19s/it, bpd=3.85, g_l=3.85, gn=4.71, l=3.62, p_l=1.45e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 81% 63/78 [06:09<01:17, 5.18s/it, bpd=5.18, g_l=5.18, gn=4.01, l=4.88, p_l=1.18e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 82% 64/78 [06:14<01:12, 5.19s/it, bpd=5.02, g_l=5.02, gn=3.76, l=4.72, p_l=9.23e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 83% 65/78 [06:19<01:07, 5.19s/it, bpd=4.08, g_l=4.08, gn=3.17, l=3.84, p_l=7.01e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 85% 66/78 [06:25<01:02, 5.19s/it, bpd=4.27, g_l=4.27, gn=3.81, l=4.02, p_l=5.91e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 86% 67/78 [06:30<00:57, 5.21s/it, bpd=5, g_l=5, gn=3.93, l=4.7, p_l=5.47e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 87% 68/78 [06:35<00:52, 5.21s/it, bpd=4.83, g_l=4.83, gn=4.65, l=4.55, p_l=5.36e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 88% 69/78 [06:40<00:46, 5.22s/it, bpd=5.68, g_l=5.68, gn=4.1, l=5.35, p_l=5.35e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 90% 70/78 [06:46<00:41, 5.22s/it, bpd=5, g_l=5, gn=5.64, l=4.71, p_l=5.58e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 91% 71/78 [06:51<00:36, 5.23s/it, bpd=4.64, g_l=4.64, gn=3, l=4.37, p_l=6.16e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 92% 72/78 [06:56<00:31, 5.22s/it, bpd=5.13, g_l=5.13, gn=3.6, l=4.83, p_l=6.4e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 94% 73/78 [07:01<00:26, 5.22s/it, bpd=6.79, g_l=6.79, gn=4.18, l=6.39, p_l=6.78e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 95% 74/78 [07:06<00:20, 5.21s/it, bpd=5.46, g_l=5.46, gn=3.71, l=5.14, p_l=7.2e-7]/content/gdrive/MyDrive/slon/slon 
(10).txt\n"," 96% 75/78 [07:12<00:15, 5.20s/it, bpd=4.4, g_l=4.4, gn=3.69, l=4.14, p_l=7.37e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n","100% 78/78 [07:27<00:00, 5.74s/it, bpd=4.15, g_l=4.15, gn=3.65, l=3.9, p_l=7.69e-7]\n","Train bpd: 4.8282 prime_loss: 0.0000 gen_loss: 4.8282 loss: 4.5441 gn: 3.6348 lr: 0.0003 lg_loss_scale: 16.7500 epoch: 17.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (6).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1477\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.02s/it, bpd=4.24, l=3.99]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:13, 1.89s/it, bpd=5.09, l=4.79]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 33% 3/9 [00:05<00:10, 1.74s/it, bpd=4.91, l=4.62]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 4/9 [00:06<00:08, 1.64s/it, bpd=5.12, l=4.82]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=5.47, l=5.15]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=4.93, l=4.64]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=5.54, l=5.22]\n","Ema bpd: 5.0931 prime_loss: 0.0153 gen_loss: 5.0931 loss: 4.7938 epoch: 17.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (17).txt\n","/content/gdrive/MyDrive/slon/slon (13).txt\n","/content/gdrive/MyDrive/slon/slon (4).txt\n"," 1% 1/78 [00:05<07:05, 5.53s/it, bpd=4.29, g_l=4.29, gn=3.52, l=4.04, p_l=8.49e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 3% 2/78 [00:10<06:53, 5.45s/it, bpd=6.05, g_l=6.05, gn=3.21, l=5.69, p_l=9.76e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 4% 3/78 [00:16<06:44, 5.39s/it, bpd=4.87, g_l=4.87, gn=5.35, l=4.59, p_l=1.08e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 5% 4/78 [00:21<06:37, 5.37s/it, bpd=3.87, g_l=3.87, gn=3.73, l=3.64, p_l=1.17e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 6% 5/78 
[00:26<06:30, 5.35s/it, bpd=4.24, g_l=4.24, gn=4.55, l=3.99, p_l=1.27e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 8% 6/78 [00:31<06:23, 5.33s/it, bpd=5.66, g_l=5.66, gn=3.04, l=5.33, p_l=1.33e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 9% 7/78 [00:37<06:16, 5.30s/it, bpd=3.58, g_l=3.58, gn=3.79, l=3.37, p_l=1.33e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 10% 8/78 [00:42<06:08, 5.27s/it, bpd=5.63, g_l=5.63, gn=3.42, l=5.3, p_l=1.35e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 12% 9/78 [00:47<06:01, 5.24s/it, bpd=4.83, g_l=4.83, gn=3.97, l=4.55, p_l=1.48e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 13% 10/78 [00:52<05:54, 5.21s/it, bpd=4.29, g_l=4.29, gn=3.48, l=4.04, p_l=1.61e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 14% 11/78 [00:57<05:48, 5.20s/it, bpd=4.45, g_l=4.45, gn=3.88, l=4.19, p_l=1.73e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 15% 12/78 [01:03<05:42, 5.19s/it, bpd=4.65, g_l=4.65, gn=4.36, l=4.37, p_l=1.89e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 17% 13/78 [01:08<05:37, 5.19s/it, bpd=4.5, g_l=4.5, gn=4.29, l=4.24, p_l=2.02e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 18% 14/78 [01:13<05:31, 5.19s/it, bpd=4.95, g_l=4.95, gn=3.95, l=4.66, p_l=2.11e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 19% 15/78 [01:18<05:26, 5.19s/it, bpd=4.2, g_l=4.2, gn=4.02, l=3.96, p_l=2.22e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 21% 16/78 [01:23<05:21, 5.19s/it, bpd=5.2, g_l=5.2, gn=3.08, l=4.89, p_l=2.37e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 22% 17/78 [01:28<05:16, 5.19s/it, bpd=4.28, g_l=4.28, gn=3.8, l=4.03, p_l=2.7e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 23% 18/78 [01:34<05:11, 5.19s/it, bpd=4.93, g_l=4.93, gn=5.56, l=4.64, p_l=3.08e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 24% 19/78 [01:39<05:06, 5.20s/it, bpd=4.77, g_l=4.77, gn=3, l=4.49, p_l=3.61e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 26% 20/78 [01:44<05:01, 5.20s/it, bpd=4.88, g_l=4.88, gn=3.78, 
l=4.59, p_l=4e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 27% 21/78 [01:49<04:56, 5.20s/it, bpd=5.03, g_l=5.03, gn=3.38, l=4.74, p_l=4.17e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 28% 22/78 [01:55<04:52, 5.21s/it, bpd=4.32, g_l=4.32, gn=3.27, l=4.07, p_l=4.02e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 29% 23/78 [02:05<06:14, 6.81s/it, bpd=4.27, g_l=4.27, gn=4.14, l=4.01, p_l=3.74e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 31% 24/78 [02:10<05:40, 6.30s/it, bpd=4.38, g_l=4.38, gn=3.5, l=4.12, p_l=3.44e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 32% 25/78 [02:15<05:16, 5.97s/it, bpd=4.18, g_l=4.18, gn=3.88, l=3.93, p_l=3.33e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 33% 26/78 [02:21<04:58, 5.73s/it, bpd=4.35, g_l=4.35, gn=5.27, l=4.09, p_l=3.45e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 35% 27/78 [02:26<04:47, 5.63s/it, bpd=5.95, g_l=5.95, gn=3.24, l=5.6, p_l=3.56e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 36% 28/78 [02:31<04:35, 5.51s/it, bpd=4.22, g_l=4.22, gn=3.67, l=3.97, p_l=3.72e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n","\n","Overflow in backward. 
Loss 4.0261383056640625, grad norm inf, lgscale 17.020000000000223, new lgscale 16.020000000000223\n"," 37% 29/78 [02:36<04:14, 5.18s/it, bpd=4.22, g_l=4.22, gn=3.67, l=3.97, p_l=3.72e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 38% 30/78 [02:41<04:09, 5.19s/it, bpd=4.17, g_l=4.17, gn=3.08, l=3.93, p_l=3.84e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 40% 31/78 [02:46<04:04, 5.20s/it, bpd=5.92, g_l=5.92, gn=2.95, l=5.57, p_l=3.8e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 41% 32/78 [02:51<03:59, 5.20s/it, bpd=5.17, g_l=5.17, gn=3.14, l=4.86, p_l=3.61e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 42% 33/78 [02:56<03:53, 5.20s/it, bpd=4.91, g_l=4.91, gn=3.4, l=4.62, p_l=3.53e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 44% 34/78 [03:02<03:48, 5.20s/it, bpd=5.15, g_l=5.15, gn=5.26, l=4.85, p_l=3.37e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 45% 35/78 [03:07<03:43, 5.19s/it, bpd=5.74, g_l=5.74, gn=2.87, l=5.4, p_l=3.31e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 46% 36/78 [03:12<03:38, 5.19s/it, bpd=4.52, g_l=4.52, gn=4.58, l=4.26, p_l=3.67e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 47% 37/78 [03:17<03:32, 5.19s/it, bpd=4.26, g_l=4.26, gn=4.34, l=4.01, p_l=3.93e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 49% 38/78 [03:22<03:27, 5.18s/it, bpd=4.94, g_l=4.94, gn=3.28, l=4.65, p_l=4.46e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 50% 39/78 [03:28<03:21, 5.17s/it, bpd=5.45, g_l=5.45, gn=3.26, l=5.13, p_l=5.12e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 51% 40/78 [03:33<03:16, 5.17s/it, bpd=5.05, g_l=5.05, gn=3.37, l=4.75, p_l=5.54e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 53% 41/78 [03:38<03:11, 5.18s/it, bpd=5.24, g_l=5.24, gn=2.92, l=4.93, p_l=5.54e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 54% 42/78 [03:43<03:06, 5.17s/it, bpd=4.46, g_l=4.46, gn=3.76, l=4.19, p_l=5.25e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 55% 43/78 [03:48<03:01, 5.18s/it, bpd=5.71, g_l=5.71, gn=3.41, 
l=5.37, p_l=4.89e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 56% 44/78 [03:53<02:56, 5.18s/it, bpd=4.65, g_l=4.65, gn=3.52, l=4.37, p_l=4.35e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 58% 45/78 [03:59<02:51, 5.18s/it, bpd=4.51, g_l=4.51, gn=3.99, l=4.24, p_l=3.98e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 59% 46/78 [04:04<02:46, 5.20s/it, bpd=4.09, g_l=4.09, gn=3.53, l=3.85, p_l=3.88e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 60% 47/78 [04:09<02:41, 5.21s/it, bpd=4.36, g_l=4.36, gn=3.94, l=4.1, p_l=4.17e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 62% 48/78 [04:14<02:36, 5.20s/it, bpd=6.13, g_l=6.13, gn=3.37, l=5.77, p_l=4.42e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 63% 49/78 [04:19<02:30, 5.20s/it, bpd=5.16, g_l=5.16, gn=4.93, l=4.85, p_l=4.88e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 64% 50/78 [04:25<02:25, 5.20s/it, bpd=5.78, g_l=5.78, gn=3.69, l=5.44, p_l=5.27e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 65% 51/78 [04:30<02:20, 5.20s/it, bpd=4.29, g_l=4.29, gn=3.85, l=4.03, p_l=5.38e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 67% 52/78 [04:35<02:15, 5.21s/it, bpd=3.47, g_l=3.47, gn=3.23, l=3.27, p_l=4.94e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 68% 53/78 [04:40<02:10, 5.21s/it, bpd=5.27, g_l=5.27, gn=4.24, l=4.96, p_l=4.46e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 69% 54/78 [04:46<02:05, 5.23s/it, bpd=4.72, g_l=4.72, gn=4.53, l=4.44, p_l=4.48e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 71% 55/78 [04:51<02:00, 5.22s/it, bpd=4.21, g_l=4.21, gn=3.34, l=3.96, p_l=4.54e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 72% 56/78 [04:56<01:54, 5.23s/it, bpd=6.16, g_l=6.16, gn=3.46, l=5.79, p_l=4.75e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 73% 57/78 [05:01<01:49, 5.23s/it, bpd=4.39, g_l=4.39, gn=3.72, l=4.14, p_l=5.14e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 74% 58/78 [05:06<01:44, 5.22s/it, bpd=5.87, g_l=5.87, gn=5.63, l=5.53, 
p_l=5.52e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 76% 59/78 [05:12<01:39, 5.21s/it, bpd=4.71, g_l=4.71, gn=4.12, l=4.44, p_l=5.31e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 77% 60/78 [05:17<01:33, 5.21s/it, bpd=4.01, g_l=4.01, gn=3.12, l=3.77, p_l=4.8e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 78% 61/78 [05:22<01:28, 5.20s/it, bpd=5.26, g_l=5.26, gn=2.88, l=4.95, p_l=4.65e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 79% 62/78 [05:27<01:23, 5.19s/it, bpd=5.76, g_l=5.76, gn=3.23, l=5.42, p_l=4.55e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 81% 63/78 [05:32<01:17, 5.20s/it, bpd=4.46, g_l=4.46, gn=4.62, l=4.2, p_l=4.99e-6]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 82% 64/78 [05:38<01:12, 5.19s/it, bpd=4.14, g_l=4.14, gn=5.45, l=3.89, p_l=6.07e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 83% 65/78 [05:43<01:07, 5.20s/it, bpd=4.19, g_l=4.19, gn=4.48, l=3.94, p_l=7.72e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 85% 66/78 [05:48<01:02, 5.20s/it, bpd=5.36, g_l=5.36, gn=4.12, l=5.05, p_l=1e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 86% 67/78 [05:53<00:57, 5.21s/it, bpd=4.71, g_l=4.71, gn=3.59, l=4.43, p_l=1.03e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 87% 68/78 [05:58<00:52, 5.21s/it, bpd=5.59, g_l=5.59, gn=3.47, l=5.26, p_l=8.89e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 88% 69/78 [06:04<00:47, 5.22s/it, bpd=4.53, g_l=4.53, gn=3.51, l=4.26, p_l=6.93e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 90% 70/78 [06:09<00:41, 5.22s/it, bpd=4.66, g_l=4.66, gn=3.85, l=4.38, p_l=5.36e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 91% 71/78 [06:14<00:36, 5.22s/it, bpd=4.39, g_l=4.39, gn=3.22, l=4.13, p_l=4.32e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 92% 72/78 [06:19<00:31, 5.21s/it, bpd=5.6, g_l=5.6, gn=3.51, l=5.27, p_l=3.56e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 94% 73/78 [06:24<00:26, 5.21s/it, bpd=5.93, g_l=5.93, gn=3.74, l=5.58, 
p_l=3.24e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 95% 74/78 [06:30<00:20, 5.21s/it, bpd=5.32, g_l=5.32, gn=4.97, l=5, p_l=3.19e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 96% 75/78 [06:35<00:15, 5.21s/it, bpd=4.62, g_l=4.62, gn=3.68, l=4.35, p_l=2.93e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n","100% 78/78 [06:51<00:00, 5.27s/it, bpd=6.52, g_l=6.52, gn=2.89, l=6.14, p_l=2.12e-6]\n","Train bpd: 4.8619 prime_loss: 0.0000 gen_loss: 4.8619 loss: 4.5759 gn: 3.8504 lr: 0.0003 lg_loss_scale: 16.4236 epoch: 18.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1554\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.03s/it, bpd=5.61, l=5.28]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 22% 2/9 [00:03<00:13, 1.91s/it, bpd=4.95, l=4.66]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 33% 3/9 [00:05<00:10, 1.75s/it, bpd=3.91, l=3.68]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 44% 4/9 [00:06<00:08, 1.64s/it, bpd=5.14, l=4.84]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=5.55, l=5.22]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.53s/it, bpd=5.21, l=4.91]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.51s/it, bpd=4.91, l=4.62]\n","Ema bpd: 5.0011 prime_loss: 0.0150 gen_loss: 5.0011 loss: 4.7073 epoch: 18.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (21).txt\n","/content/gdrive/MyDrive/slon/slon (17).txt\n","/content/gdrive/MyDrive/slon/slon (4).txt\n"," 1% 1/78 [00:05<06:53, 5.37s/it, bpd=5.97, g_l=5.97, gn=3.62, l=5.62, p_l=1.83e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 3% 2/78 [00:10<06:44, 5.33s/it, bpd=4.57, g_l=4.57, gn=3.68, l=4.3, p_l=1.6e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 4% 3/78 [00:15<06:38, 5.31s/it, bpd=4.71, g_l=4.71, gn=3.6, l=4.43, 
p_l=1.52e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 5% 4/78 [00:21<06:32, 5.31s/it, bpd=5.88, g_l=5.88, gn=3.06, l=5.53, p_l=1.54e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 6% 5/78 [00:26<06:27, 5.31s/it, bpd=4.84, g_l=4.84, gn=5.57, l=4.56, p_l=1.6e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 8% 6/78 [00:31<06:22, 5.31s/it, bpd=5.54, g_l=5.54, gn=3.91, l=5.21, p_l=1.67e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 9% 7/78 [00:37<06:16, 5.30s/it, bpd=4.8, g_l=4.8, gn=4.94, l=4.52, p_l=1.85e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 10% 8/78 [00:42<06:09, 5.28s/it, bpd=4.09, g_l=4.09, gn=3.44, l=3.85, p_l=1.99e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 12% 9/78 [00:47<06:02, 5.26s/it, bpd=5.08, g_l=5.08, gn=4.88, l=4.78, p_l=2.02e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 13% 10/78 [00:52<05:56, 5.24s/it, bpd=6.04, g_l=6.04, gn=3.3, l=5.68, p_l=2.06e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 14% 11/78 [00:57<05:48, 5.21s/it, bpd=4.65, g_l=4.65, gn=3.67, l=4.38, p_l=1.98e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 15% 12/78 [01:03<05:43, 5.20s/it, bpd=5.49, g_l=5.49, gn=3.3, l=5.17, p_l=1.97e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 17% 13/78 [01:08<05:36, 5.17s/it, bpd=5.3, g_l=5.3, gn=3.23, l=4.99, p_l=1.87e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 18% 14/78 [01:13<05:30, 5.17s/it, bpd=4.24, g_l=4.24, gn=3.22, l=3.99, p_l=1.82e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 19% 15/78 [01:18<05:25, 5.17s/it, bpd=5.27, g_l=5.27, gn=3.22, l=4.96, p_l=1.75e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 21% 16/78 [01:23<05:20, 5.18s/it, bpd=5.64, g_l=5.64, gn=3.64, l=5.3, p_l=1.81e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 22% 17/78 [01:28<05:16, 5.18s/it, bpd=4.43, g_l=4.43, gn=4.18, l=4.17, p_l=1.92e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 23% 18/78 [01:34<05:11, 5.20s/it, bpd=4.15, g_l=4.15, gn=3.7, l=3.9, p_l=2.08e-6]/content/gdrive/MyDrive/slon/slon 
(22).txt\n"," 24% 19/78 [01:39<05:07, 5.21s/it, bpd=5.03, g_l=5.03, gn=3.38, l=4.73, p_l=2.13e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 26% 20/78 [01:44<05:02, 5.22s/it, bpd=4.59, g_l=4.59, gn=4.71, l=4.32, p_l=2.12e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 27% 21/78 [01:49<04:57, 5.22s/it, bpd=4.79, g_l=4.79, gn=3.43, l=4.51, p_l=2.08e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 28% 22/78 [01:54<04:52, 5.22s/it, bpd=5.95, g_l=5.95, gn=3.12, l=5.6, p_l=2.06e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 29% 23/78 [02:00<04:46, 5.22s/it, bpd=3.99, g_l=3.99, gn=3.75, l=3.76, p_l=2.03e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 31% 24/78 [02:05<04:41, 5.21s/it, bpd=5.45, g_l=5.45, gn=2.89, l=5.13, p_l=2.13e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 32% 25/78 [02:10<04:36, 5.21s/it, bpd=4.57, g_l=4.57, gn=4.02, l=4.3, p_l=2.25e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 33% 26/78 [02:15<04:30, 5.20s/it, bpd=4.94, g_l=4.94, gn=4.25, l=4.65, p_l=2.29e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 35% 27/78 [02:21<04:25, 5.21s/it, bpd=5.49, g_l=5.49, gn=5.25, l=5.17, p_l=2.17e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 36% 28/78 [02:26<04:20, 5.21s/it, bpd=4.05, g_l=4.05, gn=3.53, l=3.81, p_l=2.26e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 37% 29/78 [02:31<04:15, 5.21s/it, bpd=4.7, g_l=4.7, gn=3.56, l=4.42, p_l=2.37e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 38% 30/78 [02:36<04:10, 5.21s/it, bpd=4.38, g_l=4.38, gn=4.69, l=4.12, p_l=2.54e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 40% 31/78 [02:41<04:04, 5.21s/it, bpd=4.42, g_l=4.42, gn=3.52, l=4.16, p_l=2.75e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 41% 32/78 [02:47<03:59, 5.20s/it, bpd=4.49, g_l=4.49, gn=3.66, l=4.22, p_l=3.03e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 42% 33/78 [02:52<03:54, 5.20s/it, bpd=6.2, g_l=6.2, gn=3.2, l=5.83, p_l=3.39e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 44% 34/78 [02:57<03:48, 
5.20s/it, bpd=4.24, g_l=4.24, gn=3.7, l=3.99, p_l=3.49e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 45% 35/78 [03:02<03:43, 5.19s/it, bpd=3.22, g_l=3.22, gn=10.1, l=3.03, p_l=3.68e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 46% 36/78 [03:07<03:37, 5.19s/it, bpd=4.55, g_l=4.55, gn=3.35, l=4.28, p_l=3.75e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 47% 37/78 [03:12<03:32, 5.18s/it, bpd=5.38, g_l=5.38, gn=3.4, l=5.07, p_l=3.77e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 49% 38/78 [03:18<03:27, 5.19s/it, bpd=4.34, g_l=4.34, gn=6.06, l=4.08, p_l=3.79e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 50% 39/78 [03:23<03:22, 5.20s/it, bpd=5.78, g_l=5.78, gn=3.05, l=5.44, p_l=3.78e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 51% 40/78 [03:28<03:17, 5.21s/it, bpd=4.85, g_l=4.85, gn=3.21, l=4.57, p_l=3.84e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 53% 41/78 [03:33<03:12, 5.20s/it, bpd=4.17, g_l=4.17, gn=3.42, l=3.92, p_l=4.01e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 54% 42/78 [03:38<03:07, 5.20s/it, bpd=4.21, g_l=4.21, gn=4.18, l=3.96, p_l=3.99e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 55% 43/78 [03:44<03:01, 5.19s/it, bpd=4.78, g_l=4.78, gn=3.91, l=4.5, p_l=3.77e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 56% 44/78 [03:49<02:56, 5.18s/it, bpd=3.46, g_l=3.46, gn=3.4, l=3.25, p_l=3.56e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 58% 45/78 [03:54<02:51, 5.18s/it, bpd=4.47, g_l=4.47, gn=3.42, l=4.21, p_l=3.34e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 59% 46/78 [04:05<03:37, 6.78s/it, bpd=5.66, g_l=5.66, gn=3.24, l=5.33, p_l=2.74e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 60% 47/78 [04:10<03:14, 6.27s/it, bpd=4.91, g_l=4.91, gn=3.65, l=4.62, p_l=2.34e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 62% 48/78 [04:15<02:58, 5.95s/it, bpd=4.11, g_l=4.11, gn=3.13, l=3.86, p_l=2.09e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 63% 49/78 [04:20<02:45, 5.72s/it, bpd=3.97, g_l=3.97, gn=3.08, 
l=3.74, p_l=1.83e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 64% 50/78 [04:25<02:36, 5.59s/it, bpd=4.27, g_l=4.27, gn=3.44, l=4.02, p_l=1.57e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 65% 51/78 [04:31<02:28, 5.50s/it, bpd=3.94, g_l=3.94, gn=3.05, l=3.71, p_l=1.48e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 67% 52/78 [04:36<02:21, 5.45s/it, bpd=3.87, g_l=3.87, gn=3.03, l=3.64, p_l=1.39e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 68% 53/78 [04:41<02:15, 5.40s/it, bpd=4.29, g_l=4.29, gn=5.03, l=4.04, p_l=1.2e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 69% 54/78 [04:46<02:08, 5.36s/it, bpd=5.12, g_l=5.12, gn=3.63, l=4.82, p_l=1.08e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 71% 55/78 [04:52<02:02, 5.32s/it, bpd=4.09, g_l=4.09, gn=3.92, l=3.85, p_l=9.96e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 72% 56/78 [04:57<01:56, 5.28s/it, bpd=4.2, g_l=4.2, gn=3.18, l=3.96, p_l=9.37e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 73% 57/78 [05:02<01:50, 5.26s/it, bpd=5.15, g_l=5.15, gn=4.02, l=4.85, p_l=8.72e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 74% 58/78 [05:07<01:44, 5.23s/it, bpd=4.03, g_l=4.03, gn=3.97, l=3.8, p_l=8.69e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 76% 59/78 [05:12<01:39, 5.21s/it, bpd=5.14, g_l=5.14, gn=5.79, l=4.84, p_l=8.89e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 77% 60/78 [05:18<01:33, 5.19s/it, bpd=5.3, g_l=5.3, gn=3.7, l=4.99, p_l=9.03e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 78% 61/78 [05:23<01:28, 5.19s/it, bpd=4.77, g_l=4.77, gn=3.09, l=4.49, p_l=9.63e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 79% 62/78 [05:28<01:23, 5.19s/it, bpd=5.41, g_l=5.41, gn=3.41, l=5.09, p_l=1.02e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 81% 63/78 [05:33<01:18, 5.20s/it, bpd=3.8, g_l=3.8, gn=4.22, l=3.57, p_l=9.81e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 82% 64/78 [05:38<01:12, 5.20s/it, bpd=3.12, g_l=3.12, gn=3.61, l=2.94, 
p_l=9.04e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 83% 65/78 [05:44<01:07, 5.21s/it, bpd=5.04, g_l=5.04, gn=6.53, l=4.74, p_l=7.88e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 85% 66/78 [05:49<01:02, 5.20s/it, bpd=2.93, g_l=2.93, gn=5.05, l=2.75, p_l=7.11e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 86% 67/78 [05:54<00:57, 5.20s/it, bpd=4.6, g_l=4.6, gn=3.93, l=4.33, p_l=6.38e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 87% 68/78 [05:59<00:51, 5.20s/it, bpd=4.69, g_l=4.69, gn=4.72, l=4.42, p_l=5.97e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 88% 69/78 [06:04<00:46, 5.20s/it, bpd=4.7, g_l=4.7, gn=4.37, l=4.42, p_l=6.1e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 90% 70/78 [06:10<00:41, 5.21s/it, bpd=4.54, g_l=4.54, gn=3.07, l=4.28, p_l=6.56e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 91% 71/78 [06:15<00:36, 5.21s/it, bpd=4.66, g_l=4.66, gn=5.9, l=4.38, p_l=7.41e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 92% 72/78 [06:20<00:31, 5.21s/it, bpd=5.08, g_l=5.08, gn=4.26, l=4.78, p_l=8.54e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 94% 73/78 [06:25<00:26, 5.20s/it, bpd=4.51, g_l=4.51, gn=3.12, l=4.25, p_l=9.87e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 95% 74/78 [06:30<00:20, 5.21s/it, bpd=5.71, g_l=5.71, gn=3.04, l=5.38, p_l=1.1e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 96% 75/78 [06:36<00:15, 5.21s/it, bpd=6.09, g_l=6.09, gn=2.91, l=5.73, p_l=1.17e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n","100% 78/78 [06:51<00:00, 5.28s/it, bpd=4.19, g_l=4.19, gn=3.16, l=3.94, p_l=1.22e-6]\n","Train bpd: 4.7275 prime_loss: 0.0000 gen_loss: 4.7275 loss: 4.4494 gn: 3.8957 lr: 0.0003 lg_loss_scale: 16.3700 epoch: 19.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1632\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.03s/it, bpd=5.42, 
l=5.11]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 22% 2/9 [00:03<00:13, 1.89s/it, bpd=5.11, l=4.81]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:04<00:10, 1.74s/it, bpd=4.85, l=4.57]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 4/9 [00:06<00:08, 1.64s/it, bpd=5.3, l=4.99]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.56s/it, bpd=5.14, l=4.84]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=5.01, l=4.71]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=3.93, l=3.7]\n","Ema bpd: 4.9640 prime_loss: 0.0149 gen_loss: 4.9640 loss: 4.6724 epoch: 19.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (30).txt\n","/content/gdrive/MyDrive/slon/slon (2).txt\n","/content/gdrive/MyDrive/slon/slon (14).txt\n"," 1% 1/78 [00:05<06:54, 5.38s/it, bpd=5.91, g_l=5.91, gn=3.9, l=5.57, p_l=1.17e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 3% 2/78 [00:10<06:44, 5.33s/it, bpd=4.51, g_l=4.51, gn=3.88, l=4.25, p_l=1.2e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 4% 3/78 [00:15<06:38, 5.32s/it, bpd=5.88, g_l=5.88, gn=3.27, l=5.53, p_l=1.25e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 5% 4/78 [00:21<06:32, 5.31s/it, bpd=4.24, g_l=4.24, gn=3.78, l=3.99, p_l=1.37e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 6% 5/78 [00:26<06:28, 5.32s/it, bpd=4.45, g_l=4.45, gn=3.25, l=4.19, p_l=1.5e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 8% 6/78 [00:31<06:21, 5.30s/it, bpd=4.47, g_l=4.47, gn=3.32, l=4.21, p_l=1.69e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 9% 7/78 [00:37<06:15, 5.29s/it, bpd=5.22, g_l=5.22, gn=3.31, l=4.91, p_l=1.92e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 10% 8/78 [00:42<06:08, 5.27s/it, bpd=5.03, g_l=5.03, gn=4.7, l=4.73, p_l=2.13e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 12% 9/78 [00:47<06:03, 5.26s/it, bpd=5.16, g_l=5.16, gn=3.62, l=4.86, p_l=2.34e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 13% 
10/78 [00:52<05:56, 5.24s/it, bpd=4.62, g_l=4.62, gn=4.33, l=4.35, p_l=2.64e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [00:57<05:49, 5.22s/it, bpd=4.93, g_l=4.93, gn=3.15, l=4.64, p_l=2.71e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 15% 12/78 [01:02<05:42, 5.19s/it, bpd=5, g_l=5, gn=3.85, l=4.71, p_l=2.71e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 17% 13/78 [01:08<05:36, 5.18s/it, bpd=4.25, g_l=4.25, gn=3.64, l=4, p_l=2.9e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 18% 14/78 [01:13<05:31, 5.18s/it, bpd=4.99, g_l=4.99, gn=3.71, l=4.7, p_l=3.35e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 19% 15/78 [01:18<05:26, 5.18s/it, bpd=5.45, g_l=5.45, gn=3.41, l=5.13, p_l=3.97e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 21% 16/78 [01:23<05:21, 5.19s/it, bpd=4.48, g_l=4.48, gn=4.5, l=4.22, p_l=4.48e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 22% 17/78 [01:28<05:16, 5.18s/it, bpd=4.38, g_l=4.38, gn=3.53, l=4.12, p_l=4.82e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 23% 18/78 [01:34<05:11, 5.19s/it, bpd=5.56, g_l=5.56, gn=3.55, l=5.23, p_l=5e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 24% 19/78 [01:39<05:06, 5.19s/it, bpd=4.36, g_l=4.36, gn=3.31, l=4.1, p_l=4.82e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 26% 20/78 [01:44<05:01, 5.20s/it, bpd=3.83, g_l=3.83, gn=4.3, l=3.61, p_l=4.61e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 27% 21/78 [01:49<04:56, 5.20s/it, bpd=4.27, g_l=4.27, gn=3.91, l=4.02, p_l=4.83e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 28% 22/78 [01:54<04:51, 5.21s/it, bpd=5.44, g_l=5.44, gn=3.68, l=5.12, p_l=4.85e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 29% 23/78 [02:00<04:46, 5.20s/it, bpd=3.63, g_l=3.63, gn=3.56, l=3.42, p_l=5.04e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 31% 24/78 [02:05<04:41, 5.21s/it, bpd=4.68, g_l=4.68, gn=3.51, l=4.41, p_l=4.89e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 32% 25/78 [02:10<04:35, 5.21s/it, bpd=4.43, g_l=4.43, 
gn=3.78, l=4.17, p_l=4.43e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 33% 26/78 [02:15<04:30, 5.20s/it, bpd=5.53, g_l=5.53, gn=3.4, l=5.21, p_l=3.97e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 35% 27/78 [02:20<04:25, 5.21s/it, bpd=5.08, g_l=5.08, gn=3.79, l=4.79, p_l=3.7e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 36% 28/78 [02:26<04:20, 5.20s/it, bpd=4.53, g_l=4.53, gn=3.3, l=4.26, p_l=3.38e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 37% 29/78 [02:31<04:14, 5.20s/it, bpd=4.15, g_l=4.15, gn=4.31, l=3.91, p_l=3.38e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 38% 30/78 [02:36<04:09, 5.20s/it, bpd=4.84, g_l=4.84, gn=3.74, l=4.56, p_l=3.47e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 40% 31/78 [02:41<04:04, 5.20s/it, bpd=4.01, g_l=4.01, gn=3.51, l=3.78, p_l=3.53e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 41% 32/78 [02:46<03:58, 5.19s/it, bpd=3.87, g_l=3.87, gn=3.28, l=3.64, p_l=3.47e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 42% 33/78 [02:52<03:54, 5.20s/it, bpd=5.55, g_l=5.55, gn=3.69, l=5.22, p_l=3.32e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 44% 34/78 [02:57<03:48, 5.19s/it, bpd=4.34, g_l=4.34, gn=3.32, l=4.09, p_l=3.16e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1667\u001b[0m\n"," 45% 35/78 [03:38<11:24, 15.91s/it, bpd=3.28, g_l=3.28, gn=5.96, l=3.08, p_l=2.92e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 46% 36/78 [03:43<08:53, 12.70s/it, bpd=4.54, g_l=4.54, gn=5.22, l=4.27, p_l=2.79e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 47% 37/78 [03:48<07:07, 10.42s/it, bpd=4.15, g_l=4.15, gn=3.71, l=3.91, p_l=2.59e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 49% 38/78 [03:53<05:52, 8.81s/it, bpd=4.07, g_l=4.07, gn=3.8, l=3.83, p_l=2.49e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 50% 39/78 [03:58<04:59, 7.67s/it, bpd=6.13, g_l=6.13, gn=3.69, l=5.77, p_l=2.36e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 51% 40/78 [04:03<04:22, 
6.91s/it, bpd=4.38, g_l=4.38, gn=3.53, l=4.12, p_l=2.12e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 53% 41/78 [04:08<03:55, 6.35s/it, bpd=5.65, g_l=5.65, gn=3.05, l=5.32, p_l=2e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 54% 42/78 [04:13<03:35, 6.00s/it, bpd=4.33, g_l=4.33, gn=3.78, l=4.08, p_l=1.95e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 55% 43/78 [04:19<03:20, 5.73s/it, bpd=4.49, g_l=4.49, gn=3.38, l=4.22, p_l=1.82e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 56% 44/78 [04:24<03:09, 5.57s/it, bpd=4.73, g_l=4.73, gn=3.7, l=4.45, p_l=1.84e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 58% 45/78 [04:29<02:59, 5.44s/it, bpd=4.11, g_l=4.11, gn=3.12, l=3.87, p_l=1.94e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 59% 46/78 [04:34<02:52, 5.38s/it, bpd=4.28, g_l=4.28, gn=3.01, l=4.03, p_l=1.91e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 60% 47/78 [04:39<02:44, 5.32s/it, bpd=4.53, g_l=4.53, gn=3.68, l=4.26, p_l=1.87e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 62% 48/78 [04:45<02:39, 5.33s/it, bpd=4.9, g_l=4.9, gn=3.7, l=4.61, p_l=1.73e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 63% 49/78 [04:50<02:33, 5.30s/it, bpd=4.44, g_l=4.44, gn=4.52, l=4.17, p_l=1.59e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 64% 50/78 [04:55<02:27, 5.28s/it, bpd=5.91, g_l=5.91, gn=3.35, l=5.56, p_l=1.44e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 65% 51/78 [05:00<02:22, 5.28s/it, bpd=5.29, g_l=5.29, gn=3.54, l=4.98, p_l=1.21e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 67% 52/78 [05:06<02:17, 5.28s/it, bpd=4.79, g_l=4.79, gn=3.53, l=4.51, p_l=1.01e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 68% 53/78 [05:11<02:12, 5.30s/it, bpd=5.4, g_l=5.4, gn=3.21, l=5.08, p_l=8.96e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 69% 54/78 [05:16<02:06, 5.28s/it, bpd=4.81, g_l=4.81, gn=3.41, l=4.53, p_l=8.47e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 71% 55/78 [05:22<02:01, 5.28s/it, bpd=3.46, g_l=3.46, gn=3.75, 
l=3.26, p_l=8.93e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 72% 56/78 [05:27<01:55, 5.27s/it, bpd=5.15, g_l=5.15, gn=3.57, l=4.84, p_l=9.72e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 73% 57/78 [05:32<01:51, 5.30s/it, bpd=4.26, g_l=4.26, gn=3.64, l=4.01, p_l=1.03e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 74% 58/78 [05:37<01:45, 5.29s/it, bpd=4.75, g_l=4.75, gn=3.3, l=4.47, p_l=1.06e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 76% 59/78 [05:43<01:40, 5.31s/it, bpd=4.82, g_l=4.82, gn=3.74, l=4.54, p_l=1.05e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 77% 60/78 [05:48<01:35, 5.29s/it, bpd=5.46, g_l=5.46, gn=3.15, l=5.14, p_l=1.02e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 78% 61/78 [05:53<01:30, 5.30s/it, bpd=4.23, g_l=4.23, gn=3.46, l=3.98, p_l=9.5e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 79% 62/78 [05:59<01:24, 5.28s/it, bpd=4.4, g_l=4.4, gn=3.44, l=4.14, p_l=9.03e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 81% 63/78 [06:04<01:19, 5.29s/it, bpd=4.7, g_l=4.7, gn=3.24, l=4.42, p_l=9.47e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 82% 64/78 [06:09<01:13, 5.28s/it, bpd=3.11, g_l=3.11, gn=4.45, l=2.92, p_l=1.08e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 83% 65/78 [06:14<01:08, 5.26s/it, bpd=5.35, g_l=5.35, gn=3.09, l=5.04, p_l=1.16e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 85% 66/78 [06:20<01:02, 5.24s/it, bpd=5.44, g_l=5.44, gn=3.46, l=5.12, p_l=1.16e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 86% 67/78 [06:25<00:57, 5.22s/it, bpd=4.25, g_l=4.25, gn=4.08, l=4, p_l=1.2e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 87% 68/78 [06:32<00:59, 5.95s/it, bpd=4.21, g_l=4.21, gn=3.49, l=3.96, p_l=1.37e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 88% 69/78 [06:38<00:51, 5.72s/it, bpd=3.99, g_l=3.99, gn=3.11, l=3.75, p_l=1.72e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 90% 70/78 [06:43<00:44, 5.56s/it, bpd=3.93, g_l=3.93, gn=6.66, l=3.69, 
p_l=2.13e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 91% 71/78 [06:48<00:38, 5.45s/it, bpd=4.5, g_l=4.5, gn=3.57, l=4.23, p_l=2.57e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 92% 72/78 [06:53<00:32, 5.39s/it, bpd=5.45, g_l=5.45, gn=4.02, l=5.13, p_l=2.98e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 94% 73/78 [06:58<00:26, 5.33s/it, bpd=4.77, g_l=4.77, gn=5.67, l=4.49, p_l=3.24e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 95% 74/78 [07:04<00:21, 5.29s/it, bpd=5.28, g_l=5.28, gn=3.73, l=4.97, p_l=3.19e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 96% 75/78 [07:09<00:15, 5.27s/it, bpd=5.37, g_l=5.37, gn=3.45, l=5.05, p_l=2.75e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n","100% 78/78 [07:25<00:00, 5.71s/it, bpd=6.08, g_l=6.08, gn=2.82, l=5.72, p_l=1.69e-6]\n","Train bpd: 4.7149 prime_loss: 0.0000 gen_loss: 4.7149 loss: 4.4375 gn: 3.7190 lr: 0.0003 lg_loss_scale: 16.6820 epoch: 20.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1710\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.02s/it, bpd=4.94, l=4.65]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 22% 2/9 [00:03<00:13, 1.88s/it, bpd=5.88, l=5.53]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 33% 3/9 [00:04<00:10, 1.74s/it, bpd=4.91, l=4.62]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 44% 4/9 [00:06<00:08, 1.64s/it, bpd=5.74, l=5.4]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=4.81, l=4.53]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=4.94, l=4.65]/content/gdrive/MyDrive/slon/slon (6).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=4.89, l=4.6]\n","Ema bpd: 4.9929 prime_loss: 0.0147 gen_loss: 4.9929 loss: 4.6996 epoch: 20.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (15).txt\n","/content/gdrive/MyDrive/slon/slon 
(24).txt\n","/content/gdrive/MyDrive/slon/slon (19).txt\n"," 1% 1/78 [00:05<07:02, 5.49s/it, bpd=4.72, g_l=4.72, gn=3.85, l=4.45, p_l=1.69e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 3% 2/78 [00:10<06:51, 5.41s/it, bpd=5.44, g_l=5.44, gn=3.47, l=5.12, p_l=1.55e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 4% 3/78 [00:15<06:41, 5.36s/it, bpd=5.46, g_l=5.46, gn=4.02, l=5.14, p_l=1.49e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 5% 4/78 [00:21<06:34, 5.33s/it, bpd=3.91, g_l=3.91, gn=3.5, l=3.68, p_l=1.54e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 6% 5/78 [00:26<06:27, 5.31s/it, bpd=4.64, g_l=4.64, gn=3.4, l=4.37, p_l=1.5e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 8% 6/78 [00:31<06:20, 5.29s/it, bpd=4.71, g_l=4.71, gn=4.45, l=4.43, p_l=1.4e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 9% 7/78 [00:36<06:14, 5.28s/it, bpd=4.69, g_l=4.69, gn=3.99, l=4.41, p_l=1.36e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 10% 8/78 [00:42<06:08, 5.26s/it, bpd=4.76, g_l=4.76, gn=3.6, l=4.48, p_l=1.27e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 12% 9/78 [00:47<06:02, 5.26s/it, bpd=6.23, g_l=6.23, gn=3.68, l=5.86, p_l=1.13e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 13% 10/78 [00:52<05:55, 5.23s/it, bpd=2.96, g_l=2.96, gn=3.04, l=2.79, p_l=1.07e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 14% 11/78 [00:57<05:49, 5.22s/it, bpd=4.03, g_l=4.03, gn=3.35, l=3.79, p_l=1.14e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 15% 12/78 [01:02<05:43, 5.21s/it, bpd=5.05, g_l=5.05, gn=3.29, l=4.75, p_l=1.24e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 17% 13/78 [01:08<05:38, 5.21s/it, bpd=4, g_l=4, gn=3.03, l=3.76, p_l=1.31e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 18% 14/78 [01:13<05:32, 5.19s/it, bpd=4.7, g_l=4.7, gn=3.44, l=4.43, p_l=1.35e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 19% 15/78 [01:18<05:27, 5.19s/it, bpd=3.59, g_l=3.59, gn=3.41, l=3.38, p_l=1.37e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 21% 
16/78 [01:23<05:21, 5.19s/it, bpd=3.08, g_l=3.08, gn=2.97, l=2.9, p_l=1.32e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 22% 17/78 [01:28<05:15, 5.18s/it, bpd=4.87, g_l=4.87, gn=3.56, l=4.58, p_l=1.24e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 23% 18/78 [01:34<05:10, 5.18s/it, bpd=4.09, g_l=4.09, gn=4.38, l=3.85, p_l=1.17e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 24% 19/78 [01:39<05:05, 5.17s/it, bpd=4.11, g_l=4.11, gn=3.41, l=3.86, p_l=1.04e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 26% 20/78 [01:44<05:00, 5.18s/it, bpd=4.74, g_l=4.74, gn=3.47, l=4.46, p_l=1.01e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 27% 21/78 [01:49<04:55, 5.18s/it, bpd=4.23, g_l=4.23, gn=3.23, l=3.98, p_l=9.63e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 28% 22/78 [01:54<04:50, 5.19s/it, bpd=5.09, g_l=5.09, gn=4.07, l=4.79, p_l=1.02e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 29% 23/78 [02:00<04:45, 5.20s/it, bpd=4.34, g_l=4.34, gn=3.69, l=4.09, p_l=1.05e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 31% 24/78 [02:05<04:41, 5.21s/it, bpd=4.75, g_l=4.75, gn=3.21, l=4.47, p_l=1.11e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 32% 25/78 [02:10<04:36, 5.21s/it, bpd=4.05, g_l=4.05, gn=3.88, l=3.81, p_l=1.18e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 33% 26/78 [02:15<04:31, 5.22s/it, bpd=5.42, g_l=5.42, gn=3.52, l=5.1, p_l=1.36e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 35% 27/78 [02:20<04:26, 5.22s/it, bpd=5.14, g_l=5.14, gn=2.91, l=4.84, p_l=1.64e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 36% 28/78 [02:26<04:21, 5.23s/it, bpd=4.18, g_l=4.18, gn=3.26, l=3.94, p_l=1.99e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 37% 29/78 [02:31<04:15, 5.22s/it, bpd=4.47, g_l=4.47, gn=3.22, l=4.2, p_l=2.42e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 38% 30/78 [02:36<04:10, 5.22s/it, bpd=5.14, g_l=5.14, gn=3.85, l=4.83, p_l=2.82e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 40% 31/78 [02:41<04:05, 5.22s/it, 
bpd=4.98, g_l=4.98, gn=4.92, l=4.69, p_l=2.87e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 41% 32/78 [02:47<03:59, 5.22s/it, bpd=4.17, g_l=4.17, gn=4.13, l=3.93, p_l=2.95e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 42% 33/78 [02:52<03:54, 5.21s/it, bpd=6.22, g_l=6.22, gn=3.35, l=5.85, p_l=3.02e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 44% 34/78 [02:57<03:49, 5.21s/it, bpd=5.45, g_l=5.45, gn=3.19, l=5.13, p_l=3.22e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 45% 35/78 [03:02<03:44, 5.21s/it, bpd=3.46, g_l=3.46, gn=3.73, l=3.26, p_l=3.33e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 46% 36/78 [03:07<03:38, 5.21s/it, bpd=4.18, g_l=4.18, gn=4.88, l=3.93, p_l=3.59e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 47% 37/78 [03:13<03:33, 5.22s/it, bpd=4.83, g_l=4.83, gn=4.15, l=4.54, p_l=3.79e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 49% 38/78 [03:18<03:28, 5.21s/it, bpd=4.48, g_l=4.48, gn=3.39, l=4.22, p_l=3.93e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 50% 39/78 [03:23<03:23, 5.22s/it, bpd=4.49, g_l=4.49, gn=4.4, l=4.23, p_l=4.12e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 51% 40/78 [03:28<03:18, 5.22s/it, bpd=4.47, g_l=4.47, gn=3.36, l=4.21, p_l=4.16e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 53% 41/78 [03:33<03:13, 5.23s/it, bpd=5.1, g_l=5.1, gn=3.23, l=4.8, p_l=4.11e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 54% 42/78 [03:39<03:07, 5.21s/it, bpd=5.08, g_l=5.08, gn=3.99, l=4.78, p_l=3.92e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 55% 43/78 [03:44<03:02, 5.21s/it, bpd=4.25, g_l=4.25, gn=4.43, l=4, p_l=3.79e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 56% 44/78 [03:49<02:56, 5.20s/it, bpd=4.31, g_l=4.31, gn=3.49, l=4.06, p_l=3.64e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 58% 45/78 [03:54<02:51, 5.19s/it, bpd=4.91, g_l=4.91, gn=4.86, l=4.62, p_l=3.51e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 59% 46/78 [03:59<02:46, 5.19s/it, bpd=5.91, g_l=5.91, gn=3.76, l=5.56, 
p_l=3.4e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 60% 47/78 [04:05<02:40, 5.19s/it, bpd=3.88, g_l=3.88, gn=3.44, l=3.65, p_l=3.62e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 62% 48/78 [04:10<02:35, 5.19s/it, bpd=4.02, g_l=4.02, gn=3.22, l=3.78, p_l=3.71e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 63% 49/78 [04:15<02:30, 5.19s/it, bpd=4.3, g_l=4.3, gn=7.18, l=4.04, p_l=3.81e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 64% 50/78 [04:20<02:25, 5.20s/it, bpd=5.7, g_l=5.7, gn=4.32, l=5.36, p_l=4.08e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 65% 51/78 [04:25<02:20, 5.20s/it, bpd=4.32, g_l=4.32, gn=3.4, l=4.07, p_l=3.84e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 67% 52/78 [04:31<02:15, 5.20s/it, bpd=4.96, g_l=4.96, gn=4.32, l=4.67, p_l=3.85e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 68% 53/78 [04:36<02:10, 5.20s/it, bpd=4.6, g_l=4.6, gn=3.49, l=4.33, p_l=4.03e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 69% 54/78 [04:41<02:04, 5.21s/it, bpd=3.7, g_l=3.7, gn=3.61, l=3.49, p_l=4.15e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 71% 55/78 [04:46<01:59, 5.21s/it, bpd=3.95, g_l=3.95, gn=3.17, l=3.72, p_l=4.13e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 72% 56/78 [04:51<01:54, 5.22s/it, bpd=5.67, g_l=5.67, gn=3.29, l=5.34, p_l=4.19e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 73% 57/78 [04:57<01:49, 5.21s/it, bpd=5.34, g_l=5.34, gn=3.42, l=5.02, p_l=4.18e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 74% 58/78 [05:02<01:44, 5.20s/it, bpd=5.09, g_l=5.09, gn=3.53, l=4.79, p_l=4.08e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 76% 59/78 [05:07<01:38, 5.19s/it, bpd=4.68, g_l=4.68, gn=4.62, l=4.4, p_l=3.68e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 77% 60/78 [05:12<01:33, 5.19s/it, bpd=5.47, g_l=5.47, gn=3.62, l=5.15, p_l=3.54e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 78% 61/78 [05:17<01:28, 5.19s/it, bpd=4.01, g_l=4.01, gn=2.93, l=3.77, p_l=3.46e-6]/content/gdrive/MyDrive/slon/slon 
(1).txt\n"," 79% 62/78 [05:23<01:22, 5.18s/it, bpd=4.14, g_l=4.14, gn=3.32, l=3.89, p_l=3.52e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 81% 63/78 [05:28<01:17, 5.19s/it, bpd=5.77, g_l=5.77, gn=3.21, l=5.43, p_l=3.67e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 82% 64/78 [05:33<01:12, 5.17s/it, bpd=4.39, g_l=4.39, gn=3.92, l=4.13, p_l=3.62e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 83% 65/78 [05:38<01:07, 5.18s/it, bpd=5.01, g_l=5.01, gn=3.92, l=4.71, p_l=3.4e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 85% 66/78 [05:43<01:02, 5.18s/it, bpd=4.13, g_l=4.13, gn=4.06, l=3.89, p_l=3.6e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 86% 67/78 [05:48<00:57, 5.19s/it, bpd=4.69, g_l=4.69, gn=4.74, l=4.41, p_l=3.35e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 87% 68/78 [05:54<00:51, 5.18s/it, bpd=4.49, g_l=4.49, gn=4.76, l=4.22, p_l=3.23e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 88% 69/78 [05:59<00:46, 5.19s/it, bpd=6.45, g_l=6.45, gn=3.27, l=6.07, p_l=3e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 90% 70/78 [06:04<00:41, 5.19s/it, bpd=5.79, g_l=5.79, gn=3.18, l=5.45, p_l=2.97e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 91% 71/78 [06:09<00:36, 5.19s/it, bpd=5.32, g_l=5.32, gn=4.26, l=5.01, p_l=3.06e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 92% 72/78 [06:14<00:31, 5.19s/it, bpd=4.29, g_l=4.29, gn=3.92, l=4.04, p_l=3.28e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 94% 73/78 [06:20<00:25, 5.18s/it, bpd=4.13, g_l=4.13, gn=3.32, l=3.89, p_l=3.36e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n","\n","Overflow in backward. 
Loss 4.311144828796387, grad norm nan, lgscale 17.132000000000264, new lgscale 16.132000000000264\n"," 95% 74/78 [06:24<00:19, 4.96s/it, bpd=4.13, g_l=4.13, gn=3.32, l=3.89, p_l=3.36e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 96% 75/78 [06:29<00:15, 5.02s/it, bpd=4.33, g_l=4.33, gn=4.07, l=4.07, p_l=3.35e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n","100% 78/78 [06:45<00:00, 5.20s/it, bpd=6.03, g_l=6.03, gn=3.94, l=5.68, p_l=3.03e-6]\n","Train bpd: 4.6996 prime_loss: 0.0000 gen_loss: 4.6996 loss: 4.4232 gn: 3.7506 lr: 0.0003 lg_loss_scale: 16.9401 epoch: 21.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1787\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.03s/it, bpd=5.03, l=4.73]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:13, 1.91s/it, bpd=5.02, l=4.72]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 33% 3/9 [00:05<00:10, 1.76s/it, bpd=4.48, l=4.22]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 44% 4/9 [00:06<00:08, 1.65s/it, bpd=4.62, l=4.35]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 56% 5/9 [00:07<00:06, 1.58s/it, bpd=5.22, l=4.91]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=5.88, l=5.53]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.51s/it, bpd=5.98, l=5.63]\n","Ema bpd: 5.0759 prime_loss: 0.0147 gen_loss: 5.0759 loss: 4.7777 epoch: 21.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (4).txt\n","/content/gdrive/MyDrive/slon/slon (30).txt\n","/content/gdrive/MyDrive/slon/slon (2).txt\n","\n","Overflow in backward. 
Loss 4.030820369720459, grad norm nan, lgscale 16.148000000000263, new lgscale 15.148000000000264\n"," 1% 1/78 [00:04<06:04, 4.74s/it]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 3% 2/78 [00:09<06:10, 4.87s/it, bpd=6.19, g_l=6.19, gn=3.16, l=5.83, p_l=3.02e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 4% 3/78 [00:15<06:13, 4.98s/it, bpd=4.04, g_l=4.04, gn=4.26, l=3.8, p_l=3.07e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 5% 4/78 [00:20<06:14, 5.06s/it, bpd=3.76, g_l=3.76, gn=3.56, l=3.54, p_l=3.04e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 6% 5/78 [00:25<06:13, 5.11s/it, bpd=4.39, g_l=4.39, gn=3.56, l=4.13, p_l=3.2e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 8% 6/78 [00:30<06:10, 5.15s/it, bpd=4.87, g_l=4.87, gn=3.42, l=4.58, p_l=3.29e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 9% 7/78 [00:36<06:07, 5.18s/it, bpd=5.64, g_l=5.64, gn=3.39, l=5.31, p_l=3.34e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 10% 8/78 [00:41<06:03, 5.19s/it, bpd=4.48, g_l=4.48, gn=4.52, l=4.22, p_l=3.12e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 12% 9/78 [00:46<05:59, 5.20s/it, bpd=5.7, g_l=5.7, gn=3.85, l=5.37, p_l=2.7e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 13% 10/78 [00:51<05:53, 5.20s/it, bpd=4.12, g_l=4.12, gn=4.42, l=3.88, p_l=2.15e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [00:56<05:48, 5.20s/it, bpd=6.22, g_l=6.22, gn=3.07, l=5.86, p_l=1.87e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 15% 12/78 [01:02<05:42, 5.19s/it, bpd=5.84, g_l=5.84, gn=3.08, l=5.5, p_l=1.75e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 17% 13/78 [01:07<05:37, 5.20s/it, bpd=4.14, g_l=4.14, gn=3.75, l=3.9, p_l=1.96e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 18% 14/78 [01:17<07:08, 6.69s/it, bpd=4.42, g_l=4.42, gn=6.23, l=4.16, p_l=2.45e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 19% 15/78 [01:22<06:31, 6.21s/it, bpd=3.64, g_l=3.64, gn=3.42, l=3.42, p_l=2.95e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 21% 
16/78 [01:27<06:05, 5.89s/it, bpd=4.6, g_l=4.6, gn=3.4, l=4.33, p_l=3.55e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 22% 17/78 [01:32<05:46, 5.68s/it, bpd=4.76, g_l=4.76, gn=4.38, l=4.48, p_l=4.06e-6]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 23% 18/78 [01:38<05:32, 5.54s/it, bpd=3.76, g_l=3.76, gn=3.25, l=3.54, p_l=4.06e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 24% 19/78 [01:43<05:22, 5.47s/it, bpd=5.68, g_l=5.68, gn=4.87, l=5.35, p_l=3.76e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 26% 20/78 [01:48<05:14, 5.42s/it, bpd=3.8, g_l=3.8, gn=5.66, l=3.57, p_l=3.28e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 27% 21/78 [01:54<05:07, 5.39s/it, bpd=5.01, g_l=5.01, gn=4.57, l=4.71, p_l=2.71e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 28% 22/78 [01:59<04:59, 5.35s/it, bpd=5.05, g_l=5.05, gn=3.99, l=4.75, p_l=2.25e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 29% 23/78 [02:04<04:52, 5.32s/it, bpd=3.19, g_l=3.19, gn=4.11, l=3, p_l=2.01e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 31% 24/78 [02:09<04:45, 5.28s/it, bpd=5.78, g_l=5.78, gn=3.43, l=5.44, p_l=1.88e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 32% 25/78 [02:15<04:39, 5.26s/it, bpd=4.52, g_l=4.52, gn=6.66, l=4.25, p_l=1.87e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 33% 26/78 [02:20<04:32, 5.23s/it, bpd=3.33, g_l=3.33, gn=4.25, l=3.13, p_l=1.77e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 35% 27/78 [02:25<04:26, 5.22s/it, bpd=4.94, g_l=4.94, gn=3.52, l=4.65, p_l=1.57e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 36% 28/78 [02:30<04:19, 5.20s/it, bpd=4.88, g_l=4.88, gn=4.24, l=4.59, p_l=1.28e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 37% 29/78 [02:35<04:14, 5.19s/it, bpd=3.98, g_l=3.98, gn=5.73, l=3.75, p_l=1.28e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 38% 30/78 [02:40<04:08, 5.18s/it, bpd=4.7, g_l=4.7, gn=9.84, l=4.42, p_l=1.34e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 40% 31/78 [02:46<04:03, 5.18s/it, bpd=5.06, 
g_l=5.06, gn=3.99, l=4.76, p_l=1.41e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 41% 32/78 [02:51<03:58, 5.18s/it, bpd=4.46, g_l=4.46, gn=5.94, l=4.2, p_l=1.41e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 42% 33/78 [02:56<03:53, 5.19s/it, bpd=3.89, g_l=3.89, gn=4.61, l=3.66, p_l=1.33e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 44% 34/78 [03:01<03:48, 5.20s/it, bpd=4.59, g_l=4.59, gn=3.85, l=4.32, p_l=1.3e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 45% 35/78 [03:06<03:43, 5.20s/it, bpd=4.43, g_l=4.43, gn=3.2, l=4.17, p_l=1.37e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 46% 36/78 [03:12<03:39, 5.22s/it, bpd=5.64, g_l=5.64, gn=3.59, l=5.31, p_l=1.47e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 47% 37/78 [03:17<03:33, 5.22s/it, bpd=4.57, g_l=4.57, gn=4.13, l=4.3, p_l=1.8e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 49% 38/78 [03:22<03:28, 5.21s/it, bpd=4.66, g_l=4.66, gn=3.38, l=4.39, p_l=2.55e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 50% 39/78 [03:27<03:23, 5.21s/it, bpd=3.93, g_l=3.93, gn=3.34, l=3.7, p_l=3.16e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 51% 40/78 [03:32<03:18, 5.21s/it, bpd=4.67, g_l=4.67, gn=5.28, l=4.39, p_l=3.48e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 53% 41/78 [03:38<03:12, 5.20s/it, bpd=5, g_l=5, gn=4.07, l=4.71, p_l=3.4e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 54% 42/78 [03:43<03:07, 5.21s/it, bpd=4.7, g_l=4.7, gn=3.85, l=4.42, p_l=3.43e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 55% 43/78 [03:48<03:02, 5.20s/it, bpd=4.61, g_l=4.61, gn=3.39, l=4.34, p_l=3.28e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 56% 44/78 [03:53<02:56, 5.21s/it, bpd=5.43, g_l=5.43, gn=3.55, l=5.11, p_l=2.76e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 58% 45/78 [03:58<02:51, 5.20s/it, bpd=4.17, g_l=4.17, gn=3.36, l=3.92, p_l=2.51e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 59% 46/78 [04:04<02:46, 5.19s/it, bpd=4.75, g_l=4.75, gn=3.49, l=4.47, 
p_l=2.65e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 60% 47/78 [04:09<02:40, 5.19s/it, bpd=4.51, g_l=4.51, gn=3.79, l=4.25, p_l=3.38e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 62% 48/78 [04:14<02:35, 5.18s/it, bpd=4.18, g_l=4.18, gn=5.79, l=3.93, p_l=4.09e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 63% 49/78 [04:19<02:30, 5.17s/it, bpd=4.11, g_l=4.11, gn=3.76, l=3.87, p_l=5.61e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 64% 50/78 [04:24<02:24, 5.17s/it, bpd=4.35, g_l=4.35, gn=4.32, l=4.1, p_l=7e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 65% 51/78 [04:29<02:19, 5.18s/it, bpd=4.33, g_l=4.33, gn=3.66, l=4.07, p_l=8.45e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 67% 52/78 [04:35<02:14, 5.18s/it, bpd=5.44, g_l=5.44, gn=3.7, l=5.12, p_l=9.98e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 68% 53/78 [04:40<02:09, 5.20s/it, bpd=4.16, g_l=4.16, gn=4.48, l=3.91, p_l=1.14e-5]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 69% 54/78 [04:45<02:04, 5.20s/it, bpd=4.99, g_l=4.99, gn=3.2, l=4.69, p_l=1.29e-5]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 71% 55/78 [04:50<01:59, 5.21s/it, bpd=4.79, g_l=4.79, gn=3.74, l=4.51, p_l=1.34e-5]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 72% 56/78 [04:56<01:54, 5.21s/it, bpd=5.86, g_l=5.86, gn=3.78, l=5.52, p_l=1.4e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 73% 57/78 [05:01<01:49, 5.22s/it, bpd=4.74, g_l=4.74, gn=3.66, l=4.46, p_l=1.47e-5]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 74% 58/78 [05:06<01:44, 5.21s/it, bpd=5.43, g_l=5.43, gn=3.6, l=5.11, p_l=1.54e-5]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 76% 59/78 [05:11<01:39, 5.22s/it, bpd=3.88, g_l=3.88, gn=3.37, l=3.65, p_l=1.85e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 77% 60/78 [05:16<01:33, 5.22s/it, bpd=4.45, g_l=4.45, gn=3.83, l=4.19, p_l=2.52e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 78% 61/78 [05:22<01:28, 5.22s/it, bpd=5.32, g_l=5.32, gn=2.81, l=5, p_l=2.98e-5]/content/gdrive/MyDrive/slon/slon 
(14).txt\n"," 79% 62/78 [05:27<01:23, 5.22s/it, bpd=4.88, g_l=4.88, gn=3.84, l=4.59, p_l=2.98e-5]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 81% 63/78 [05:32<01:18, 5.22s/it, bpd=4.07, g_l=4.07, gn=3.3, l=3.83, p_l=2.92e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 82% 64/78 [05:37<01:13, 5.22s/it, bpd=5.29, g_l=5.29, gn=4.63, l=4.98, p_l=2.91e-5]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 83% 65/78 [05:42<01:07, 5.21s/it, bpd=4.35, g_l=4.35, gn=4.22, l=4.09, p_l=3.17e-5]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 85% 66/78 [05:48<01:02, 5.22s/it, bpd=4.42, g_l=4.42, gn=4.65, l=4.16, p_l=4.16e-5]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 86% 67/78 [05:53<00:57, 5.22s/it, bpd=4.91, g_l=4.91, gn=3.71, l=4.62, p_l=4.84e-5]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 87% 68/78 [05:58<00:52, 5.22s/it, bpd=4.7, g_l=4.7, gn=4.01, l=4.42, p_l=5.36e-5]/content/gdrive/MyDrive/slon/slon (17).txt\n","\n","Overflow in backward. Loss 6.205726623535156, grad norm nan, lgscale 15.416000000000274, new lgscale 14.416000000000274\n"," 88% 69/78 [06:03<00:44, 4.97s/it, bpd=4.7, g_l=4.7, gn=4.01, l=4.42, p_l=5.36e-5]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 90% 70/78 [06:08<00:40, 5.05s/it, bpd=5.1, g_l=5.1, gn=3.69, l=4.8, p_l=4.94e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 91% 71/78 [06:13<00:35, 5.09s/it, bpd=4.51, g_l=4.51, gn=3.65, l=4.24, p_l=3.9e-5]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 92% 72/78 [06:18<00:30, 5.14s/it, bpd=3.57, g_l=3.57, gn=3.98, l=3.36, p_l=2.6e-5]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 94% 73/78 [06:23<00:25, 5.16s/it, bpd=5.55, g_l=5.55, gn=15.1, l=5.22, p_l=1.86e-5]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 95% 74/78 [06:29<00:20, 5.18s/it, bpd=4.99, g_l=4.99, gn=4.06, l=4.69, p_l=1.41e-5]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 96% 75/78 [06:34<00:15, 5.18s/it, bpd=4.74, g_l=4.74, gn=3.88, l=4.46, p_l=1.07e-5]/content/gdrive/MyDrive/slon/slon (14).txt\n","100% 78/78 [06:50<00:00, 5.26s/it, 
bpd=5.36, g_l=5.36, gn=3.97, l=5.04, p_l=7.04e-6]\n","Train bpd: 4.6783 prime_loss: 0.0000 gen_loss: 4.6783 loss: 4.4031 gn: 4.2371 lr: 0.0003 lg_loss_scale: 15.1796 epoch: 22.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (6).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1863\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.03s/it, bpd=5.34, l=5.02]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 22% 2/9 [00:03<00:13, 1.92s/it, bpd=4.68, l=4.4]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:05<00:10, 1.77s/it, bpd=5.72, l=5.38]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 44% 4/9 [00:06<00:08, 1.65s/it, bpd=4.85, l=4.56]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:07<00:06, 1.58s/it, bpd=4.29, l=4.04]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 67% 6/9 [00:09<00:04, 1.53s/it, bpd=4.66, l=4.38]/content/gdrive/MyDrive/slon/slon (5).txt\n","100% 9/9 [00:13<00:00, 1.51s/it, bpd=4.86, l=4.57]\n","Ema bpd: 5.0444 prime_loss: 0.0147 gen_loss: 5.0444 loss: 4.7480 epoch: 22.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (3).txt\n","/content/gdrive/MyDrive/slon/slon (28).txt\n","/content/gdrive/MyDrive/slon/slon (26).txt\n"," 1% 1/78 [00:05<06:59, 5.45s/it, bpd=5.3, g_l=5.3, gn=3.5, l=4.99, p_l=5.18e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 3% 2/78 [00:10<06:48, 5.37s/it, bpd=4.07, g_l=4.07, gn=3.6, l=3.83, p_l=3.52e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 4% 3/78 [00:15<06:40, 5.34s/it, bpd=4.82, g_l=4.82, gn=3.18, l=4.54, p_l=2.68e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 5% 4/78 [00:21<06:34, 5.33s/it, bpd=3.98, g_l=3.98, gn=5.5, l=3.74, p_l=2.12e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 6% 5/78 [00:26<06:28, 5.32s/it, bpd=5.55, g_l=5.55, gn=3.55, l=5.22, p_l=2.17e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 8% 6/78 [00:31<06:21, 5.30s/it, bpd=3.96, g_l=3.96, gn=3.72, l=3.73, 
p_l=2.07e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 9% 7/78 [00:37<06:15, 5.29s/it, bpd=5.08, g_l=5.08, gn=5.91, l=4.78, p_l=1.92e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 10% 8/78 [00:42<06:08, 5.26s/it, bpd=4.37, g_l=4.37, gn=4.03, l=4.11, p_l=1.8e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 12% 9/78 [00:47<06:02, 5.25s/it, bpd=5.38, g_l=5.38, gn=3.94, l=5.07, p_l=1.93e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 13% 10/78 [00:52<05:55, 5.23s/it, bpd=4.85, g_l=4.85, gn=4.31, l=4.56, p_l=1.82e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 14% 11/78 [00:57<05:49, 5.22s/it, bpd=5.66, g_l=5.66, gn=4.79, l=5.33, p_l=1.58e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 15% 12/78 [01:02<05:42, 5.19s/it, bpd=5, g_l=5, gn=4.58, l=4.71, p_l=1.26e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 17% 13/78 [01:08<05:36, 5.17s/it, bpd=4.48, g_l=4.48, gn=4.53, l=4.22, p_l=1.18e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 18% 14/78 [01:13<05:30, 5.17s/it, bpd=5.05, g_l=5.05, gn=3.49, l=4.76, p_l=1.21e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 19% 15/78 [01:18<05:25, 5.16s/it, bpd=5.84, g_l=5.84, gn=4.7, l=5.49, p_l=1.31e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 21% 16/78 [01:23<05:20, 5.16s/it, bpd=4.18, g_l=4.18, gn=3.94, l=3.93, p_l=1.27e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 22% 17/78 [01:28<05:15, 5.17s/it, bpd=3.18, g_l=3.18, gn=3.55, l=2.99, p_l=1.15e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 23% 18/78 [01:33<05:11, 5.19s/it, bpd=4.91, g_l=4.91, gn=3.78, l=4.62, p_l=1.05e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 24% 19/78 [01:39<05:06, 5.19s/it, bpd=5.11, g_l=5.11, gn=6.5, l=4.81, p_l=9.02e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 26% 20/78 [01:44<05:02, 5.22s/it, bpd=4.63, g_l=4.63, gn=4.96, l=4.36, p_l=7.71e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 27% 21/78 [01:49<04:57, 5.22s/it, bpd=4.28, g_l=4.28, gn=5.08, l=4.03, p_l=6.69e-7]/content/gdrive/MyDrive/slon/slon 
(14).txt\n"," 28% 22/78 [01:54<04:52, 5.23s/it, bpd=4.48, g_l=4.48, gn=3.7, l=4.21, p_l=6.23e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 29% 23/78 [02:00<04:46, 5.22s/it, bpd=4.55, g_l=4.55, gn=3.85, l=4.29, p_l=6.59e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 31% 24/78 [02:05<04:41, 5.22s/it, bpd=5.1, g_l=5.1, gn=3.73, l=4.8, p_l=6.9e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 32% 25/78 [02:10<04:36, 5.21s/it, bpd=5.4, g_l=5.4, gn=3.32, l=5.08, p_l=7.02e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 33% 26/78 [02:15<04:30, 5.21s/it, bpd=4.4, g_l=4.4, gn=4.15, l=4.14, p_l=7.19e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 35% 27/78 [02:20<04:25, 5.20s/it, bpd=4.03, g_l=4.03, gn=3.22, l=3.8, p_l=6.86e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 36% 28/78 [02:26<04:19, 5.19s/it, bpd=4.09, g_l=4.09, gn=5.77, l=3.85, p_l=6.57e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 37% 29/78 [02:31<04:14, 5.19s/it, bpd=6.49, g_l=6.49, gn=3.28, l=6.11, p_l=7.02e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 38% 30/78 [02:36<04:08, 5.19s/it, bpd=5.47, g_l=5.47, gn=3.52, l=5.14, p_l=6.88e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 40% 31/78 [02:41<04:03, 5.18s/it, bpd=4.04, g_l=4.04, gn=3.67, l=3.8, p_l=6.45e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 41% 32/78 [02:46<03:58, 5.18s/it, bpd=5.74, g_l=5.74, gn=3.44, l=5.4, p_l=5.97e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 42% 33/78 [02:51<03:53, 5.19s/it, bpd=3.88, g_l=3.88, gn=3.46, l=3.65, p_l=5.8e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 44% 34/78 [02:57<03:47, 5.18s/it, bpd=4.87, g_l=4.87, gn=3.58, l=4.58, p_l=5.97e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 45% 35/78 [03:02<03:42, 5.18s/it, bpd=5.24, g_l=5.24, gn=3.86, l=4.94, p_l=5.81e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 46% 36/78 [03:07<03:37, 5.18s/it, bpd=4.23, g_l=4.23, gn=3.19, l=3.98, p_l=6.2e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 47% 37/78 [03:17<04:35, 6.72s/it, 
bpd=4.38, g_l=4.38, gn=4.05, l=4.12, p_l=7.1e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 49% 38/78 [03:22<04:09, 6.24s/it, bpd=4.38, g_l=4.38, gn=3.49, l=4.12, p_l=8.67e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 50% 39/78 [03:28<03:50, 5.91s/it, bpd=4.68, g_l=4.68, gn=4.47, l=4.41, p_l=1.01e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 51% 40/78 [03:33<03:36, 5.70s/it, bpd=4.14, g_l=4.14, gn=4.25, l=3.89, p_l=1.28e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 53% 41/78 [03:38<03:25, 5.56s/it, bpd=4.09, g_l=4.09, gn=3.1, l=3.85, p_l=1.51e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1905\u001b[0m\n"," 54% 42/78 [04:17<09:19, 15.55s/it, bpd=5.68, g_l=5.68, gn=3.81, l=5.34, p_l=1.65e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 55% 43/78 [04:22<07:14, 12.42s/it, bpd=5.82, g_l=5.82, gn=3.1, l=5.48, p_l=1.63e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 56% 44/78 [04:27<05:46, 10.19s/it, bpd=4.63, g_l=4.63, gn=3.06, l=4.36, p_l=1.59e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 58% 45/78 [04:32<04:45, 8.64s/it, bpd=4.24, g_l=4.24, gn=4.92, l=3.99, p_l=1.69e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 59% 46/78 [04:37<04:02, 7.57s/it, bpd=5.88, g_l=5.88, gn=4.7, l=5.53, p_l=1.85e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 60% 47/78 [04:42<03:32, 6.86s/it, bpd=5.66, g_l=5.66, gn=4.35, l=5.33, p_l=2.25e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 62% 48/78 [04:47<03:09, 6.32s/it, bpd=4.89, g_l=4.89, gn=3.83, l=4.6, p_l=2.87e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 63% 49/78 [04:53<02:53, 5.99s/it, bpd=4.48, g_l=4.48, gn=3.45, l=4.22, p_l=3.61e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 64% 50/78 [04:58<02:40, 5.73s/it, bpd=6.1, g_l=6.1, gn=3.15, l=5.74, p_l=4.18e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 65% 51/78 [05:03<02:30, 5.57s/it, bpd=5.06, g_l=5.06, gn=3.17, l=4.76, p_l=4.52e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 67% 52/78 
[05:08<02:21, 5.45s/it, bpd=4.38, g_l=4.38, gn=3.74, l=4.12, p_l=4.44e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 68% 53/78 [05:13<02:15, 5.41s/it, bpd=3.74, g_l=3.74, gn=8.63, l=3.52, p_l=4.31e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 69% 54/78 [05:19<02:07, 5.33s/it, bpd=4.09, g_l=4.09, gn=4.61, l=3.85, p_l=4.21e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 71% 55/78 [05:24<02:02, 5.32s/it, bpd=3.64, g_l=3.64, gn=4.03, l=3.42, p_l=4.34e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 72% 56/78 [05:29<01:56, 5.30s/it, bpd=4.33, g_l=4.33, gn=4.45, l=4.08, p_l=4.93e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 73% 57/78 [05:34<01:51, 5.31s/it, bpd=4.89, g_l=4.89, gn=3.72, l=4.6, p_l=5.36e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 74% 58/78 [05:40<01:45, 5.28s/it, bpd=4.52, g_l=4.52, gn=3.53, l=4.25, p_l=6.73e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 76% 59/78 [05:45<01:40, 5.30s/it, bpd=4.84, g_l=4.84, gn=5.45, l=4.55, p_l=7.97e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 77% 60/78 [05:50<01:35, 5.29s/it, bpd=5.43, g_l=5.43, gn=3.5, l=5.11, p_l=8.5e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 78% 61/78 [05:56<01:29, 5.29s/it, bpd=3.87, g_l=3.87, gn=4.77, l=3.64, p_l=8.52e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 79% 62/78 [06:01<01:24, 5.29s/it, bpd=4.11, g_l=4.11, gn=3.3, l=3.86, p_l=9.1e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 81% 63/78 [06:06<01:19, 5.30s/it, bpd=4.4, g_l=4.4, gn=5.01, l=4.14, p_l=9.16e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 82% 64/78 [06:11<01:14, 5.32s/it, bpd=4.51, g_l=4.51, gn=2.91, l=4.25, p_l=8.9e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 83% 65/78 [06:17<01:08, 5.29s/it, bpd=5.88, g_l=5.88, gn=3.36, l=5.53, p_l=7.21e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 85% 66/78 [06:22<01:03, 5.32s/it, bpd=5.25, g_l=5.25, gn=3.24, l=4.94, p_l=5.73e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 86% 67/78 [06:27<00:58, 5.29s/it, bpd=5.57, g_l=5.57, 
gn=3.36, l=5.24, p_l=4.48e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 87% 68/78 [06:33<00:53, 5.32s/it, bpd=4.19, g_l=4.19, gn=3.21, l=3.94, p_l=3.7e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 88% 69/78 [06:38<00:47, 5.28s/it, bpd=4.97, g_l=4.97, gn=3.37, l=4.68, p_l=3.01e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 90% 70/78 [06:43<00:42, 5.28s/it, bpd=5.38, g_l=5.38, gn=3.26, l=5.06, p_l=2.53e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 91% 71/78 [06:48<00:36, 5.25s/it, bpd=4.38, g_l=4.38, gn=4.65, l=4.12, p_l=2.13e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 92% 72/78 [06:54<00:31, 5.24s/it, bpd=3.88, g_l=3.88, gn=3.38, l=3.65, p_l=1.88e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 94% 73/78 [06:59<00:26, 5.22s/it, bpd=5.55, g_l=5.55, gn=3.36, l=5.22, p_l=1.59e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 95% 74/78 [07:04<00:20, 5.21s/it, bpd=4.02, g_l=4.02, gn=3.82, l=3.79, p_l=1.3e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 96% 75/78 [07:09<00:15, 5.20s/it, bpd=5.17, g_l=5.17, gn=3.24, l=4.86, p_l=1.11e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n","100% 78/78 [07:25<00:00, 5.71s/it, bpd=5.56, g_l=5.56, gn=3.27, l=5.24, p_l=8.76e-7]\n","Train bpd: 4.7850 prime_loss: 0.0000 gen_loss: 4.7850 loss: 4.5035 gn: 3.9676 lr: 0.0003 lg_loss_scale: 14.6060 epoch: 23.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:1941\u001b[0m\n"," 11% 1/9 [00:01<00:15, 1.99s/it, bpd=4.36, l=4.11]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 22% 2/9 [00:03<00:13, 1.89s/it, bpd=5.13, l=4.83]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 33% 3/9 [00:05<00:10, 1.74s/it, bpd=5.13, l=4.83]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 44% 4/9 [00:06<00:08, 1.64s/it, bpd=5.47, l=5.15]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=5.12, 
l=4.82]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=5, l=4.7]/content/gdrive/MyDrive/slon/slon (5).txt\n","100% 9/9 [00:13<00:00, 1.51s/it, bpd=4.96, l=4.67]\n","Ema bpd: 4.9786 prime_loss: 0.0144 gen_loss: 4.9786 loss: 4.6861 epoch: 23.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (24).txt\n","/content/gdrive/MyDrive/slon/slon (11).txt\n","/content/gdrive/MyDrive/slon/slon (32).txt\n"," 1% 1/78 [00:05<07:04, 5.51s/it, bpd=5.42, g_l=5.42, gn=3.36, l=5.1, p_l=8.32e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 3% 2/78 [00:10<06:51, 5.42s/it, bpd=4.15, g_l=4.15, gn=5.14, l=3.91, p_l=7.22e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 4% 3/78 [00:15<06:43, 5.37s/it, bpd=4.72, g_l=4.72, gn=4.49, l=4.44, p_l=5.15e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 5% 4/78 [00:21<06:34, 5.33s/it, bpd=5.04, g_l=5.04, gn=3.87, l=4.75, p_l=3.62e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 6% 5/78 [00:26<06:27, 5.31s/it, bpd=4.15, g_l=4.15, gn=3.78, l=3.91, p_l=3.26e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 8% 6/78 [00:31<06:20, 5.29s/it, bpd=3.84, g_l=3.84, gn=6.44, l=3.62, p_l=3.12e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 9% 7/78 [00:36<06:13, 5.26s/it, bpd=4.31, g_l=4.31, gn=3.19, l=4.06, p_l=3.19e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 10% 8/78 [00:42<06:07, 5.25s/it, bpd=4.1, g_l=4.1, gn=4.84, l=3.86, p_l=3.49e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 12% 9/78 [00:47<06:01, 5.24s/it, bpd=3.65, g_l=3.65, gn=3.6, l=3.44, p_l=3.67e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 13% 10/78 [00:52<05:54, 5.22s/it, bpd=3.79, g_l=3.79, gn=4.51, l=3.57, p_l=3.81e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 14% 11/78 [00:57<05:49, 5.22s/it, bpd=4.48, g_l=4.48, gn=4.03, l=4.21, p_l=3.96e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 15% 12/78 [01:02<05:43, 5.20s/it, bpd=4.7, g_l=4.7, gn=3.19, l=4.42, p_l=3.99e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 17% 
13/78 [01:08<05:38, 5.20s/it, bpd=4.52, g_l=4.52, gn=3.16, l=4.26, p_l=4.02e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 18% 14/78 [01:13<05:31, 5.19s/it, bpd=4.55, g_l=4.55, gn=3.6, l=4.28, p_l=4.28e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 19% 15/78 [01:18<05:27, 5.20s/it, bpd=4.15, g_l=4.15, gn=3.91, l=3.9, p_l=4.53e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 21% 16/78 [01:23<05:21, 5.19s/it, bpd=5.46, g_l=5.46, gn=3.86, l=5.14, p_l=5.38e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 22% 17/78 [01:28<05:17, 5.20s/it, bpd=5.73, g_l=5.73, gn=2.99, l=5.39, p_l=7.09e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 23% 18/78 [01:34<05:11, 5.19s/it, bpd=5.76, g_l=5.76, gn=3.4, l=5.42, p_l=8.89e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 24% 19/78 [01:39<05:06, 5.20s/it, bpd=4.64, g_l=4.64, gn=3.51, l=4.37, p_l=1.04e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 26% 20/78 [01:44<05:01, 5.20s/it, bpd=4.43, g_l=4.43, gn=4.21, l=4.17, p_l=1.18e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 27% 21/78 [01:49<04:56, 5.21s/it, bpd=3.97, g_l=3.97, gn=6.21, l=3.74, p_l=1.33e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 28% 22/78 [01:54<04:51, 5.21s/it, bpd=4.19, g_l=4.19, gn=4.41, l=3.94, p_l=1.43e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 29% 23/78 [02:00<04:47, 5.22s/it, bpd=5.32, g_l=5.32, gn=3.96, l=5, p_l=1.36e-6]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 31% 24/78 [02:05<04:42, 5.22s/it, bpd=4.17, g_l=4.17, gn=3.87, l=3.92, p_l=1.31e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 32% 25/78 [02:10<04:37, 5.23s/it, bpd=4.13, g_l=4.13, gn=3.71, l=3.88, p_l=1.21e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 33% 26/78 [02:15<04:31, 5.22s/it, bpd=5.22, g_l=5.22, gn=3.39, l=4.91, p_l=1.25e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 35% 27/78 [02:20<04:25, 5.21s/it, bpd=4.05, g_l=4.05, gn=4.09, l=3.81, p_l=1.32e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 36% 28/78 [02:26<04:19, 5.19s/it, bpd=3.72, 
g_l=3.72, gn=3.46, l=3.51, p_l=1.46e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 37% 29/78 [02:31<04:14, 5.19s/it, bpd=4.35, g_l=4.35, gn=4.75, l=4.09, p_l=1.57e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 38% 30/78 [02:36<04:08, 5.18s/it, bpd=5.59, g_l=5.59, gn=4.51, l=5.26, p_l=1.63e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 40% 31/78 [02:41<04:03, 5.18s/it, bpd=5.87, g_l=5.87, gn=4.34, l=5.53, p_l=1.64e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 41% 32/78 [02:46<03:58, 5.18s/it, bpd=3.97, g_l=3.97, gn=4.53, l=3.73, p_l=1.55e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 42% 33/78 [02:52<03:52, 5.17s/it, bpd=4.06, g_l=4.06, gn=3.28, l=3.82, p_l=1.58e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 44% 34/78 [02:57<03:48, 5.18s/it, bpd=5.28, g_l=5.28, gn=3.22, l=4.97, p_l=1.64e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 45% 35/78 [03:02<03:42, 5.18s/it, bpd=4.4, g_l=4.4, gn=4.27, l=4.14, p_l=1.58e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 46% 36/78 [03:07<03:37, 5.19s/it, bpd=3.56, g_l=3.56, gn=3.33, l=3.35, p_l=1.55e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 47% 37/78 [03:12<03:32, 5.18s/it, bpd=5.62, g_l=5.62, gn=3.77, l=5.29, p_l=1.48e-6]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 49% 38/78 [03:17<03:27, 5.20s/it, bpd=4.28, g_l=4.28, gn=4.75, l=4.03, p_l=1.47e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 50% 39/78 [03:23<03:22, 5.20s/it, bpd=4.19, g_l=4.19, gn=3.41, l=3.94, p_l=1.39e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 51% 40/78 [03:28<03:18, 5.22s/it, bpd=4.64, g_l=4.64, gn=3.58, l=4.36, p_l=1.3e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 53% 41/78 [03:33<03:12, 5.21s/it, bpd=4.02, g_l=4.02, gn=3.87, l=3.78, p_l=1.28e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 54% 42/78 [03:38<03:08, 5.23s/it, bpd=4.99, g_l=4.99, gn=4.77, l=4.7, p_l=1.25e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 55% 43/78 [03:44<03:02, 5.22s/it, bpd=4.38, g_l=4.38, gn=3.48, l=4.12, 
p_l=1.16e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 56% 44/78 [03:49<02:57, 5.23s/it, bpd=4.62, g_l=4.62, gn=3.35, l=4.34, p_l=1.11e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 58% 45/78 [03:54<02:52, 5.23s/it, bpd=4.16, g_l=4.16, gn=3.77, l=3.92, p_l=1.11e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 59% 46/78 [03:59<02:47, 5.22s/it, bpd=5.07, g_l=5.07, gn=3.27, l=4.77, p_l=1.17e-6]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 60% 47/78 [04:05<02:41, 5.22s/it, bpd=3.88, g_l=3.88, gn=4.03, l=3.66, p_l=1.11e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 62% 48/78 [04:10<02:36, 5.21s/it, bpd=4.07, g_l=4.07, gn=4.05, l=3.83, p_l=1.12e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 63% 49/78 [04:15<02:30, 5.21s/it, bpd=4.26, g_l=4.26, gn=4.68, l=4.01, p_l=1.22e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 64% 50/78 [04:20<02:25, 5.20s/it, bpd=4.6, g_l=4.6, gn=5.24, l=4.33, p_l=1.29e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 65% 51/78 [04:25<02:20, 5.19s/it, bpd=4.08, g_l=4.08, gn=3.34, l=3.84, p_l=1.33e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 67% 52/78 [04:30<02:14, 5.19s/it, bpd=5.19, g_l=5.19, gn=3.47, l=4.89, p_l=1.24e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 68% 53/78 [04:36<02:09, 5.19s/it, bpd=4.61, g_l=4.61, gn=3.64, l=4.33, p_l=1.16e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 69% 54/78 [04:41<02:04, 5.19s/it, bpd=4.35, g_l=4.35, gn=3.42, l=4.09, p_l=1.05e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 71% 55/78 [04:46<01:59, 5.20s/it, bpd=5.87, g_l=5.87, gn=3.55, l=5.53, p_l=9.07e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 72% 56/78 [04:51<01:54, 5.20s/it, bpd=3.83, g_l=3.83, gn=3.7, l=3.61, p_l=7.64e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 73% 57/78 [04:56<01:49, 5.21s/it, bpd=4.39, g_l=4.39, gn=3.77, l=4.13, p_l=6.85e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 74% 58/78 [05:02<01:44, 5.20s/it, bpd=5.27, g_l=5.27, gn=3.18, l=4.96, 
p_l=6.63e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 76% 59/78 [05:12<02:08, 6.75s/it, bpd=4.25, g_l=4.25, gn=3.14, l=4, p_l=6.66e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 77% 60/78 [05:17<01:52, 6.27s/it, bpd=4.27, g_l=4.27, gn=3.61, l=4.01, p_l=6.59e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 78% 61/78 [05:22<01:41, 5.94s/it, bpd=5.67, g_l=5.67, gn=3.65, l=5.33, p_l=6.52e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 79% 62/78 [05:28<01:31, 5.72s/it, bpd=5.61, g_l=5.61, gn=4.21, l=5.28, p_l=6.21e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 81% 63/78 [05:33<01:23, 5.58s/it, bpd=4.39, g_l=4.39, gn=4.02, l=4.13, p_l=5.51e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 82% 64/78 [05:38<01:16, 5.49s/it, bpd=3.75, g_l=3.75, gn=3.31, l=3.53, p_l=4.57e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 83% 65/78 [05:43<01:10, 5.42s/it, bpd=4.95, g_l=4.95, gn=3.52, l=4.66, p_l=3.82e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 85% 66/78 [05:49<01:04, 5.37s/it, bpd=4.4, g_l=4.4, gn=4.49, l=4.14, p_l=3.47e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 86% 67/78 [05:54<00:58, 5.33s/it, bpd=4.4, g_l=4.4, gn=3.9, l=4.14, p_l=3.05e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 87% 68/78 [05:59<00:53, 5.30s/it, bpd=6.27, g_l=6.27, gn=3.17, l=5.9, p_l=2.84e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 88% 69/78 [06:04<00:47, 5.27s/it, bpd=4.06, g_l=4.06, gn=3.1, l=3.83, p_l=2.62e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 90% 70/78 [06:09<00:41, 5.24s/it, bpd=6.23, g_l=6.23, gn=3.17, l=5.86, p_l=2.56e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 91% 71/78 [06:15<00:36, 5.22s/it, bpd=4.14, g_l=4.14, gn=3.48, l=3.89, p_l=2.39e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 92% 72/78 [06:20<00:31, 5.20s/it, bpd=4.45, g_l=4.45, gn=4.3, l=4.19, p_l=2.31e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 94% 73/78 [06:25<00:25, 5.18s/it, bpd=5.46, g_l=5.46, gn=3.16, l=5.14, p_l=2.33e-7]/content/gdrive/MyDrive/slon/slon 
(30).txt\n"," 95% 74/78 [06:30<00:20, 5.18s/it, bpd=4.17, g_l=4.17, gn=3.15, l=3.93, p_l=2.18e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 96% 75/78 [06:35<00:15, 5.18s/it, bpd=5.52, g_l=5.52, gn=3.86, l=5.2, p_l=2.17e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n","100% 78/78 [06:51<00:00, 5.28s/it, bpd=4.93, g_l=4.93, gn=3.19, l=4.64, p_l=2.54e-7]\n","Train bpd: 4.6199 prime_loss: 0.0000 gen_loss: 4.6199 loss: 4.3481 gn: 3.8646 lr: 0.0003 lg_loss_scale: 14.9180 epoch: 24.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2019\u001b[0m\n"," 11% 1/9 [00:01<00:15, 1.89s/it, bpd=4.85, l=4.57]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 22% 2/9 [00:03<00:13, 1.91s/it, bpd=5.67, l=5.34]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:05<00:10, 1.75s/it, bpd=4.79, l=4.51]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 44% 4/9 [00:06<00:08, 1.65s/it, bpd=4.86, l=4.57]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:08<00:06, 1.57s/it, bpd=4.95, l=4.66]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=4.33, l=4.08]/content/gdrive/MyDrive/slon/slon (6).txt\n","100% 9/9 [00:13<00:00, 1.53s/it, bpd=5, l=4.71]\n","Ema bpd: 4.9389 prime_loss: 0.0141 gen_loss: 4.9389 loss: 4.6487 epoch: 24.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (24).txt\n","/content/gdrive/MyDrive/slon/slon (14).txt\n","/content/gdrive/MyDrive/slon/slon (24).txt\n"," 1% 1/78 [00:05<07:00, 5.46s/it, bpd=5.89, g_l=5.89, gn=2.94, l=5.54, p_l=2.69e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 3% 2/78 [00:10<06:49, 5.38s/it, bpd=5.21, g_l=5.21, gn=3.52, l=4.91, p_l=2.72e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 4% 3/78 [00:15<06:41, 5.35s/it, bpd=5.29, g_l=5.29, gn=3.03, l=4.97, p_l=2.85e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 5% 4/78 
[00:21<06:33, 5.32s/it, bpd=4.93, g_l=4.93, gn=4.65, l=4.64, p_l=2.95e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 6% 5/78 [00:26<06:27, 5.31s/it, bpd=4.86, g_l=4.86, gn=3.57, l=4.57, p_l=3.02e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 8% 6/78 [00:31<06:21, 5.29s/it, bpd=4.42, g_l=4.42, gn=3.54, l=4.16, p_l=3.07e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 9% 7/78 [00:37<06:15, 5.29s/it, bpd=3.92, g_l=3.92, gn=3.25, l=3.69, p_l=3.14e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 10% 8/78 [00:42<06:08, 5.26s/it, bpd=4.44, g_l=4.44, gn=2.98, l=4.18, p_l=3.11e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 12% 9/78 [00:47<06:02, 5.25s/it, bpd=4.38, g_l=4.38, gn=3.73, l=4.12, p_l=2.96e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 13% 10/78 [00:52<05:55, 5.23s/it, bpd=4.09, g_l=4.09, gn=4.46, l=3.85, p_l=2.77e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 14% 11/78 [00:57<05:49, 5.22s/it, bpd=4.68, g_l=4.68, gn=3.07, l=4.41, p_l=2.51e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 15% 12/78 [01:02<05:43, 5.20s/it, bpd=4.2, g_l=4.2, gn=3.26, l=3.95, p_l=2.24e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 17% 13/78 [01:08<05:37, 5.19s/it, bpd=2.95, g_l=2.95, gn=4.36, l=2.78, p_l=2.13e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 18% 14/78 [01:13<05:31, 5.18s/it, bpd=3.69, g_l=3.69, gn=3.18, l=3.48, p_l=2.09e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 19% 15/78 [01:18<05:25, 5.17s/it, bpd=4.12, g_l=4.12, gn=3.53, l=3.88, p_l=2.24e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 21% 16/78 [01:23<05:21, 5.18s/it, bpd=5.31, g_l=5.31, gn=3.25, l=5, p_l=2.5e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 22% 17/78 [01:28<05:15, 5.18s/it, bpd=3.61, g_l=3.61, gn=6.11, l=3.4, p_l=2.9e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 23% 18/78 [01:33<05:10, 5.18s/it, bpd=4.5, g_l=4.5, gn=3.86, l=4.24, p_l=3.25e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 24% 19/78 [01:39<05:05, 5.18s/it, bpd=3.02, g_l=3.02, gn=3.8, 
l=2.85, p_l=3.22e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 26% 20/78 [01:44<05:00, 5.19s/it, bpd=3.79, g_l=3.79, gn=3.29, l=3.56, p_l=3.19e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 27% 21/78 [01:49<04:55, 5.19s/it, bpd=3.4, g_l=3.4, gn=3.33, l=3.2, p_l=3.35e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 28% 22/78 [01:54<04:51, 5.21s/it, bpd=5.15, g_l=5.15, gn=3.27, l=4.85, p_l=3.62e-7]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 29% 23/78 [01:59<04:45, 5.20s/it, bpd=4.37, g_l=4.37, gn=4.87, l=4.11, p_l=4.04e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 31% 24/78 [02:05<04:41, 5.21s/it, bpd=3.95, g_l=3.95, gn=6.12, l=3.72, p_l=4.58e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 32% 25/78 [02:10<04:35, 5.21s/it, bpd=5.6, g_l=5.6, gn=4.27, l=5.27, p_l=5.14e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 33% 26/78 [02:15<04:31, 5.22s/it, bpd=4.07, g_l=4.07, gn=3.09, l=3.83, p_l=5.63e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 35% 27/78 [02:20<04:25, 5.21s/it, bpd=4.64, g_l=4.64, gn=6.9, l=4.36, p_l=5.88e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 36% 28/78 [02:26<04:20, 5.21s/it, bpd=3.81, g_l=3.81, gn=3.25, l=3.59, p_l=6.36e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 37% 29/78 [02:31<04:14, 5.20s/it, bpd=3.86, g_l=3.86, gn=3.55, l=3.63, p_l=7.06e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 38% 30/78 [02:36<04:09, 5.20s/it, bpd=3.83, g_l=3.83, gn=3.12, l=3.61, p_l=8.01e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 40% 31/78 [02:41<04:03, 5.19s/it, bpd=4.08, g_l=4.08, gn=3.03, l=3.84, p_l=9.53e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 41% 32/78 [02:46<03:58, 5.19s/it, bpd=5.54, g_l=5.54, gn=3.73, l=5.22, p_l=1.08e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 42% 33/78 [02:51<03:53, 5.18s/it, bpd=5.04, g_l=5.04, gn=3.26, l=4.74, p_l=1.18e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 44% 34/78 [02:57<03:48, 5.19s/it, bpd=4.61, g_l=4.61, gn=3.74, l=4.34, 
p_l=1.19e-6]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 45% 35/78 [03:02<03:42, 5.18s/it, bpd=5.02, g_l=5.02, gn=3.25, l=4.72, p_l=1.14e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 46% 36/78 [03:07<03:38, 5.19s/it, bpd=4.25, g_l=4.25, gn=3.6, l=4, p_l=1.13e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 47% 37/78 [03:12<03:32, 5.19s/it, bpd=5.15, g_l=5.15, gn=4.32, l=4.85, p_l=1.16e-6]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 49% 38/78 [03:17<03:27, 5.20s/it, bpd=5.38, g_l=5.38, gn=3.07, l=5.07, p_l=1.16e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 50% 39/78 [03:23<03:22, 5.19s/it, bpd=6.02, g_l=6.02, gn=3.33, l=5.67, p_l=1.22e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 51% 40/78 [03:28<03:17, 5.20s/it, bpd=3.49, g_l=3.49, gn=5.16, l=3.28, p_l=1.21e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 53% 41/78 [03:33<03:12, 5.20s/it, bpd=4.19, g_l=4.19, gn=3.6, l=3.94, p_l=1.22e-6]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 54% 42/78 [03:38<03:07, 5.21s/it, bpd=4.84, g_l=4.84, gn=3.53, l=4.55, p_l=1.28e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 55% 43/78 [03:43<03:02, 5.21s/it, bpd=4.81, g_l=4.81, gn=3.94, l=4.53, p_l=1.26e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 56% 44/78 [03:49<02:57, 5.22s/it, bpd=5.13, g_l=5.13, gn=3.78, l=4.83, p_l=1.22e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 58% 45/78 [03:54<02:51, 5.21s/it, bpd=4.7, g_l=4.7, gn=4.85, l=4.43, p_l=1.2e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 59% 46/78 [03:59<02:46, 5.22s/it, bpd=4.43, g_l=4.43, gn=3.15, l=4.17, p_l=1.2e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 60% 47/78 [04:04<02:41, 5.22s/it, bpd=4.55, g_l=4.55, gn=4.13, l=4.28, p_l=1.17e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 62% 48/78 [04:10<02:36, 5.22s/it, bpd=3.57, g_l=3.57, gn=4.02, l=3.36, p_l=1.19e-6]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 63% 49/78 [04:15<02:31, 5.21s/it, bpd=4.46, g_l=4.46, gn=3.61, l=4.2, p_l=1.24e-6]/content/gdrive/MyDrive/slon/slon 
(21).txt\n"," 64% 50/78 [04:20<02:25, 5.21s/it, bpd=5.2, g_l=5.2, gn=4.22, l=4.89, p_l=1.28e-6]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 65% 51/78 [04:25<02:20, 5.21s/it, bpd=3.73, g_l=3.73, gn=4.41, l=3.51, p_l=1.27e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 67% 52/78 [04:30<02:15, 5.21s/it, bpd=5.31, g_l=5.31, gn=3.54, l=4.99, p_l=1.23e-6]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 68% 53/78 [04:36<02:10, 5.21s/it, bpd=5.9, g_l=5.9, gn=3.27, l=5.55, p_l=1.16e-6]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 69% 54/78 [04:41<02:05, 5.21s/it, bpd=4.04, g_l=4.04, gn=3.39, l=3.8, p_l=1.05e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 71% 55/78 [04:46<01:59, 5.21s/it, bpd=4.08, g_l=4.08, gn=3.64, l=3.84, p_l=9.25e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 72% 56/78 [04:51<01:54, 5.20s/it, bpd=4.14, g_l=4.14, gn=3.96, l=3.9, p_l=8.89e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 73% 57/78 [04:56<01:49, 5.20s/it, bpd=4.5, g_l=4.5, gn=3.21, l=4.23, p_l=9.15e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 74% 58/78 [05:02<01:43, 5.20s/it, bpd=3.99, g_l=3.99, gn=3.76, l=3.75, p_l=1.06e-6]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 76% 59/78 [05:07<01:38, 5.20s/it, bpd=4.45, g_l=4.45, gn=4.29, l=4.19, p_l=1.4e-6]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 77% 60/78 [05:12<01:33, 5.20s/it, bpd=4.52, g_l=4.52, gn=4.59, l=4.25, p_l=1.63e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 78% 61/78 [05:17<01:28, 5.20s/it, bpd=4.41, g_l=4.41, gn=4.16, l=4.15, p_l=1.78e-6]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 79% 62/78 [05:22<01:23, 5.20s/it, bpd=4.16, g_l=4.16, gn=3.45, l=3.91, p_l=1.95e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 81% 63/78 [05:28<01:18, 5.20s/it, bpd=4.97, g_l=4.97, gn=3.58, l=4.68, p_l=2.1e-6]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 82% 64/78 [05:33<01:12, 5.20s/it, bpd=4.65, g_l=4.65, gn=3.64, l=4.38, p_l=2.13e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 83% 65/78 [05:38<01:07, 
5.21s/it, bpd=6.25, g_l=6.25, gn=3.48, l=5.88, p_l=2.02e-6]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 85% 66/78 [05:43<01:02, 5.21s/it, bpd=5.79, g_l=5.79, gn=3.24, l=5.45, p_l=1.97e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 86% 67/78 [05:49<00:57, 5.22s/it, bpd=6, g_l=6, gn=2.88, l=5.64, p_l=2.06e-6]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 87% 68/78 [05:54<00:52, 5.21s/it, bpd=5.01, g_l=5.01, gn=3.51, l=4.71, p_l=1.91e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 88% 69/78 [05:59<00:46, 5.22s/it, bpd=4.48, g_l=4.48, gn=4.03, l=4.22, p_l=1.8e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 90% 70/78 [06:04<00:41, 5.21s/it, bpd=5.42, g_l=5.42, gn=3.58, l=5.1, p_l=1.59e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 91% 71/78 [06:09<00:36, 5.22s/it, bpd=3.82, g_l=3.82, gn=3.15, l=3.6, p_l=1.28e-6]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 92% 72/78 [06:15<00:31, 5.21s/it, bpd=5.69, g_l=5.69, gn=4.25, l=5.36, p_l=1.09e-6]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 94% 73/78 [06:20<00:26, 5.21s/it, bpd=4.36, g_l=4.36, gn=3.48, l=4.11, p_l=8.97e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 95% 74/78 [06:25<00:20, 5.21s/it, bpd=4.92, g_l=4.92, gn=3.16, l=4.63, p_l=7.47e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 96% 75/78 [06:30<00:15, 5.22s/it, bpd=5.46, g_l=5.46, gn=3.61, l=5.14, p_l=5.98e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n","100% 78/78 [06:46<00:00, 5.21s/it, bpd=4.43, g_l=4.43, gn=3.8, l=4.17, p_l=4.31e-7]\n","Train bpd: 4.5751 prime_loss: 0.0000 gen_loss: 4.5751 loss: 4.3060 gn: 3.7577 lr: 0.0003 lg_loss_scale: 15.2300 epoch: 25.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (6).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2097\u001b[0m\n"," 11% 1/9 [00:01<00:15, 1.90s/it, bpd=4.55, l=4.29]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:12, 1.78s/it, bpd=4.55, 
l=4.28]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:05<00:10, 1.74s/it, bpd=5.33, l=5.01]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 4/9 [00:06<00:08, 1.63s/it, bpd=5.17, l=4.86]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 56% 5/9 [00:07<00:06, 1.56s/it, bpd=4.54, l=4.27]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 67% 6/9 [00:09<00:04, 1.51s/it, bpd=5.03, l=4.74]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.51s/it, bpd=4.75, l=4.47]\n","Ema bpd: 4.7531 prime_loss: 0.0141 gen_loss: 4.7531 loss: 4.4738 epoch: 25.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (25).txt\n","/content/gdrive/MyDrive/slon/slon (16).txt\n","/content/gdrive/MyDrive/slon/slon (14).txt\n"," 1% 1/78 [00:05<07:02, 5.49s/it, bpd=4.75, g_l=4.75, gn=4.52, l=4.47, p_l=4.38e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 3% 2/78 [00:10<06:51, 5.41s/it, bpd=4.78, g_l=4.78, gn=3.36, l=4.5, p_l=4.45e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 4% 3/78 [00:21<08:35, 6.87s/it, bpd=5.63, g_l=5.63, gn=3.71, l=5.29, p_l=4.8e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 5% 4/78 [00:26<07:52, 6.38s/it, bpd=6.08, g_l=6.08, gn=3.32, l=5.72, p_l=4.79e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 6% 5/78 [00:31<07:20, 6.03s/it, bpd=4.52, g_l=4.52, gn=3.14, l=4.25, p_l=4.97e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 8% 6/78 [00:36<06:57, 5.80s/it, bpd=4.08, g_l=4.08, gn=3.37, l=3.84, p_l=5.12e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 9% 7/78 [00:41<06:39, 5.63s/it, bpd=5, g_l=5, gn=3.49, l=4.71, p_l=5.24e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 10% 8/78 [00:47<06:26, 5.52s/it, bpd=4.6, g_l=4.6, gn=3.97, l=4.33, p_l=5.55e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 12% 9/78 [00:52<06:14, 5.42s/it, bpd=4.08, g_l=4.08, gn=4.28, l=3.84, p_l=6.21e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 13% 10/78 [00:57<06:04, 5.36s/it, bpd=4.96, g_l=4.96, gn=3.27, l=4.67, 
p_l=7.11e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [01:02<05:55, 5.30s/it, bpd=4.36, g_l=4.36, gn=3.51, l=4.11, p_l=7.03e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 15% 12/78 [01:07<05:47, 5.27s/it, bpd=3.51, g_l=3.51, gn=3.59, l=3.3, p_l=6.89e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 17% 13/78 [01:13<05:40, 5.24s/it, bpd=3.91, g_l=3.91, gn=2.98, l=3.68, p_l=6.72e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 18% 14/78 [01:18<05:33, 5.22s/it, bpd=4.34, g_l=4.34, gn=4.9, l=4.08, p_l=6.44e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 19% 15/78 [01:23<05:27, 5.20s/it, bpd=5.25, g_l=5.25, gn=4.13, l=4.94, p_l=5.53e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 21% 16/78 [01:28<05:21, 5.19s/it, bpd=5.51, g_l=5.51, gn=3.16, l=5.19, p_l=4.6e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 22% 17/78 [01:33<05:15, 5.18s/it, bpd=4.14, g_l=4.14, gn=4.01, l=3.9, p_l=3.93e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 23% 18/78 [01:38<05:10, 5.17s/it, bpd=4.14, g_l=4.14, gn=3.19, l=3.89, p_l=3.42e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 24% 19/78 [01:44<05:05, 5.17s/it, bpd=4.45, g_l=4.45, gn=4.72, l=4.19, p_l=3.12e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 26% 20/78 [01:49<04:59, 5.17s/it, bpd=4.11, g_l=4.11, gn=3.34, l=3.86, p_l=3.07e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 27% 21/78 [01:54<04:55, 5.18s/it, bpd=4.34, g_l=4.34, gn=3.2, l=4.08, p_l=3.09e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 28% 22/78 [01:59<04:49, 5.17s/it, bpd=5.1, g_l=5.1, gn=4.21, l=4.8, p_l=3.39e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 29% 23/78 [02:04<04:45, 5.18s/it, bpd=5.34, g_l=5.34, gn=3.18, l=5.03, p_l=3.52e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 31% 24/78 [02:09<04:39, 5.17s/it, bpd=3.98, g_l=3.98, gn=5.74, l=3.74, p_l=3.51e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 32% 25/78 [02:15<04:34, 5.19s/it, bpd=4.59, g_l=4.59, gn=3.72, l=4.32, 
p_l=3.51e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 33% 26/78 [02:20<04:29, 5.19s/it, bpd=5.02, g_l=5.02, gn=3.18, l=4.72, p_l=3.2e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 35% 27/78 [02:25<04:25, 5.20s/it, bpd=4.24, g_l=4.24, gn=3.23, l=3.99, p_l=2.82e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 36% 28/78 [02:30<04:19, 5.19s/it, bpd=4.19, g_l=4.19, gn=3.55, l=3.95, p_l=2.64e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 37% 29/78 [02:36<04:14, 5.20s/it, bpd=4.07, g_l=4.07, gn=3.46, l=3.83, p_l=2.46e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 38% 30/78 [02:41<04:09, 5.20s/it, bpd=5.29, g_l=5.29, gn=3.75, l=4.97, p_l=2.25e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 40% 31/78 [02:46<04:04, 5.21s/it, bpd=4.39, g_l=4.39, gn=3.54, l=4.13, p_l=2.08e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 41% 32/78 [02:51<03:59, 5.20s/it, bpd=6.09, g_l=6.09, gn=3.48, l=5.73, p_l=1.97e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 42% 33/78 [02:56<03:54, 5.21s/it, bpd=4.05, g_l=4.05, gn=4.26, l=3.81, p_l=1.89e-7]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 34/78 [03:02<03:48, 5.20s/it, bpd=3.85, g_l=3.85, gn=3.64, l=3.63, p_l=1.82e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 45% 35/78 [03:07<03:43, 5.21s/it, bpd=4.2, g_l=4.2, gn=4.11, l=3.95, p_l=1.76e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 46% 36/78 [03:12<03:38, 5.20s/it, bpd=5.21, g_l=5.21, gn=3.77, l=4.9, p_l=1.57e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 47% 37/78 [03:17<03:33, 5.20s/it, bpd=3.89, g_l=3.89, gn=4.06, l=3.66, p_l=1.31e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 49% 38/78 [03:22<03:28, 5.20s/it, bpd=3.61, g_l=3.61, gn=4.12, l=3.4, p_l=1.05e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 50% 39/78 [03:28<03:23, 5.21s/it, bpd=5.01, g_l=5.01, gn=3.1, l=4.71, p_l=8.87e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 51% 40/78 [03:33<03:17, 5.20s/it, bpd=3.96, g_l=3.96, gn=3.17, l=3.72, 
p_l=7.79e-8]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 53% 41/78 [03:38<03:12, 5.21s/it, bpd=4.22, g_l=4.22, gn=3.18, l=3.97, p_l=7.88e-8]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 54% 42/78 [03:43<03:07, 5.20s/it, bpd=4.35, g_l=4.35, gn=3.74, l=4.1, p_l=8.73e-8]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 55% 43/78 [03:48<03:02, 5.20s/it, bpd=5.67, g_l=5.67, gn=3.33, l=5.34, p_l=9.94e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 56% 44/78 [03:54<02:56, 5.20s/it, bpd=5.2, g_l=5.2, gn=3.62, l=4.9, p_l=1.08e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 58% 45/78 [03:59<02:51, 5.20s/it, bpd=3.96, g_l=3.96, gn=3.79, l=3.72, p_l=1.16e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2143\u001b[0m\n"," 59% 46/78 [04:38<08:08, 15.28s/it, bpd=5.22, g_l=5.22, gn=3.09, l=4.91, p_l=1.26e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 60% 47/78 [04:43<06:20, 12.27s/it, bpd=5.38, g_l=5.38, gn=3.38, l=5.06, p_l=1.38e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 62% 48/78 [04:48<05:02, 10.10s/it, bpd=3.32, g_l=3.32, gn=3.32, l=3.12, p_l=1.3e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 63% 49/78 [04:53<04:09, 8.61s/it, bpd=3.74, g_l=3.74, gn=4.45, l=3.52, p_l=1.23e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 64% 50/78 [04:58<03:31, 7.54s/it, bpd=4.44, g_l=4.44, gn=3.63, l=4.18, p_l=1.15e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 65% 51/78 [05:03<03:04, 6.82s/it, bpd=3.83, g_l=3.83, gn=4.33, l=3.61, p_l=1.07e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 67% 52/78 [05:08<02:43, 6.29s/it, bpd=3.27, g_l=3.27, gn=3.42, l=3.08, p_l=1.03e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 68% 53/78 [05:13<02:28, 5.96s/it, bpd=4.53, g_l=4.53, gn=3.43, l=4.26, p_l=1.07e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 69% 54/78 [05:19<02:16, 5.70s/it, bpd=4.16, g_l=4.16, gn=3.07, l=3.91, p_l=1.17e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 71% 55/78 [05:24<02:07, 5.55s/it, 
bpd=4.21, g_l=4.21, gn=6.11, l=3.96, p_l=1.31e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 72% 56/78 [05:29<01:59, 5.43s/it, bpd=5.71, g_l=5.71, gn=3.57, l=5.37, p_l=1.41e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 73% 57/78 [05:34<01:52, 5.35s/it, bpd=5.52, g_l=5.52, gn=3.32, l=5.19, p_l=1.63e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 74% 58/78 [05:39<01:46, 5.31s/it, bpd=5.49, g_l=5.49, gn=3.27, l=5.17, p_l=1.7e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 76% 59/78 [05:44<01:40, 5.28s/it, bpd=4.17, g_l=4.17, gn=3.26, l=3.93, p_l=1.66e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 77% 60/78 [05:50<01:34, 5.27s/it, bpd=4.47, g_l=4.47, gn=3.84, l=4.21, p_l=1.51e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 78% 61/78 [05:55<01:29, 5.26s/it, bpd=4.8, g_l=4.8, gn=4.82, l=4.52, p_l=1.31e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 79% 62/78 [06:00<01:24, 5.27s/it, bpd=5.69, g_l=5.69, gn=3.01, l=5.36, p_l=1.15e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 81% 63/78 [06:05<01:18, 5.26s/it, bpd=4.93, g_l=4.93, gn=3.21, l=4.64, p_l=1.05e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 82% 64/78 [06:11<01:13, 5.27s/it, bpd=4.4, g_l=4.4, gn=3.39, l=4.14, p_l=1.01e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 83% 65/78 [06:16<01:08, 5.26s/it, bpd=5.24, g_l=5.24, gn=4.35, l=4.93, p_l=9.67e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 85% 66/78 [06:21<01:03, 5.26s/it, bpd=4.07, g_l=4.07, gn=3.53, l=3.83, p_l=8.69e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 86% 67/78 [06:26<00:57, 5.25s/it, bpd=4.18, g_l=4.18, gn=3.59, l=3.93, p_l=8.11e-8]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 87% 68/78 [06:32<00:52, 5.27s/it, bpd=5.13, g_l=5.13, gn=3.25, l=4.83, p_l=7.84e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 88% 69/78 [06:37<00:47, 5.26s/it, bpd=3.97, g_l=3.97, gn=3.14, l=3.73, p_l=7.79e-8]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 90% 70/78 [06:42<00:42, 5.29s/it, bpd=4.87, g_l=4.87, gn=3.47, l=4.59, 
p_l=7.48e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 91% 71/78 [06:48<00:36, 5.27s/it, bpd=5.03, g_l=5.03, gn=3.08, l=4.73, p_l=6.72e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 92% 72/78 [06:53<00:31, 5.29s/it, bpd=4.8, g_l=4.8, gn=3.75, l=4.52, p_l=6.45e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 94% 73/78 [06:58<00:26, 5.28s/it, bpd=3.36, g_l=3.36, gn=4.42, l=3.16, p_l=6.05e-8]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 95% 74/78 [07:04<00:21, 5.31s/it, bpd=4.56, g_l=4.56, gn=4.2, l=4.29, p_l=5.87e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 96% 75/78 [07:09<00:15, 5.28s/it, bpd=4.47, g_l=4.47, gn=3.19, l=4.21, p_l=6.36e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n","100% 78/78 [07:25<00:00, 5.71s/it, bpd=4.93, g_l=4.93, gn=4.6, l=4.64, p_l=6.49e-8]\n","Train bpd: 4.5645 prime_loss: 0.0000 gen_loss: 4.5645 loss: 4.2960 gn: 3.6813 lr: 0.0003 lg_loss_scale: 15.5420 epoch: 26.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (6).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2175\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.03s/it, bpd=4.72, l=4.44]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 22% 2/9 [00:03<00:13, 1.91s/it, bpd=4.85, l=4.56]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 33% 3/9 [00:05<00:10, 1.75s/it, bpd=5.27, l=4.96]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 44% 4/9 [00:06<00:08, 1.65s/it, bpd=5.19, l=4.88]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=4.99, l=4.7]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=5.94, l=5.59]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=4.41, l=4.15]\n","Ema bpd: 5.1118 prime_loss: 0.0140 gen_loss: 5.1118 loss: 4.8114 epoch: 26.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (4).txt\n","/content/gdrive/MyDrive/slon/slon 
(14).txt\n","/content/gdrive/MyDrive/slon/slon (27).txt\n"," 1% 1/78 [00:05<06:51, 5.35s/it, bpd=4.55, g_l=4.55, gn=3.89, l=4.28, p_l=6.36e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 3% 2/78 [00:10<06:43, 5.32s/it, bpd=5.24, g_l=5.24, gn=2.96, l=4.93, p_l=6.54e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 4% 3/78 [00:15<06:37, 5.29s/it, bpd=4.6, g_l=4.6, gn=3.87, l=4.33, p_l=6.72e-8]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 5% 4/78 [00:21<06:32, 5.30s/it, bpd=4.72, g_l=4.72, gn=4.84, l=4.44, p_l=6.81e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 6% 5/78 [00:26<06:26, 5.30s/it, bpd=4.38, g_l=4.38, gn=4.05, l=4.12, p_l=7.21e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 8% 6/78 [00:31<06:21, 5.30s/it, bpd=5.96, g_l=5.96, gn=4.82, l=5.61, p_l=7.43e-8]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 9% 7/78 [00:37<06:15, 5.28s/it, bpd=6.06, g_l=6.06, gn=4.2, l=5.7, p_l=7.39e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 10% 8/78 [00:42<06:08, 5.27s/it, bpd=4.43, g_l=4.43, gn=3.17, l=4.17, p_l=7.17e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 12% 9/78 [00:47<06:01, 5.24s/it, bpd=4.15, g_l=4.15, gn=4.2, l=3.91, p_l=6.54e-8]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 13% 10/78 [00:52<05:55, 5.22s/it, bpd=4.26, g_l=4.26, gn=3.81, l=4.01, p_l=6.4e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [00:57<05:48, 5.20s/it, bpd=5.01, g_l=5.01, gn=4.14, l=4.72, p_l=5.91e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 15% 12/78 [01:02<05:42, 5.19s/it, bpd=4.52, g_l=4.52, gn=3.77, l=4.25, p_l=5.33e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 17% 13/78 [01:08<05:35, 5.17s/it, bpd=4.03, g_l=4.03, gn=3.98, l=3.8, p_l=4.79e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 18% 14/78 [01:13<05:31, 5.18s/it, bpd=4.89, g_l=4.89, gn=3.4, l=4.6, p_l=4.17e-8]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 19% 15/78 [01:18<05:25, 5.17s/it, bpd=4.17, g_l=4.17, gn=4.33, l=3.92, p_l=3.99e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 
21% 16/78 [01:23<05:21, 5.18s/it, bpd=4.42, g_l=4.42, gn=3.45, l=4.16, p_l=3.99e-8]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 22% 17/78 [01:28<05:16, 5.19s/it, bpd=4.79, g_l=4.79, gn=3.6, l=4.51, p_l=4.21e-8]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 23% 18/78 [01:33<05:11, 5.19s/it, bpd=4.37, g_l=4.37, gn=4.19, l=4.11, p_l=4.61e-8]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 24% 19/78 [01:39<05:06, 5.20s/it, bpd=5.2, g_l=5.2, gn=3.5, l=4.89, p_l=4.79e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 26% 20/78 [01:44<05:01, 5.20s/it, bpd=4.44, g_l=4.44, gn=3.72, l=4.18, p_l=4.97e-8]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 27% 21/78 [01:49<04:56, 5.20s/it, bpd=4.07, g_l=4.07, gn=3.21, l=3.83, p_l=4.61e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 28% 22/78 [01:54<04:51, 5.20s/it, bpd=4.29, g_l=4.29, gn=4.22, l=4.04, p_l=4.3e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 29% 23/78 [02:00<04:46, 5.20s/it, bpd=6.27, g_l=6.27, gn=4.11, l=5.9, p_l=4.03e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 31% 24/78 [02:05<04:40, 5.20s/it, bpd=3.97, g_l=3.97, gn=3.28, l=3.73, p_l=3.9e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 32% 25/78 [02:15<05:55, 6.71s/it, bpd=5.21, g_l=5.21, gn=3.49, l=4.9, p_l=3.76e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 33% 26/78 [02:20<05:24, 6.24s/it, bpd=3.93, g_l=3.93, gn=3.61, l=3.7, p_l=3.81e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 35% 27/78 [02:25<05:01, 5.91s/it, bpd=4.11, g_l=4.11, gn=3.32, l=3.87, p_l=3.9e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 36% 28/78 [02:30<04:45, 5.71s/it, bpd=5.54, g_l=5.54, gn=3.46, l=5.22, p_l=3.94e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 37% 29/78 [02:36<04:32, 5.56s/it, bpd=5.7, g_l=5.7, gn=4.35, l=5.37, p_l=4.21e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 38% 30/78 [02:41<04:22, 5.47s/it, bpd=4.45, g_l=4.45, gn=4.64, l=4.19, p_l=4.12e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 40% 31/78 [02:46<04:13, 5.40s/it, bpd=4.19, 
g_l=4.19, gn=3.68, l=3.94, p_l=4.08e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 41% 32/78 [02:51<04:06, 5.35s/it, bpd=3.96, g_l=3.96, gn=5.79, l=3.73, p_l=4.12e-8]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 42% 33/78 [02:57<03:59, 5.31s/it, bpd=4.91, g_l=4.91, gn=3.36, l=4.62, p_l=4.3e-8]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 44% 34/78 [03:02<03:52, 5.29s/it, bpd=3.68, g_l=3.68, gn=4.09, l=3.47, p_l=5.02e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 45% 35/78 [03:07<03:46, 5.26s/it, bpd=3.46, g_l=3.46, gn=3.08, l=3.26, p_l=5.96e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 46% 36/78 [03:12<03:40, 5.24s/it, bpd=4.98, g_l=4.98, gn=3.21, l=4.69, p_l=6.58e-8]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 47% 37/78 [03:17<03:33, 5.21s/it, bpd=4.62, g_l=4.62, gn=3.45, l=4.35, p_l=6.99e-8]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 49% 38/78 [03:23<03:28, 5.21s/it, bpd=4.66, g_l=4.66, gn=3.66, l=4.38, p_l=7.03e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 50% 39/78 [03:28<03:22, 5.19s/it, bpd=4.92, g_l=4.92, gn=3.79, l=4.63, p_l=7.66e-8]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 51% 40/78 [03:33<03:17, 5.19s/it, bpd=4.36, g_l=4.36, gn=3.35, l=4.1, p_l=8.29e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 53% 41/78 [03:38<03:11, 5.18s/it, bpd=4.14, g_l=4.14, gn=3.64, l=3.9, p_l=9.09e-8]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 54% 42/78 [03:43<03:06, 5.18s/it, bpd=4.96, g_l=4.96, gn=3.69, l=4.67, p_l=9.23e-8]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 55% 43/78 [03:48<03:01, 5.18s/it, bpd=5.36, g_l=5.36, gn=3.08, l=5.04, p_l=9.27e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 56% 44/78 [03:54<02:56, 5.19s/it, bpd=5.83, g_l=5.83, gn=3.42, l=5.48, p_l=9.45e-8]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 58% 45/78 [03:59<02:51, 5.19s/it, bpd=4.32, g_l=4.32, gn=4.16, l=4.06, p_l=9.41e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 59% 46/78 [04:04<02:46, 5.19s/it, bpd=4.2, g_l=4.2, gn=3.61, l=3.95, 
p_l=9.9e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 60% 47/78 [04:09<02:41, 5.20s/it, bpd=5.4, g_l=5.4, gn=2.92, l=5.08, p_l=1.06e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 62% 48/78 [04:15<02:36, 5.20s/it, bpd=3.99, g_l=3.99, gn=3.41, l=3.76, p_l=1.05e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 63% 49/78 [04:20<02:30, 5.20s/it, bpd=4.91, g_l=4.91, gn=3.22, l=4.62, p_l=1.16e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 64% 50/78 [04:25<02:25, 5.20s/it, bpd=5.31, g_l=5.31, gn=3.09, l=5, p_l=1.26e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 65% 51/78 [04:30<02:20, 5.20s/it, bpd=4.07, g_l=4.07, gn=3.04, l=3.83, p_l=1.32e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 67% 52/78 [04:35<02:15, 5.20s/it, bpd=3.91, g_l=3.91, gn=3.6, l=3.68, p_l=1.39e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 68% 53/78 [04:41<02:10, 5.21s/it, bpd=4.11, g_l=4.11, gn=4.07, l=3.87, p_l=1.35e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 69% 54/78 [04:46<02:04, 5.21s/it, bpd=5.02, g_l=5.02, gn=4.27, l=4.72, p_l=1.29e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 71% 55/78 [04:51<01:59, 5.21s/it, bpd=4.18, g_l=4.18, gn=3.35, l=3.94, p_l=1.34e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 72% 56/78 [04:56<01:54, 5.21s/it, bpd=3.2, g_l=3.2, gn=3.65, l=3.01, p_l=1.44e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 73% 57/78 [05:01<01:49, 5.21s/it, bpd=4.62, g_l=4.62, gn=3.03, l=4.35, p_l=1.44e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 74% 58/78 [05:07<01:44, 5.21s/it, bpd=4.09, g_l=4.09, gn=3.04, l=3.84, p_l=1.58e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 76% 59/78 [05:12<01:39, 5.21s/it, bpd=4, g_l=4, gn=3.63, l=3.76, p_l=1.66e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 77% 60/78 [05:17<01:33, 5.21s/it, bpd=4.1, g_l=4.1, gn=4.15, l=3.86, p_l=1.64e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 78% 61/78 [05:22<01:28, 5.21s/it, bpd=5.95, g_l=5.95, gn=2.9, l=5.6, p_l=1.66e-7]/content/gdrive/MyDrive/slon/slon 
(17).txt\n"," 79% 62/78 [05:27<01:23, 5.21s/it, bpd=4.32, g_l=4.32, gn=3.64, l=4.06, p_l=1.56e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 81% 63/78 [05:33<01:18, 5.21s/it, bpd=5.09, g_l=5.09, gn=3.25, l=4.79, p_l=1.5e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 82% 64/78 [05:38<01:12, 5.20s/it, bpd=3.62, g_l=3.62, gn=3.52, l=3.4, p_l=1.46e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 83% 65/78 [05:43<01:07, 5.21s/it, bpd=5.59, g_l=5.59, gn=3.55, l=5.26, p_l=1.53e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 85% 66/78 [05:48<01:02, 5.21s/it, bpd=4.18, g_l=4.18, gn=3.6, l=3.93, p_l=1.72e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 86% 67/78 [05:53<00:57, 5.21s/it, bpd=4.41, g_l=4.41, gn=4.22, l=4.15, p_l=1.77e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 87% 68/78 [05:59<00:51, 5.20s/it, bpd=6.09, g_l=6.09, gn=3.78, l=5.74, p_l=1.92e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 88% 69/78 [06:04<00:46, 5.20s/it, bpd=5.19, g_l=5.19, gn=4.03, l=4.89, p_l=1.87e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 90% 70/78 [06:09<00:41, 5.20s/it, bpd=3.98, g_l=3.98, gn=3.56, l=3.74, p_l=1.63e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 91% 71/78 [06:14<00:36, 5.20s/it, bpd=3.59, g_l=3.59, gn=3.24, l=3.38, p_l=1.49e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 92% 72/78 [06:19<00:31, 5.19s/it, bpd=4.34, g_l=4.34, gn=3.7, l=4.09, p_l=1.32e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 94% 73/78 [06:25<00:25, 5.19s/it, bpd=4.58, g_l=4.58, gn=3.37, l=4.31, p_l=1.33e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 95% 74/78 [06:30<00:20, 5.19s/it, bpd=4.33, g_l=4.33, gn=3.09, l=4.07, p_l=1.45e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 96% 75/78 [06:35<00:15, 5.19s/it, bpd=4.26, g_l=4.26, gn=3.5, l=4.01, p_l=1.53e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n","100% 78/78 [06:51<00:00, 5.27s/it, bpd=5.41, g_l=5.41, gn=3.61, l=5.09, p_l=1.56e-7]\n","Train bpd: 4.6031 prime_loss: 0.0000 gen_loss: 4.6031 loss: 4.3323 
gn: 3.6694 lr: 0.0003 lg_loss_scale: 15.8540 epoch: 27.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2253\u001b[0m\n"," 11% 1/9 [00:02<00:17, 2.16s/it, bpd=4.88, l=4.59]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 22% 2/9 [00:03<00:13, 1.97s/it, bpd=4.93, l=4.64]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 33% 3/9 [00:05<00:10, 1.80s/it, bpd=4.4, l=4.14]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 44% 4/9 [00:06<00:08, 1.68s/it, bpd=5.72, l=5.39]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 56% 5/9 [00:07<00:06, 1.60s/it, bpd=6.13, l=5.77]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.54s/it, bpd=5.4, l=5.09]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.52s/it, bpd=5.03, l=4.73]\n","Ema bpd: 5.2375 prime_loss: 0.0135 gen_loss: 5.2375 loss: 4.9297 epoch: 27.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (28).txt\n","/content/gdrive/MyDrive/slon/slon (23).txt\n","/content/gdrive/MyDrive/slon/slon (26).txt\n"," 1% 1/78 [00:05<06:57, 5.42s/it, bpd=3.1, g_l=3.1, gn=3.33, l=2.92, p_l=1.58e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 3% 2/78 [00:10<06:47, 5.36s/it, bpd=5, g_l=5, gn=3.5, l=4.71, p_l=1.65e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 4% 3/78 [00:15<06:39, 5.33s/it, bpd=4.85, g_l=4.85, gn=3.14, l=4.57, p_l=1.76e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 5% 4/78 [00:21<06:33, 5.31s/it, bpd=4.72, g_l=4.72, gn=3.83, l=4.44, p_l=1.93e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 6% 5/78 [00:26<06:27, 5.30s/it, bpd=5.55, g_l=5.55, gn=3.92, l=5.22, p_l=2.18e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 8% 6/78 [00:31<06:20, 5.29s/it, bpd=4.15, g_l=4.15, gn=3.36, l=3.9, p_l=2.66e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 9% 7/78 [00:36<06:14, 5.27s/it, bpd=3.89, g_l=3.89, gn=3.82, 
l=3.66, p_l=3.16e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 10% 8/78 [00:42<06:07, 5.26s/it, bpd=5.64, g_l=5.64, gn=3.49, l=5.3, p_l=3.29e-7]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 12% 9/78 [00:47<06:00, 5.23s/it, bpd=3.91, g_l=3.91, gn=3.25, l=3.68, p_l=3.45e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 13% 10/78 [00:52<05:54, 5.22s/it, bpd=4.08, g_l=4.08, gn=4.27, l=3.84, p_l=3.49e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 14% 11/78 [00:57<05:47, 5.19s/it, bpd=5.24, g_l=5.24, gn=3.71, l=4.93, p_l=3.22e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 15% 12/78 [01:02<05:42, 5.19s/it, bpd=4.14, g_l=4.14, gn=3.25, l=3.89, p_l=3.36e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 17% 13/78 [01:07<05:36, 5.18s/it, bpd=4.8, g_l=4.8, gn=3.31, l=4.52, p_l=3.55e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 18% 14/78 [01:13<05:31, 5.18s/it, bpd=3.56, g_l=3.56, gn=3.81, l=3.35, p_l=3.81e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 19% 15/78 [01:18<05:26, 5.18s/it, bpd=4.54, g_l=4.54, gn=2.95, l=4.27, p_l=4.01e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 21% 16/78 [01:23<05:21, 5.19s/it, bpd=3.61, g_l=3.61, gn=5.8, l=3.4, p_l=4.33e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 22% 17/78 [01:28<05:16, 5.19s/it, bpd=4.1, g_l=4.1, gn=3.66, l=3.86, p_l=5.41e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 23% 18/78 [01:33<05:12, 5.20s/it, bpd=3.66, g_l=3.66, gn=3.7, l=3.44, p_l=6.45e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 24% 19/78 [01:39<05:07, 5.22s/it, bpd=6.09, g_l=6.09, gn=3.38, l=5.73, p_l=7.52e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 26% 20/78 [01:44<05:03, 5.23s/it, bpd=4.4, g_l=4.4, gn=3.76, l=4.14, p_l=8.45e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 27% 21/78 [01:49<04:57, 5.22s/it, bpd=5.58, g_l=5.58, gn=3.23, l=5.25, p_l=8.33e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 28% 22/78 [01:54<04:53, 5.24s/it, bpd=3.88, g_l=3.88, gn=3.62, l=3.65, 
p_l=8.32e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 29% 23/78 [02:00<04:47, 5.23s/it, bpd=5.17, g_l=5.17, gn=4.7, l=4.86, p_l=7.63e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 31% 24/78 [02:05<04:42, 5.23s/it, bpd=4.51, g_l=4.51, gn=3.43, l=4.24, p_l=7e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 32% 25/78 [02:10<04:36, 5.22s/it, bpd=5.64, g_l=5.64, gn=3.21, l=5.3, p_l=6.48e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 33% 26/78 [02:15<04:31, 5.22s/it, bpd=3.81, g_l=3.81, gn=3.99, l=3.58, p_l=6.28e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 35% 27/78 [02:20<04:25, 5.21s/it, bpd=4.1, g_l=4.1, gn=3.25, l=3.86, p_l=5.85e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 36% 28/78 [02:26<04:20, 5.21s/it, bpd=4.85, g_l=4.85, gn=3.44, l=4.57, p_l=6.08e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 37% 29/78 [02:31<04:14, 5.20s/it, bpd=4.52, g_l=4.52, gn=3.7, l=4.25, p_l=6.1e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 38% 30/78 [02:36<04:09, 5.20s/it, bpd=3.82, g_l=3.82, gn=3.19, l=3.59, p_l=6.15e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 40% 31/78 [02:41<04:03, 5.19s/it, bpd=4.17, g_l=4.17, gn=3.49, l=3.93, p_l=6.57e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 41% 32/78 [02:47<04:01, 5.24s/it, bpd=5.24, g_l=5.24, gn=3.04, l=4.93, p_l=7.49e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 42% 33/78 [02:52<03:54, 5.21s/it, bpd=4.18, g_l=4.18, gn=3.17, l=3.94, p_l=8.53e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 44% 34/78 [02:57<03:48, 5.20s/it, bpd=3.68, g_l=3.68, gn=3, l=3.46, p_l=9.14e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 45% 35/78 [03:02<03:43, 5.19s/it, bpd=3.77, g_l=3.77, gn=3.33, l=3.55, p_l=8.97e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 46% 36/78 [03:07<03:37, 5.19s/it, bpd=4.66, g_l=4.66, gn=3.41, l=4.38, p_l=8.2e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 47% 37/78 [03:12<03:32, 5.18s/it, bpd=4.27, g_l=4.27, gn=4.08, l=4.02, p_l=6.78e-7]/content/gdrive/MyDrive/slon/slon 
(30).txt\n"," 49% 38/78 [03:18<03:27, 5.20s/it, bpd=3.61, g_l=3.61, gn=3.56, l=3.39, p_l=6.1e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 50% 39/78 [03:23<03:22, 5.19s/it, bpd=4.89, g_l=4.89, gn=2.92, l=4.6, p_l=6.06e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 51% 40/78 [03:28<03:17, 5.20s/it, bpd=5.31, g_l=5.31, gn=3.61, l=4.99, p_l=5.61e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 53% 41/78 [03:33<03:12, 5.20s/it, bpd=4.23, g_l=4.23, gn=3.42, l=3.98, p_l=5.77e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 54% 42/78 [03:38<03:07, 5.21s/it, bpd=4.63, g_l=4.63, gn=3.43, l=4.35, p_l=5.69e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 55% 43/78 [03:44<03:02, 5.21s/it, bpd=5.64, g_l=5.64, gn=3.82, l=5.31, p_l=5.2e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 56% 44/78 [03:49<02:57, 5.21s/it, bpd=4.97, g_l=4.97, gn=3.27, l=4.68, p_l=4.89e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 58% 45/78 [03:54<02:52, 5.21s/it, bpd=4.12, g_l=4.12, gn=3.18, l=3.88, p_l=5.1e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 59% 46/78 [03:59<02:46, 5.21s/it, bpd=4.47, g_l=4.47, gn=3.76, l=4.21, p_l=5.14e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 60% 47/78 [04:10<03:29, 6.76s/it, bpd=4.54, g_l=4.54, gn=3.11, l=4.27, p_l=5.11e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 62% 48/78 [04:15<03:08, 6.27s/it, bpd=5.82, g_l=5.82, gn=3.56, l=5.48, p_l=4.81e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 63% 49/78 [04:20<02:52, 5.94s/it, bpd=3.19, g_l=3.19, gn=5.6, l=3, p_l=4.42e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 64% 50/78 [04:25<02:40, 5.72s/it, bpd=3.55, g_l=3.55, gn=3.07, l=3.34, p_l=4.04e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 65% 51/78 [04:30<02:30, 5.57s/it, bpd=5.1, g_l=5.1, gn=3.94, l=4.8, p_l=3.85e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 67% 52/78 [04:36<02:22, 5.46s/it, bpd=4.75, g_l=4.75, gn=3.68, l=4.47, p_l=3.73e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 68% 53/78 [04:41<02:14, 
5.40s/it, bpd=3.89, g_l=3.89, gn=3.09, l=3.66, p_l=3.44e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 69% 54/78 [04:46<02:08, 5.35s/it, bpd=3.37, g_l=3.37, gn=3.16, l=3.17, p_l=3.29e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 71% 55/78 [04:51<02:02, 5.31s/it, bpd=6.06, g_l=6.06, gn=3.84, l=5.7, p_l=3.56e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 72% 56/78 [04:57<01:56, 5.28s/it, bpd=4.69, g_l=4.69, gn=3.23, l=4.42, p_l=3.67e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 73% 57/78 [05:02<01:50, 5.26s/it, bpd=4.38, g_l=4.38, gn=3.5, l=4.12, p_l=3.81e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 74% 58/78 [05:07<01:44, 5.24s/it, bpd=4.3, g_l=4.3, gn=4, l=4.05, p_l=4.04e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 76% 59/78 [05:12<01:39, 5.22s/it, bpd=4.13, g_l=4.13, gn=3.5, l=3.89, p_l=4.62e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 77% 60/78 [05:17<01:33, 5.20s/it, bpd=6.16, g_l=6.16, gn=3.27, l=5.8, p_l=4.89e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 78% 61/78 [05:22<01:28, 5.18s/it, bpd=3.69, g_l=3.69, gn=3.02, l=3.47, p_l=4.91e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 79% 62/78 [05:28<01:22, 5.17s/it, bpd=5.21, g_l=5.21, gn=3.08, l=4.91, p_l=4.95e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 81% 63/78 [05:33<01:17, 5.16s/it, bpd=4.92, g_l=4.92, gn=2.94, l=4.63, p_l=4.73e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 82% 64/78 [05:38<01:12, 5.16s/it, bpd=6.01, g_l=6.01, gn=2.98, l=5.66, p_l=4.3e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 83% 65/78 [05:43<01:07, 5.16s/it, bpd=5.1, g_l=5.1, gn=3.29, l=4.8, p_l=4.24e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 85% 66/78 [05:48<01:01, 5.16s/it, bpd=4.57, g_l=4.57, gn=3.41, l=4.3, p_l=4.15e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 86% 67/78 [05:53<00:56, 5.16s/it, bpd=3.93, g_l=3.93, gn=5.05, l=3.7, p_l=4.02e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 87% 68/78 [05:59<00:51, 5.18s/it, bpd=3.67, g_l=3.67, gn=3.76, l=3.46, 
p_l=3.98e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 88% 69/78 [06:04<00:46, 5.19s/it, bpd=4.37, g_l=4.37, gn=3.63, l=4.11, p_l=3.71e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 90% 70/78 [06:09<00:41, 5.20s/it, bpd=4.44, g_l=4.44, gn=3.56, l=4.18, p_l=3.64e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 91% 71/78 [06:14<00:36, 5.20s/it, bpd=3.91, g_l=3.91, gn=3.21, l=3.68, p_l=3.52e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 92% 72/78 [06:19<00:31, 5.21s/it, bpd=4.31, g_l=4.31, gn=3.01, l=4.06, p_l=3.35e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 94% 73/78 [06:25<00:26, 5.21s/it, bpd=4.77, g_l=4.77, gn=3.75, l=4.49, p_l=3.2e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 95% 74/78 [06:30<00:20, 5.21s/it, bpd=2.96, g_l=2.96, gn=3.43, l=2.78, p_l=3.17e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 96% 75/78 [06:35<00:15, 5.21s/it, bpd=4.53, g_l=4.53, gn=3.13, l=4.26, p_l=3.13e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n","100% 78/78 [06:51<00:00, 5.27s/it, bpd=5.12, g_l=5.12, gn=3.57, l=4.82, p_l=2.52e-7]\n","Train bpd: 4.4915 prime_loss: 0.0000 gen_loss: 4.4915 loss: 4.2273 gn: 3.5573 lr: 0.0003 lg_loss_scale: 16.1660 epoch: 28.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (6).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2331\u001b[0m\n"," 11% 1/9 [00:01<00:15, 1.94s/it, bpd=5.21, l=4.9]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 22% 2/9 [00:03<00:12, 1.86s/it, bpd=5.15, l=4.85]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:05<00:10, 1.72s/it, bpd=5.28, l=4.97]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 4/9 [00:06<00:08, 1.63s/it, bpd=5.24, l=4.93]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 56% 5/9 [00:07<00:06, 1.56s/it, bpd=4.96, l=4.67]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.51s/it, bpd=4.79, l=4.5]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 
9/9 [00:13<00:00, 1.50s/it, bpd=5.71, l=5.37]\n","Ema bpd: 5.0665 prime_loss: 0.0132 gen_loss: 5.0665 loss: 4.7687 epoch: 28.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (16).txt\n","/content/gdrive/MyDrive/slon/slon (12).txt\n","/content/gdrive/MyDrive/slon/slon (16).txt\n"," 1% 1/78 [00:05<06:58, 5.44s/it, bpd=4.16, g_l=4.16, gn=3.36, l=3.92, p_l=2.34e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 3% 2/78 [00:10<06:48, 5.37s/it, bpd=3.73, g_l=3.73, gn=3.75, l=3.51, p_l=2.25e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 4% 3/78 [00:15<06:39, 5.32s/it, bpd=4.1, g_l=4.1, gn=2.89, l=3.86, p_l=2.19e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 5% 4/78 [00:21<06:33, 5.31s/it, bpd=4.05, g_l=4.05, gn=3.25, l=3.81, p_l=2.1e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 6% 5/78 [00:26<06:25, 5.29s/it, bpd=4.18, g_l=4.18, gn=3.39, l=3.93, p_l=1.88e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 8% 6/78 [00:31<06:20, 5.28s/it, bpd=2.86, g_l=2.86, gn=3.45, l=2.69, p_l=1.69e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 9% 7/78 [00:36<06:14, 5.27s/it, bpd=4.18, g_l=4.18, gn=3.52, l=3.93, p_l=1.58e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 10% 8/78 [00:42<06:08, 5.27s/it, bpd=4.48, g_l=4.48, gn=4.1, l=4.21, p_l=1.46e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 12% 9/78 [00:47<06:02, 5.25s/it, bpd=4.04, g_l=4.04, gn=3.17, l=3.8, p_l=1.36e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 13% 10/78 [00:52<05:56, 5.24s/it, bpd=4.4, g_l=4.4, gn=3.19, l=4.14, p_l=1.37e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 14% 11/78 [00:57<05:49, 5.22s/it, bpd=4.11, g_l=4.11, gn=3.53, l=3.87, p_l=1.38e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 15% 12/78 [01:02<05:44, 5.22s/it, bpd=5.41, g_l=5.41, gn=3.29, l=5.09, p_l=1.33e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 17% 13/78 [01:08<05:38, 5.21s/it, bpd=5.99, g_l=5.99, gn=2.86, l=5.63, p_l=1.44e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 18% 14/78 [01:13<05:32, 
5.20s/it, bpd=4.85, g_l=4.85, gn=3.14, l=4.56, p_l=1.56e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 19% 15/78 [01:18<05:27, 5.19s/it, bpd=5.49, g_l=5.49, gn=3.04, l=5.17, p_l=1.66e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 21% 16/78 [01:23<05:22, 5.20s/it, bpd=3.81, g_l=3.81, gn=3.53, l=3.58, p_l=1.61e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 22% 17/78 [01:28<05:16, 5.19s/it, bpd=4.47, g_l=4.47, gn=3.57, l=4.21, p_l=1.53e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 23% 18/78 [01:34<05:12, 5.21s/it, bpd=4.42, g_l=4.42, gn=3.47, l=4.16, p_l=1.43e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 24% 19/78 [01:39<05:07, 5.21s/it, bpd=4.66, g_l=4.66, gn=3.61, l=4.39, p_l=1.27e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 26% 20/78 [01:44<05:02, 5.22s/it, bpd=5.1, g_l=5.1, gn=3.4, l=4.8, p_l=1.19e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 27% 21/78 [01:49<04:57, 5.22s/it, bpd=5.56, g_l=5.56, gn=3.24, l=5.23, p_l=1.07e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 28% 22/78 [01:55<04:52, 5.22s/it, bpd=4.12, g_l=4.12, gn=3.12, l=3.87, p_l=8.78e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 29% 23/78 [02:00<04:47, 5.23s/it, bpd=4.91, g_l=4.91, gn=4.17, l=4.63, p_l=8.2e-8]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 31% 24/78 [02:05<04:42, 5.23s/it, bpd=4.93, g_l=4.93, gn=2.89, l=4.64, p_l=7.61e-8]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 32% 25/78 [02:10<04:36, 5.22s/it, bpd=4.61, g_l=4.61, gn=3.16, l=4.34, p_l=7.21e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 33% 26/78 [02:15<04:31, 5.22s/it, bpd=4.92, g_l=4.92, gn=2.92, l=4.63, p_l=7.26e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 35% 27/78 [02:21<04:26, 5.22s/it, bpd=4.66, g_l=4.66, gn=3.08, l=4.39, p_l=7.03e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 36% 28/78 [02:26<04:21, 5.23s/it, bpd=3.33, g_l=3.33, gn=4.57, l=3.14, p_l=6.4e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 37% 29/78 [02:31<04:15, 5.22s/it, bpd=4.73, g_l=4.73, gn=3.41, 
l=4.45, p_l=5.82e-8]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 38% 30/78 [02:36<04:10, 5.23s/it, bpd=4.33, g_l=4.33, gn=3.39, l=4.07, p_l=5.87e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 40% 31/78 [02:42<04:05, 5.22s/it, bpd=3.82, g_l=3.82, gn=3.63, l=3.59, p_l=6.45e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 41% 32/78 [02:47<04:00, 5.22s/it, bpd=4.58, g_l=4.58, gn=3.79, l=4.31, p_l=7.17e-8]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 42% 33/78 [02:52<03:54, 5.21s/it, bpd=4.23, g_l=4.23, gn=3.65, l=3.98, p_l=7.48e-8]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 44% 34/78 [02:57<03:49, 5.22s/it, bpd=3.94, g_l=3.94, gn=3.22, l=3.71, p_l=7.97e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 45% 35/78 [03:02<03:44, 5.22s/it, bpd=5.73, g_l=5.73, gn=3.16, l=5.4, p_l=7.93e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 46% 36/78 [03:08<03:39, 5.23s/it, bpd=4.35, g_l=4.35, gn=3.48, l=4.09, p_l=8.64e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 47% 37/78 [03:13<03:33, 5.22s/it, bpd=4.94, g_l=4.94, gn=3.21, l=4.65, p_l=8.55e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 49% 38/78 [03:18<03:28, 5.22s/it, bpd=4.03, g_l=4.03, gn=3.27, l=3.79, p_l=8.78e-8]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 50% 39/78 [03:23<03:23, 5.21s/it, bpd=5.44, g_l=5.44, gn=3.51, l=5.12, p_l=8.91e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 51% 40/78 [03:28<03:17, 5.21s/it, bpd=4.1, g_l=4.1, gn=3.17, l=3.86, p_l=8.87e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 53% 41/78 [03:34<03:12, 5.21s/it, bpd=2.68, g_l=2.68, gn=3.31, l=2.52, p_l=8.2e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 54% 42/78 [03:39<03:07, 5.20s/it, bpd=4.34, g_l=4.34, gn=3.79, l=4.09, p_l=8.15e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 55% 43/78 [03:44<03:01, 5.19s/it, bpd=3.4, g_l=3.4, gn=4.42, l=3.2, p_l=7.93e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 56% 44/78 [03:49<02:56, 5.20s/it, bpd=4.91, g_l=4.91, gn=3.26, l=4.62, 
p_l=7.3e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 58% 45/78 [03:54<02:51, 5.19s/it, bpd=4.02, g_l=4.02, gn=3.55, l=3.78, p_l=6.99e-8]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 59% 46/78 [04:00<02:46, 5.20s/it, bpd=3.63, g_l=3.63, gn=4.82, l=3.42, p_l=6.49e-8]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 60% 47/78 [04:05<02:40, 5.19s/it, bpd=3.78, g_l=3.78, gn=3.09, l=3.56, p_l=6.63e-8]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 62% 48/78 [04:10<02:35, 5.20s/it, bpd=3.76, g_l=3.76, gn=3.5, l=3.54, p_l=6.76e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 63% 49/78 [04:15<02:30, 5.20s/it, bpd=6.06, g_l=6.06, gn=3.47, l=5.7, p_l=6.94e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2381\u001b[0m\n"," 64% 50/78 [04:56<07:27, 15.99s/it, bpd=4.08, g_l=4.08, gn=3.19, l=3.84, p_l=7.12e-8]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 65% 51/78 [05:02<05:44, 12.75s/it, bpd=4.89, g_l=4.89, gn=3.16, l=4.6, p_l=7.21e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 67% 52/78 [05:07<04:31, 10.43s/it, bpd=4.11, g_l=4.11, gn=3.15, l=3.87, p_l=7.48e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 68% 53/78 [05:12<03:40, 8.81s/it, bpd=3.38, g_l=3.38, gn=3.12, l=3.18, p_l=7.66e-8]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 69% 54/78 [05:17<03:04, 7.68s/it, bpd=4.66, g_l=4.66, gn=2.94, l=4.39, p_l=7.61e-8]/content/gdrive/MyDrive/slon/slon (35).txt\n","\n","Overflow in backward. 
Loss 4.30302095413208, grad norm nan, lgscale 16.54000000000035, new lgscale 15.540000000000349\n"," 71% 55/78 [05:21<02:32, 6.65s/it, bpd=4.66, g_l=4.66, gn=2.94, l=4.39, p_l=7.61e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 72% 56/78 [05:26<02:16, 6.19s/it, bpd=4.38, g_l=4.38, gn=5.41, l=4.13, p_l=8.15e-8]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 73% 57/78 [05:31<02:03, 5.86s/it, bpd=5.05, g_l=5.05, gn=3.54, l=4.75, p_l=8.96e-8]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 74% 58/78 [05:36<01:53, 5.67s/it, bpd=4.23, g_l=4.23, gn=3.41, l=3.98, p_l=1.08e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 76% 59/78 [05:41<01:44, 5.51s/it, bpd=5.21, g_l=5.21, gn=3.71, l=4.9, p_l=1.25e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 77% 60/78 [05:47<01:37, 5.42s/it, bpd=5.01, g_l=5.01, gn=3.41, l=4.72, p_l=1.43e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 78% 61/78 [05:52<01:31, 5.36s/it, bpd=3.79, g_l=3.79, gn=3.55, l=3.57, p_l=1.51e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 79% 62/78 [05:57<01:25, 5.35s/it, bpd=3.75, g_l=3.75, gn=3.19, l=3.53, p_l=1.55e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 81% 63/78 [06:02<01:19, 5.31s/it, bpd=4.45, g_l=4.45, gn=6.85, l=4.19, p_l=1.43e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 82% 64/78 [06:08<01:14, 5.32s/it, bpd=5.04, g_l=5.04, gn=3.89, l=4.75, p_l=1.42e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 83% 65/78 [06:13<01:08, 5.30s/it, bpd=4.32, g_l=4.32, gn=5.06, l=4.07, p_l=1.4e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 85% 66/78 [06:18<01:03, 5.33s/it, bpd=5.38, g_l=5.38, gn=3.55, l=5.06, p_l=1.47e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 86% 67/78 [06:24<00:58, 5.31s/it, bpd=5.64, g_l=5.64, gn=3.11, l=5.31, p_l=1.55e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 87% 68/78 [06:29<00:53, 5.33s/it, bpd=4.54, g_l=4.54, gn=3.71, l=4.27, p_l=1.64e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 88% 69/78 [06:34<00:47, 5.31s/it, bpd=4.13, g_l=4.13, gn=3.21, 
l=3.89, p_l=1.75e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 90% 70/78 [06:42<00:49, 6.16s/it, bpd=5.4, g_l=5.4, gn=3.23, l=5.08, p_l=1.78e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 91% 71/78 [06:48<00:41, 5.89s/it, bpd=4.76, g_l=4.76, gn=4.08, l=4.48, p_l=1.69e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 92% 72/78 [06:53<00:34, 5.68s/it, bpd=4.25, g_l=4.25, gn=3.64, l=4, p_l=1.49e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 94% 73/78 [06:58<00:27, 5.57s/it, bpd=4.82, g_l=4.82, gn=4.47, l=4.53, p_l=1.25e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 95% 74/78 [07:03<00:21, 5.46s/it, bpd=3.19, g_l=3.19, gn=3.33, l=3, p_l=1.26e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 96% 75/78 [07:09<00:16, 5.45s/it, bpd=4.65, g_l=4.65, gn=5.35, l=4.38, p_l=1.26e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n","100% 78/78 [07:25<00:00, 5.71s/it, bpd=3.52, g_l=3.52, gn=3.5, l=3.31, p_l=1.39e-7]\n","Train bpd: 4.4297 prime_loss: 0.0000 gen_loss: 4.4297 loss: 4.1692 gn: 3.5653 lr: 0.0003 lg_loss_scale: 16.1773 epoch: 29.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2408\u001b[0m\n"," 11% 1/9 [00:02<00:17, 2.19s/it, bpd=5.3, l=4.99]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 22% 2/9 [00:03<00:14, 2.02s/it, bpd=5.67, l=5.33]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:05<00:10, 1.83s/it, bpd=5.63, l=5.3]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 4/9 [00:06<00:08, 1.70s/it, bpd=4.83, l=4.55]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:07<00:06, 1.61s/it, bpd=4.59, l=4.32]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 67% 6/9 [00:09<00:04, 1.54s/it, bpd=4.91, l=4.62]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.52s/it, bpd=5.18, l=4.88]\n","Ema bpd: 5.0994 prime_loss: 0.0130 gen_loss: 5.0994 loss: 4.7997 epoch: 
29.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (17).txt\n","/content/gdrive/MyDrive/slon/slon (28).txt\n","/content/gdrive/MyDrive/slon/slon (1).txt\n"," 1% 1/78 [00:05<06:54, 5.38s/it, bpd=3.86, g_l=3.86, gn=2.97, l=3.63, p_l=1.44e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 3% 2/78 [00:10<06:45, 5.33s/it, bpd=3.26, g_l=3.26, gn=4.82, l=3.07, p_l=1.46e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 4% 3/78 [00:15<06:37, 5.30s/it, bpd=4.18, g_l=4.18, gn=3.71, l=3.93, p_l=1.42e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 5% 4/78 [00:21<06:30, 5.28s/it, bpd=5.31, g_l=5.31, gn=3.82, l=5, p_l=1.37e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 6% 5/78 [00:26<06:25, 5.28s/it, bpd=2.3, g_l=2.3, gn=5.34, l=2.16, p_l=1.23e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 8% 6/78 [00:31<06:19, 5.28s/it, bpd=3.8, g_l=3.8, gn=3.99, l=3.58, p_l=1.2e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 9% 7/78 [00:36<06:13, 5.27s/it, bpd=5.51, g_l=5.51, gn=3.09, l=5.19, p_l=1.17e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 10% 8/78 [00:42<06:07, 5.25s/it, bpd=4.9, g_l=4.9, gn=4.23, l=4.61, p_l=1.2e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 12% 9/78 [00:47<06:01, 5.24s/it, bpd=4.36, g_l=4.36, gn=4.56, l=4.1, p_l=1.33e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 13% 10/78 [00:52<05:55, 5.22s/it, bpd=4.4, g_l=4.4, gn=2.96, l=4.14, p_l=1.54e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [00:57<05:49, 5.21s/it, bpd=4.82, g_l=4.82, gn=6.19, l=4.53, p_l=1.8e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 15% 12/78 [01:02<05:42, 5.19s/it, bpd=4.04, g_l=4.04, gn=3.46, l=3.8, p_l=2.25e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 17% 13/78 [01:07<05:36, 5.18s/it, bpd=3.95, g_l=3.95, gn=3.22, l=3.72, p_l=2.63e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 18% 14/78 [01:13<05:30, 5.17s/it, bpd=4.66, g_l=4.66, gn=3.53, l=4.38, p_l=2.83e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 19% 15/78 
[01:18<05:25, 5.17s/it, bpd=5.2, g_l=5.2, gn=3.13, l=4.89, p_l=3.05e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 21% 16/78 [01:23<05:20, 5.17s/it, bpd=3.92, g_l=3.92, gn=3.73, l=3.69, p_l=3.05e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 22% 17/78 [01:28<05:16, 5.19s/it, bpd=4, g_l=4, gn=3.34, l=3.76, p_l=3.05e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 23% 18/78 [01:33<05:11, 5.19s/it, bpd=4.1, g_l=4.1, gn=3.38, l=3.86, p_l=2.87e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 24% 19/78 [01:39<05:06, 5.20s/it, bpd=4.02, g_l=4.02, gn=3.39, l=3.78, p_l=2.88e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 26% 20/78 [01:44<05:01, 5.20s/it, bpd=6.05, g_l=6.05, gn=3.27, l=5.7, p_l=2.92e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 27% 21/78 [01:49<04:57, 5.21s/it, bpd=4.8, g_l=4.8, gn=4.87, l=4.52, p_l=2.92e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 28% 22/78 [01:54<04:51, 5.21s/it, bpd=4.97, g_l=4.97, gn=3.07, l=4.68, p_l=2.82e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 29% 23/78 [01:59<04:46, 5.22s/it, bpd=4.3, g_l=4.3, gn=3.52, l=4.05, p_l=2.69e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 31% 24/78 [02:05<04:41, 5.21s/it, bpd=5.71, g_l=5.71, gn=3.08, l=5.37, p_l=2.62e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 32% 25/78 [02:10<04:36, 5.21s/it, bpd=3.9, g_l=3.9, gn=3.02, l=3.67, p_l=2.37e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 33% 26/78 [02:15<04:30, 5.20s/it, bpd=3.63, g_l=3.63, gn=4.89, l=3.42, p_l=2.17e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 35% 27/78 [02:20<04:25, 5.21s/it, bpd=4.03, g_l=4.03, gn=3.46, l=3.79, p_l=2.03e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 36% 28/78 [02:25<04:19, 5.20s/it, bpd=4.14, g_l=4.14, gn=7.01, l=3.89, p_l=1.81e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 37% 29/78 [02:31<04:15, 5.21s/it, bpd=3.76, g_l=3.76, gn=5.04, l=3.54, p_l=1.55e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 38% 30/78 [02:36<04:09, 5.20s/it, bpd=4.57, g_l=4.57, gn=3.31, 
l=4.3, p_l=1.29e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 40% 31/78 [02:41<04:04, 5.20s/it, bpd=3.81, g_l=3.81, gn=3.74, l=3.59, p_l=1.16e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 41% 32/78 [02:46<03:58, 5.19s/it, bpd=5.2, g_l=5.2, gn=3.35, l=4.89, p_l=1.14e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 42% 33/78 [02:51<03:53, 5.19s/it, bpd=4.98, g_l=4.98, gn=3.14, l=4.69, p_l=1.2e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 44% 34/78 [02:57<03:47, 5.18s/it, bpd=5.2, g_l=5.2, gn=3.32, l=4.89, p_l=1.41e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 45% 35/78 [03:02<03:42, 5.18s/it, bpd=3.73, g_l=3.73, gn=5.78, l=3.51, p_l=1.59e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 46% 36/78 [03:07<03:37, 5.18s/it, bpd=5.11, g_l=5.11, gn=3.38, l=4.81, p_l=1.78e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 47% 37/78 [03:12<03:32, 5.19s/it, bpd=3.74, g_l=3.74, gn=3.3, l=3.52, p_l=1.75e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 49% 38/78 [03:17<03:27, 5.18s/it, bpd=3.86, g_l=3.86, gn=3.04, l=3.63, p_l=1.61e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 50% 39/78 [03:23<03:22, 5.19s/it, bpd=4.79, g_l=4.79, gn=3.56, l=4.51, p_l=1.44e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 51% 40/78 [03:28<03:16, 5.18s/it, bpd=4.3, g_l=4.3, gn=3.76, l=4.04, p_l=1.21e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 53% 41/78 [03:33<03:11, 5.19s/it, bpd=4.77, g_l=4.77, gn=3.56, l=4.49, p_l=1e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 54% 42/78 [03:38<03:06, 5.18s/it, bpd=4.55, g_l=4.55, gn=3.62, l=4.28, p_l=8.78e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 55% 43/78 [03:43<03:01, 5.19s/it, bpd=4, g_l=4, gn=3.56, l=3.77, p_l=8.38e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 56% 44/78 [03:48<02:56, 5.19s/it, bpd=3.65, g_l=3.65, gn=3.58, l=3.44, p_l=8.33e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 58% 45/78 [03:54<02:51, 5.19s/it, bpd=4.86, g_l=4.86, gn=3.3, l=4.57, p_l=9.81e-8]/content/gdrive/MyDrive/slon/slon 
(17).txt\n"," 59% 46/78 [03:59<02:46, 5.19s/it, bpd=3.37, g_l=3.37, gn=2.98, l=3.17, p_l=1.16e-7]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 60% 47/78 [04:04<02:41, 5.19s/it, bpd=4.71, g_l=4.71, gn=3.14, l=4.44, p_l=1.44e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 62% 48/78 [04:09<02:35, 5.19s/it, bpd=4.11, g_l=4.11, gn=3.71, l=3.87, p_l=1.48e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 63% 49/78 [04:14<02:30, 5.20s/it, bpd=5.41, g_l=5.41, gn=3.75, l=5.09, p_l=1.42e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 64% 50/78 [04:20<02:25, 5.19s/it, bpd=3.91, g_l=3.91, gn=3.47, l=3.68, p_l=1.33e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 65% 51/78 [04:25<02:20, 5.19s/it, bpd=3.84, g_l=3.84, gn=4.28, l=3.61, p_l=1.27e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 67% 52/78 [04:30<02:14, 5.19s/it, bpd=4.33, g_l=4.33, gn=3.12, l=4.08, p_l=1.31e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 68% 53/78 [04:35<02:09, 5.19s/it, bpd=4.66, g_l=4.66, gn=3.22, l=4.38, p_l=1.43e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 69% 54/78 [04:40<02:04, 5.19s/it, bpd=4.37, g_l=4.37, gn=4.03, l=4.11, p_l=1.48e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 71% 55/78 [04:46<01:59, 5.19s/it, bpd=4.16, g_l=4.16, gn=3.44, l=3.91, p_l=1.5e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 72% 56/78 [04:51<01:54, 5.19s/it, bpd=5.92, g_l=5.92, gn=3.55, l=5.58, p_l=1.49e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 73% 57/78 [04:56<01:49, 5.20s/it, bpd=5.01, g_l=5.01, gn=3.17, l=4.72, p_l=1.48e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 74% 58/78 [05:01<01:43, 5.19s/it, bpd=3.56, g_l=3.56, gn=3.7, l=3.35, p_l=1.39e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 76% 59/78 [05:06<01:38, 5.20s/it, bpd=3.68, g_l=3.68, gn=3.9, l=3.47, p_l=1.37e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 77% 60/78 [05:12<01:33, 5.20s/it, bpd=5.41, g_l=5.41, gn=3.46, l=5.09, p_l=1.52e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 78% 61/78 [05:17<01:28, 
5.21s/it, bpd=5, g_l=5, gn=3.3, l=4.7, p_l=1.67e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 79% 62/78 [05:22<01:23, 5.20s/it, bpd=4.34, g_l=4.34, gn=3.74, l=4.09, p_l=1.79e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 81% 63/78 [05:27<01:18, 5.20s/it, bpd=4.03, g_l=4.03, gn=5.3, l=3.8, p_l=1.9e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 82% 64/78 [05:32<01:12, 5.20s/it, bpd=4, g_l=4, gn=3.2, l=3.76, p_l=2.02e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 83% 65/78 [05:38<01:07, 5.20s/it, bpd=4.63, g_l=4.63, gn=3.25, l=4.36, p_l=2.08e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 85% 66/78 [05:43<01:02, 5.20s/it, bpd=6.43, g_l=6.43, gn=3, l=6.05, p_l=2.1e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 86% 67/78 [05:48<00:57, 5.21s/it, bpd=3.91, g_l=3.91, gn=3.1, l=3.68, p_l=1.83e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 87% 68/78 [05:53<00:52, 5.20s/it, bpd=4.06, g_l=4.06, gn=3.47, l=3.82, p_l=1.65e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 88% 69/78 [05:58<00:46, 5.21s/it, bpd=4.27, g_l=4.27, gn=3.91, l=4.02, p_l=1.48e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 90% 70/78 [06:04<00:41, 5.21s/it, bpd=4.51, g_l=4.51, gn=3.73, l=4.24, p_l=1.36e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 91% 71/78 [06:09<00:36, 5.21s/it, bpd=4.33, g_l=4.33, gn=3.66, l=4.07, p_l=1.33e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 92% 72/78 [06:14<00:31, 5.21s/it, bpd=4.69, g_l=4.69, gn=3.46, l=4.41, p_l=1.4e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 94% 73/78 [06:19<00:26, 5.21s/it, bpd=4.15, g_l=4.15, gn=3.66, l=3.9, p_l=1.43e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 95% 74/78 [06:24<00:20, 5.21s/it, bpd=4.72, g_l=4.72, gn=3.13, l=4.44, p_l=1.48e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 96% 75/78 [06:30<00:15, 5.21s/it, bpd=4.18, g_l=4.18, gn=4.24, l=3.94, p_l=1.44e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n","100% 78/78 [06:45<00:00, 5.20s/it, bpd=4.99, g_l=4.99, gn=3.23, l=4.69, 
p_l=1.16e-7]\n","Train bpd: 4.4066 prime_loss: 0.0000 gen_loss: 4.4066 loss: 4.1474 gn: 3.6992 lr: 0.0003 lg_loss_scale: 15.7860 epoch: 30.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (6).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2486\u001b[0m\n"," 11% 1/9 [00:02<00:17, 2.18s/it, bpd=4.5, l=4.24]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 22% 2/9 [00:03<00:14, 2.00s/it, bpd=4.37, l=4.12]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 33% 3/9 [00:05<00:10, 1.82s/it, bpd=4.75, l=4.47]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 44% 4/9 [00:06<00:08, 1.69s/it, bpd=5.48, l=5.16]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 56% 5/9 [00:07<00:06, 1.61s/it, bpd=5.66, l=5.33]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 67% 6/9 [00:09<00:04, 1.54s/it, bpd=5.64, l=5.31]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.52s/it, bpd=4.91, l=4.62]\n","Ema bpd: 5.0524 prime_loss: 0.0130 gen_loss: 5.0524 loss: 4.7555 epoch: 30.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (16).txt\n","/content/gdrive/MyDrive/slon/slon (21).txt\n","/content/gdrive/MyDrive/slon/slon (35).txt\n"," 1% 1/78 [00:05<06:56, 5.41s/it, bpd=4.92, g_l=4.92, gn=3.23, l=4.63, p_l=1.1e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 3% 2/78 [00:10<06:46, 5.35s/it, bpd=5.12, g_l=5.12, gn=2.97, l=4.82, p_l=1.05e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 4% 3/78 [00:15<06:38, 5.32s/it, bpd=4.87, g_l=4.87, gn=3.74, l=4.59, p_l=9.63e-8]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 5% 4/78 [00:21<06:32, 5.31s/it, bpd=3.22, g_l=3.22, gn=3.85, l=3.03, p_l=8.73e-8]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 6% 5/78 [00:26<06:26, 5.30s/it, bpd=4.05, g_l=4.05, gn=3.33, l=3.81, p_l=8.02e-8]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 8% 6/78 [00:31<06:20, 5.29s/it, bpd=5.05, g_l=5.05, gn=3.95, l=4.75, 
p_l=7.93e-8]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 9% 7/78 [00:36<06:14, 5.27s/it, bpd=5.68, g_l=5.68, gn=3.4, l=5.35, p_l=7.35e-8]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 10% 8/78 [00:42<06:08, 5.26s/it, bpd=5.45, g_l=5.45, gn=3.47, l=5.13, p_l=6.67e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 12% 9/78 [00:47<06:01, 5.24s/it, bpd=4.04, g_l=4.04, gn=5.78, l=3.8, p_l=6.36e-8]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 13% 10/78 [00:52<05:54, 5.22s/it, bpd=5.44, g_l=5.44, gn=3.42, l=5.12, p_l=5.69e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [00:57<05:48, 5.20s/it, bpd=4.5, g_l=4.5, gn=3.4, l=4.23, p_l=5.24e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 15% 12/78 [01:02<05:41, 5.18s/it, bpd=3.35, g_l=3.35, gn=4, l=3.15, p_l=5.11e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 17% 13/78 [01:07<05:35, 5.17s/it, bpd=3.99, g_l=3.99, gn=3.06, l=3.75, p_l=5.02e-8]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 18% 14/78 [01:18<07:11, 6.75s/it, bpd=4.41, g_l=4.41, gn=3.94, l=4.15, p_l=5.37e-8]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 19% 15/78 [01:23<06:33, 6.25s/it, bpd=3.62, g_l=3.62, gn=4.17, l=3.41, p_l=5.78e-8]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 21% 16/78 [01:28<06:06, 5.91s/it, bpd=5.57, g_l=5.57, gn=3.1, l=5.24, p_l=6.09e-8]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 22% 17/78 [01:33<05:47, 5.70s/it, bpd=4.75, g_l=4.75, gn=3.63, l=4.47, p_l=7.03e-8]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 23% 18/78 [01:39<05:34, 5.57s/it, bpd=4.97, g_l=4.97, gn=3.62, l=4.68, p_l=7.79e-8]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 24% 19/78 [01:44<05:23, 5.49s/it, bpd=4.13, g_l=4.13, gn=3.05, l=3.89, p_l=8.51e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 26% 20/78 [01:49<05:15, 5.43s/it, bpd=5, g_l=5, gn=4.24, l=4.71, p_l=8.87e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 27% 21/78 [01:54<05:07, 5.39s/it, bpd=4.79, g_l=4.79, gn=3.29, l=4.5, p_l=9.18e-8]/content/gdrive/MyDrive/slon/slon 
(14).txt\n"," 28% 22/78 [02:00<04:59, 5.34s/it, bpd=3.97, g_l=3.97, gn=3.88, l=3.74, p_l=9.45e-8]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 29% 23/78 [02:05<04:51, 5.31s/it, bpd=5.27, g_l=5.27, gn=3.26, l=4.96, p_l=9.85e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 31% 24/78 [02:10<04:44, 5.28s/it, bpd=5.27, g_l=5.27, gn=3.27, l=4.96, p_l=9e-8]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 32% 25/78 [02:15<04:37, 5.24s/it, bpd=4.99, g_l=4.99, gn=3.28, l=4.7, p_l=9.23e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 33% 26/78 [02:20<04:30, 5.21s/it, bpd=4.25, g_l=4.25, gn=4.11, l=4, p_l=9.49e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 35% 27/78 [02:26<04:24, 5.18s/it, bpd=4.1, g_l=4.1, gn=5.18, l=3.86, p_l=9.85e-8]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 36% 28/78 [02:31<04:18, 5.17s/it, bpd=3.88, g_l=3.88, gn=3.84, l=3.65, p_l=9.99e-8]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 37% 29/78 [02:36<04:12, 5.16s/it, bpd=4.09, g_l=4.09, gn=3.72, l=3.85, p_l=1.02e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 38% 30/78 [02:41<04:07, 5.15s/it, bpd=4.18, g_l=4.18, gn=3.77, l=3.93, p_l=1.01e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 40% 31/78 [02:46<04:01, 5.15s/it, bpd=4.5, g_l=4.5, gn=4.65, l=4.23, p_l=1.01e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 41% 32/78 [02:51<03:57, 5.16s/it, bpd=3.23, g_l=3.23, gn=3.18, l=3.04, p_l=9.81e-8]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 42% 33/78 [02:56<03:52, 5.16s/it, bpd=3.75, g_l=3.75, gn=2.89, l=3.53, p_l=8.91e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 44% 34/78 [03:02<03:47, 5.17s/it, bpd=4.89, g_l=4.89, gn=3.88, l=4.61, p_l=8.24e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 45% 35/78 [03:07<03:42, 5.18s/it, bpd=3.38, g_l=3.38, gn=3.13, l=3.18, p_l=7.3e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 46% 36/78 [03:12<03:37, 5.19s/it, bpd=4.49, g_l=4.49, gn=3.16, l=4.23, p_l=6.76e-8]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 47% 37/78 [03:17<03:32, 5.19s/it, 
bpd=4.53, g_l=4.53, gn=3.42, l=4.26, p_l=6e-8]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 49% 38/78 [03:22<03:27, 5.19s/it, bpd=4.77, g_l=4.77, gn=3.09, l=4.49, p_l=5.91e-8]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 50% 39/78 [03:28<03:22, 5.20s/it, bpd=5.35, g_l=5.35, gn=3.22, l=5.04, p_l=6e-8]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 51% 40/78 [03:33<03:17, 5.19s/it, bpd=4.95, g_l=4.95, gn=3.86, l=4.66, p_l=6.72e-8]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 53% 41/78 [03:38<03:12, 5.19s/it, bpd=5, g_l=5, gn=4.36, l=4.71, p_l=7.97e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 54% 42/78 [03:43<03:06, 5.18s/it, bpd=3.92, g_l=3.92, gn=3.73, l=3.69, p_l=9.05e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 55% 43/78 [03:48<03:01, 5.18s/it, bpd=4.43, g_l=4.43, gn=4.24, l=4.17, p_l=1.03e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 56% 44/78 [03:53<02:55, 5.17s/it, bpd=4.46, g_l=4.46, gn=4.64, l=4.19, p_l=1.01e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 58% 45/78 [03:59<02:50, 5.18s/it, bpd=4.17, g_l=4.17, gn=3.64, l=3.92, p_l=9.72e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 59% 46/78 [04:04<02:45, 5.17s/it, bpd=4.27, g_l=4.27, gn=3.19, l=4.02, p_l=8.51e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 60% 47/78 [04:09<02:40, 5.17s/it, bpd=4.12, g_l=4.12, gn=3.07, l=3.87, p_l=6.99e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 62% 48/78 [04:14<02:35, 5.17s/it, bpd=4.29, g_l=4.29, gn=3.91, l=4.04, p_l=5.91e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 63% 49/78 [04:19<02:29, 5.17s/it, bpd=5.01, g_l=5.01, gn=3.53, l=4.72, p_l=5.33e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 64% 50/78 [04:25<02:24, 5.17s/it, bpd=4.42, g_l=4.42, gn=3.09, l=4.16, p_l=4.84e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 65% 51/78 [04:30<02:19, 5.18s/it, bpd=5.08, g_l=5.08, gn=3.3, l=4.78, p_l=4.43e-8]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 67% 52/78 [04:35<02:14, 5.19s/it, bpd=3.99, g_l=3.99, gn=3.47, l=3.75, 
p_l=4.21e-8]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 68% 53/78 [04:40<02:09, 5.19s/it, bpd=4.37, g_l=4.37, gn=5.01, l=4.11, p_l=4.12e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 69% 54/78 [04:45<02:04, 5.20s/it, bpd=5.39, g_l=5.39, gn=3, l=5.07, p_l=4.12e-8]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 71% 55/78 [04:51<01:59, 5.21s/it, bpd=4.1, g_l=4.1, gn=3.9, l=3.86, p_l=4.34e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 72% 56/78 [04:56<01:54, 5.21s/it, bpd=4.63, g_l=4.63, gn=3.83, l=4.35, p_l=4.66e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 73% 57/78 [05:01<01:49, 5.21s/it, bpd=4.05, g_l=4.05, gn=3.8, l=3.81, p_l=4.57e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 74% 58/78 [05:06<01:44, 5.20s/it, bpd=3.41, g_l=3.41, gn=3.63, l=3.21, p_l=4.21e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 76% 59/78 [05:11<01:38, 5.20s/it, bpd=4.12, g_l=4.12, gn=3.29, l=3.88, p_l=3.9e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 77% 60/78 [05:17<01:33, 5.20s/it, bpd=4.12, g_l=4.12, gn=3.69, l=3.88, p_l=3.76e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 78% 61/78 [05:22<01:28, 5.20s/it, bpd=5.11, g_l=5.11, gn=3.63, l=4.81, p_l=3.45e-8]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 79% 62/78 [05:27<01:23, 5.20s/it, bpd=4.16, g_l=4.16, gn=3.29, l=3.92, p_l=3.22e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 81% 63/78 [05:32<01:17, 5.19s/it, bpd=4.79, g_l=4.79, gn=3.93, l=4.51, p_l=3.18e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 82% 64/78 [05:37<01:12, 5.19s/it, bpd=4.04, g_l=4.04, gn=3.52, l=3.8, p_l=3.22e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 83% 65/78 [05:43<01:07, 5.19s/it, bpd=3.83, g_l=3.83, gn=3.13, l=3.6, p_l=3.09e-8]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 85% 66/78 [05:48<01:02, 5.19s/it, bpd=3.88, g_l=3.88, gn=5.1, l=3.65, p_l=2.87e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 86% 67/78 [05:53<00:57, 5.18s/it, bpd=4.72, g_l=4.72, gn=3.7, l=4.44, p_l=2.91e-8]/content/gdrive/MyDrive/slon/slon 
(17).txt\n"," 87% 68/78 [05:58<00:51, 5.18s/it, bpd=6.11, g_l=6.11, gn=3.3, l=5.75, p_l=3.05e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 88% 69/78 [06:03<00:46, 5.18s/it, bpd=5.38, g_l=5.38, gn=3.26, l=5.06, p_l=2.87e-8]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 90% 70/78 [06:08<00:41, 5.17s/it, bpd=3.94, g_l=3.94, gn=3.46, l=3.71, p_l=2.64e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 91% 71/78 [06:14<00:36, 5.17s/it, bpd=4.57, g_l=4.57, gn=3.81, l=4.3, p_l=2.37e-8]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 92% 72/78 [06:19<00:31, 5.17s/it, bpd=4.28, g_l=4.28, gn=3.28, l=4.03, p_l=2.19e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 94% 73/78 [06:24<00:25, 5.16s/it, bpd=4.19, g_l=4.19, gn=3.93, l=3.95, p_l=2.1e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 95% 74/78 [06:29<00:20, 5.17s/it, bpd=3.74, g_l=3.74, gn=3.61, l=3.52, p_l=1.97e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 96% 75/78 [06:34<00:15, 5.16s/it, bpd=3.33, g_l=3.33, gn=3.4, l=3.13, p_l=1.84e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n","100% 78/78 [06:50<00:00, 5.26s/it, bpd=4.58, g_l=4.58, gn=3.07, l=4.31, p_l=1.97e-8]\n","Train bpd: 4.4489 prime_loss: 0.0000 gen_loss: 4.4489 loss: 4.1872 gn: 3.6555 lr: 0.0003 lg_loss_scale: 16.0980 epoch: 31.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2564\u001b[0m\n"," 11% 1/9 [00:01<00:15, 1.93s/it, bpd=5.24, l=4.93]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 22% 2/9 [00:03<00:13, 1.88s/it, bpd=4.77, l=4.49]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 33% 3/9 [00:05<00:10, 1.73s/it, bpd=4.56, l=4.29]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 44% 4/9 [00:06<00:08, 1.63s/it, bpd=5.67, l=5.33]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 56% 5/9 [00:07<00:06, 1.56s/it, bpd=5.1, l=4.8]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 67% 6/9 
[00:09<00:04, 1.51s/it, bpd=5.53, l=5.2]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.51s/it, bpd=4.8, l=4.52]\n","Ema bpd: 5.0100 prime_loss: 0.0128 gen_loss: 5.0100 loss: 4.7156 epoch: 31.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (31).txt\n","/content/gdrive/MyDrive/slon/slon (17).txt\n","/content/gdrive/MyDrive/slon/slon (1).txt\n"," 1% 1/78 [00:05<06:52, 5.36s/it, bpd=4.34, g_l=4.34, gn=2.73, l=4.08, p_l=2.15e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 3% 2/78 [00:10<06:44, 5.32s/it, bpd=3.93, g_l=3.93, gn=3.11, l=3.7, p_l=2.28e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 4% 3/78 [00:15<06:37, 5.30s/it, bpd=4.08, g_l=4.08, gn=3.61, l=3.84, p_l=2.64e-8]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 5% 4/78 [00:21<06:32, 5.30s/it, bpd=3.92, g_l=3.92, gn=2.96, l=3.69, p_l=2.78e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 6% 5/78 [00:26<06:25, 5.29s/it, bpd=3.93, g_l=3.93, gn=5.74, l=3.69, p_l=3.05e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 8% 6/78 [00:31<06:21, 5.29s/it, bpd=4.49, g_l=4.49, gn=5.47, l=4.23, p_l=3.22e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 9% 7/78 [00:36<06:14, 5.28s/it, bpd=4.48, g_l=4.48, gn=3.29, l=4.21, p_l=3.76e-8]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 10% 8/78 [00:42<06:09, 5.28s/it, bpd=4.05, g_l=4.05, gn=3.84, l=3.81, p_l=3.9e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 12% 9/78 [00:47<06:02, 5.25s/it, bpd=4.49, g_l=4.49, gn=3.08, l=4.23, p_l=4.66e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 13% 10/78 [00:52<05:56, 5.24s/it, bpd=3.43, g_l=3.43, gn=3.32, l=3.23, p_l=5.15e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 14% 11/78 [00:57<05:49, 5.21s/it, bpd=3.88, g_l=3.88, gn=4.56, l=3.65, p_l=5.55e-8]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 15% 12/78 [01:02<05:43, 5.21s/it, bpd=4.05, g_l=4.05, gn=4.03, l=3.82, p_l=5.64e-8]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 17% 13/78 [01:08<05:37, 5.19s/it, bpd=3.39, g_l=3.39, 
gn=3.9, l=3.19, p_l=5.69e-8]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 18% 14/78 [01:13<05:32, 5.19s/it, bpd=4.08, g_l=4.08, gn=3.58, l=3.84, p_l=5.91e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 19% 15/78 [01:18<05:26, 5.18s/it, bpd=5.89, g_l=5.89, gn=3.21, l=5.54, p_l=6.36e-8]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 21% 16/78 [01:23<05:21, 5.18s/it, bpd=4.02, g_l=4.02, gn=7.44, l=3.78, p_l=6.45e-8]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 22% 17/78 [01:28<05:16, 5.19s/it, bpd=4.97, g_l=4.97, gn=4.22, l=4.68, p_l=6.76e-8]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 23% 18/78 [01:34<05:12, 5.20s/it, bpd=5.51, g_l=5.51, gn=3.26, l=5.19, p_l=7.39e-8]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 24% 19/78 [01:39<05:06, 5.20s/it, bpd=5.53, g_l=5.53, gn=3.38, l=5.2, p_l=8.51e-8]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 26% 20/78 [01:44<05:02, 5.21s/it, bpd=5.49, g_l=5.49, gn=2.93, l=5.17, p_l=9.09e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 27% 21/78 [01:49<04:56, 5.21s/it, bpd=2.78, g_l=2.78, gn=3.05, l=2.61, p_l=9.76e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 28% 22/78 [01:54<04:52, 5.22s/it, bpd=5.17, g_l=5.17, gn=3.29, l=4.86, p_l=1.05e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 29% 23/78 [02:00<04:46, 5.21s/it, bpd=4.2, g_l=4.2, gn=3.83, l=3.95, p_l=1.2e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 31% 24/78 [02:05<04:41, 5.21s/it, bpd=3.93, g_l=3.93, gn=3, l=3.7, p_l=1.31e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 32% 25/78 [02:10<04:35, 5.21s/it, bpd=5.39, g_l=5.39, gn=3.54, l=5.08, p_l=1.45e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 33% 26/78 [02:15<04:31, 5.21s/it, bpd=4.43, g_l=4.43, gn=3.54, l=4.17, p_l=1.57e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 35% 27/78 [02:20<04:25, 5.20s/it, bpd=3.91, g_l=3.91, gn=3.5, l=3.68, p_l=1.63e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 36% 28/78 [02:26<04:20, 5.21s/it, bpd=3.66, g_l=3.66, gn=3.9, l=3.44, 
p_l=1.64e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 37% 29/78 [02:31<04:15, 5.21s/it, bpd=3.93, g_l=3.93, gn=3.06, l=3.7, p_l=1.64e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 38% 30/78 [02:36<04:10, 5.21s/it, bpd=4.12, g_l=4.12, gn=3.45, l=3.87, p_l=1.69e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 40% 31/78 [02:41<04:04, 5.20s/it, bpd=5.28, g_l=5.28, gn=3.08, l=4.97, p_l=1.71e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 41% 32/78 [02:47<03:59, 5.21s/it, bpd=5.15, g_l=5.15, gn=2.98, l=4.85, p_l=1.78e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 42% 33/78 [02:52<03:54, 5.20s/it, bpd=4.98, g_l=4.98, gn=3.27, l=4.69, p_l=1.85e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 44% 34/78 [02:57<03:48, 5.20s/it, bpd=5.46, g_l=5.46, gn=3.12, l=5.14, p_l=1.92e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 45% 35/78 [03:02<03:43, 5.20s/it, bpd=4.3, g_l=4.3, gn=3.42, l=4.05, p_l=1.77e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 46% 36/78 [03:12<04:42, 6.72s/it, bpd=3.98, g_l=3.98, gn=3.33, l=3.75, p_l=1.76e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 47% 37/78 [03:18<04:16, 6.25s/it, bpd=4.9, g_l=4.9, gn=3.09, l=4.61, p_l=1.76e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 49% 38/78 [03:23<03:56, 5.91s/it, bpd=4.38, g_l=4.38, gn=3.98, l=4.12, p_l=1.59e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 50% 39/78 [03:28<03:42, 5.70s/it, bpd=5.04, g_l=5.04, gn=3.21, l=4.75, p_l=1.52e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 51% 40/78 [03:33<03:31, 5.56s/it, bpd=3.85, g_l=3.85, gn=3.36, l=3.63, p_l=1.47e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 53% 41/78 [03:38<03:22, 5.48s/it, bpd=4.87, g_l=4.87, gn=3.3, l=4.58, p_l=1.51e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 54% 42/78 [03:44<03:15, 5.43s/it, bpd=3.9, g_l=3.9, gn=3.2, l=3.67, p_l=1.51e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 55% 43/78 [03:49<03:08, 5.38s/it, bpd=4.36, g_l=4.36, gn=3.38, l=4.1, 
p_l=1.53e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 56% 44/78 [03:54<03:01, 5.34s/it, bpd=3.62, g_l=3.62, gn=3.17, l=3.41, p_l=1.61e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 58% 45/78 [03:59<02:55, 5.31s/it, bpd=6.43, g_l=6.43, gn=3.32, l=6.06, p_l=1.65e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 59% 46/78 [04:05<02:48, 5.28s/it, bpd=2.87, g_l=2.87, gn=3.47, l=2.7, p_l=1.87e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 60% 47/78 [04:10<02:43, 5.26s/it, bpd=4.05, g_l=4.05, gn=3.36, l=3.82, p_l=2.16e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 62% 48/78 [04:15<02:37, 5.24s/it, bpd=4.93, g_l=4.93, gn=3.26, l=4.64, p_l=2.29e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 63% 49/78 [04:20<02:31, 5.22s/it, bpd=4.23, g_l=4.23, gn=3.38, l=3.98, p_l=2.63e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 64% 50/78 [04:25<02:25, 5.19s/it, bpd=4.25, g_l=4.25, gn=3.66, l=4, p_l=3.17e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 65% 51/78 [04:31<02:20, 5.19s/it, bpd=4.75, g_l=4.75, gn=3.17, l=4.47, p_l=3.94e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 67% 52/78 [04:36<02:14, 5.18s/it, bpd=3.49, g_l=3.49, gn=3, l=3.29, p_l=4.85e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 68% 53/78 [04:41<02:09, 5.19s/it, bpd=3.99, g_l=3.99, gn=4, l=3.75, p_l=5.35e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 69% 54/78 [04:46<02:04, 5.19s/it, bpd=4.79, g_l=4.79, gn=3.08, l=4.51, p_l=5.97e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2619\u001b[0m\n"," 71% 55/78 [05:25<05:53, 15.35s/it, bpd=4.09, g_l=4.09, gn=4.54, l=3.85, p_l=6.33e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 72% 56/78 [05:30<04:31, 12.32s/it, bpd=3.98, g_l=3.98, gn=3.41, l=3.74, p_l=6.49e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 73% 57/78 [05:35<03:32, 10.13s/it, bpd=4.34, g_l=4.34, gn=3.39, l=4.09, p_l=6.56e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 74% 58/78 [05:41<02:52, 8.62s/it, bpd=4.58, 
g_l=4.58, gn=4.52, l=4.31, p_l=6.24e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 76% 59/78 [05:46<02:23, 7.57s/it, bpd=3.72, g_l=3.72, gn=3.03, l=3.5, p_l=5.45e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 77% 60/78 [05:51<02:02, 6.82s/it, bpd=4.33, g_l=4.33, gn=3.3, l=4.08, p_l=4.91e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 78% 61/78 [05:56<01:47, 6.31s/it, bpd=4.23, g_l=4.23, gn=3, l=3.99, p_l=4.22e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 79% 62/78 [06:01<01:35, 5.94s/it, bpd=4.49, g_l=4.49, gn=3.33, l=4.23, p_l=3.61e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 81% 63/78 [06:06<01:25, 5.72s/it, bpd=3.71, g_l=3.71, gn=3.18, l=3.5, p_l=3.28e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 82% 64/78 [06:11<01:17, 5.54s/it, bpd=4.83, g_l=4.83, gn=3.37, l=4.54, p_l=3.01e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 83% 65/78 [06:16<01:10, 5.45s/it, bpd=4.9, g_l=4.9, gn=4.27, l=4.62, p_l=2.93e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 85% 66/78 [06:22<01:04, 5.36s/it, bpd=4.02, g_l=4.02, gn=3.35, l=3.78, p_l=2.84e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 86% 67/78 [06:27<00:58, 5.34s/it, bpd=5.37, g_l=5.37, gn=3.17, l=5.06, p_l=2.87e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 87% 68/78 [06:32<00:52, 5.30s/it, bpd=4.1, g_l=4.1, gn=4.14, l=3.86, p_l=3.15e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 88% 69/78 [06:37<00:47, 5.29s/it, bpd=3.99, g_l=3.99, gn=3.43, l=3.76, p_l=3.43e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 90% 70/78 [06:43<00:42, 5.28s/it, bpd=4.57, g_l=4.57, gn=3.6, l=4.3, p_l=3.47e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 91% 71/78 [06:48<00:37, 5.30s/it, bpd=4.01, g_l=4.01, gn=3.6, l=3.78, p_l=3.35e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 92% 72/78 [06:53<00:31, 5.28s/it, bpd=4.9, g_l=4.9, gn=3.29, l=4.61, p_l=3.33e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 94% 73/78 [06:59<00:26, 5.29s/it, bpd=4.1, g_l=4.1, gn=3.48, l=3.86, 
p_l=3.08e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 95% 74/78 [07:04<00:21, 5.28s/it, bpd=4.4, g_l=4.4, gn=3.16, l=4.14, p_l=2.75e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 96% 75/78 [07:09<00:15, 5.29s/it, bpd=5.13, g_l=5.13, gn=3.21, l=4.83, p_l=2.53e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n","100% 78/78 [07:25<00:00, 5.71s/it, bpd=3.74, g_l=3.74, gn=3.26, l=3.52, p_l=2.86e-7]\n","Train bpd: 4.3915 prime_loss: 0.0000 gen_loss: 4.3915 loss: 4.1332 gn: 3.5389 lr: 0.0003 lg_loss_scale: 16.4100 epoch: 32.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2642\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.11s/it, bpd=5.04, l=4.74]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 22% 2/9 [00:03<00:13, 1.96s/it, bpd=5.16, l=4.86]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:05<00:10, 1.79s/it, bpd=4.86, l=4.57]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 44% 4/9 [00:06<00:08, 1.67s/it, bpd=5.22, l=4.92]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:07<00:06, 1.59s/it, bpd=4.6, l=4.33]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 67% 6/9 [00:09<00:04, 1.54s/it, bpd=5.26, l=4.95]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.52s/it, bpd=4.69, l=4.41]\n","Ema bpd: 4.9119 prime_loss: 0.0125 gen_loss: 4.9119 loss: 4.6233 epoch: 32.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (34).txt\n","/content/gdrive/MyDrive/slon/slon (25).txt\n","/content/gdrive/MyDrive/slon/slon (17).txt\n"," 1% 1/78 [00:05<07:04, 5.52s/it, bpd=2.65, g_l=2.65, gn=3.15, l=2.5, p_l=2.74e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 3% 2/78 [00:10<06:54, 5.46s/it, bpd=4.19, g_l=4.19, gn=4.72, l=3.94, p_l=2.72e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 4% 3/78 [00:16<06:44, 5.39s/it, bpd=3.54, g_l=3.54, gn=2.92, l=3.33, 
p_l=2.35e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 5% 4/78 [00:21<06:36, 5.36s/it, bpd=4.8, g_l=4.8, gn=3.48, l=4.52, p_l=2.26e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 6% 5/78 [00:26<06:28, 5.33s/it, bpd=5.21, g_l=5.21, gn=3.72, l=4.9, p_l=1.89e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 8% 6/78 [00:31<06:22, 5.32s/it, bpd=5.46, g_l=5.46, gn=3.01, l=5.14, p_l=1.59e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 9% 7/78 [00:37<06:15, 5.29s/it, bpd=2.9, g_l=2.9, gn=4.42, l=2.73, p_l=1.2e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 10% 8/78 [00:42<06:10, 5.29s/it, bpd=5.53, g_l=5.53, gn=3.5, l=5.21, p_l=1.02e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 12% 9/78 [00:47<06:02, 5.26s/it, bpd=3.08, g_l=3.08, gn=2.97, l=2.9, p_l=9.36e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 13% 10/78 [00:52<05:56, 5.25s/it, bpd=5.36, g_l=5.36, gn=3.14, l=5.04, p_l=9.14e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 14% 11/78 [00:58<05:50, 5.23s/it, bpd=4.08, g_l=4.08, gn=3.48, l=3.84, p_l=9.23e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 15% 12/78 [01:03<05:44, 5.23s/it, bpd=4.09, g_l=4.09, gn=3.05, l=3.85, p_l=9.94e-8]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 17% 13/78 [01:08<05:38, 5.21s/it, bpd=3.96, g_l=3.96, gn=3.55, l=3.72, p_l=1.08e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 18% 14/78 [01:13<05:32, 5.20s/it, bpd=3.92, g_l=3.92, gn=3.42, l=3.69, p_l=1.14e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 19% 15/78 [01:18<05:26, 5.19s/it, bpd=2.68, g_l=2.68, gn=3.31, l=2.52, p_l=1.16e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 21% 16/78 [01:23<05:21, 5.19s/it, bpd=4.54, g_l=4.54, gn=4.19, l=4.27, p_l=1.19e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 22% 17/78 [01:29<05:16, 5.18s/it, bpd=4.41, g_l=4.41, gn=4.39, l=4.15, p_l=1.05e-7]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 23% 18/78 [01:34<05:11, 5.19s/it, bpd=5.04, g_l=5.04, gn=3.33, l=4.74, p_l=9.81e-8]/content/gdrive/MyDrive/slon/slon 
(16).txt\n"," 24% 19/78 [01:39<05:06, 5.20s/it, bpd=5.16, g_l=5.16, gn=4.32, l=4.85, p_l=9.72e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 26% 20/78 [01:44<05:02, 5.21s/it, bpd=5.15, g_l=5.15, gn=4.07, l=4.85, p_l=9.81e-8]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 27% 21/78 [01:49<04:57, 5.21s/it, bpd=4.38, g_l=4.38, gn=3.61, l=4.13, p_l=1.07e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 28% 22/78 [01:55<04:52, 5.22s/it, bpd=4.42, g_l=4.42, gn=4.22, l=4.16, p_l=1.13e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 29% 23/78 [02:00<04:46, 5.21s/it, bpd=4.15, g_l=4.15, gn=4.1, l=3.91, p_l=1.41e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 31% 24/78 [02:05<04:41, 5.22s/it, bpd=5.03, g_l=5.03, gn=4.11, l=4.73, p_l=1.71e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 32% 25/78 [02:10<04:36, 5.21s/it, bpd=4.43, g_l=4.43, gn=3.83, l=4.17, p_l=1.73e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 33% 26/78 [02:16<04:31, 5.22s/it, bpd=3.03, g_l=3.03, gn=3.46, l=2.85, p_l=1.67e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 35% 27/78 [02:21<04:25, 5.21s/it, bpd=4.31, g_l=4.31, gn=3.74, l=4.06, p_l=1.46e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 36% 28/78 [02:26<04:20, 5.22s/it, bpd=4.02, g_l=4.02, gn=3.48, l=3.78, p_l=1.38e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 37% 29/78 [02:31<04:15, 5.21s/it, bpd=4.12, g_l=4.12, gn=3.07, l=3.88, p_l=1.25e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 38% 30/78 [02:36<04:10, 5.22s/it, bpd=5.25, g_l=5.25, gn=3.35, l=4.94, p_l=1.16e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 40% 31/78 [02:42<04:04, 5.21s/it, bpd=3.78, g_l=3.78, gn=3.03, l=3.56, p_l=1.12e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 41% 32/78 [02:47<03:59, 5.21s/it, bpd=3.63, g_l=3.63, gn=4.39, l=3.41, p_l=1.13e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 42% 33/78 [02:52<03:54, 5.21s/it, bpd=5.03, g_l=5.03, gn=3.2, l=4.73, p_l=1.14e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 44% 34/78 [02:57<03:49, 
5.22s/it, bpd=3.7, g_l=3.7, gn=3.31, l=3.49, p_l=1.14e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 45% 35/78 [03:03<03:44, 5.21s/it, bpd=4.66, g_l=4.66, gn=4.38, l=4.39, p_l=1.1e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 46% 36/78 [03:08<03:39, 5.22s/it, bpd=4.33, g_l=4.33, gn=2.94, l=4.08, p_l=9.81e-8]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 47% 37/78 [03:13<03:33, 5.21s/it, bpd=4.54, g_l=4.54, gn=3.96, l=4.28, p_l=9.14e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 49% 38/78 [03:18<03:28, 5.21s/it, bpd=3.7, g_l=3.7, gn=3.92, l=3.49, p_l=1.05e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 50% 39/78 [03:23<03:23, 5.22s/it, bpd=6.15, g_l=6.15, gn=2.92, l=5.79, p_l=1.12e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 51% 40/78 [03:29<03:18, 5.22s/it, bpd=4.87, g_l=4.87, gn=3.48, l=4.59, p_l=1.22e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 53% 41/78 [03:34<03:13, 5.22s/it, bpd=3.81, g_l=3.81, gn=3.01, l=3.58, p_l=1.34e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 54% 42/78 [03:39<03:08, 5.22s/it, bpd=5.05, g_l=5.05, gn=3.36, l=4.75, p_l=1.46e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 55% 43/78 [03:44<03:02, 5.22s/it, bpd=3.48, g_l=3.48, gn=2.94, l=3.28, p_l=1.63e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 56% 44/78 [03:49<02:57, 5.22s/it, bpd=4.53, g_l=4.53, gn=3.58, l=4.27, p_l=1.82e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 58% 45/78 [03:55<02:51, 5.21s/it, bpd=4.06, g_l=4.06, gn=3.27, l=3.82, p_l=1.85e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 59% 46/78 [04:00<02:46, 5.22s/it, bpd=5.48, g_l=5.48, gn=3.16, l=5.16, p_l=1.83e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 60% 47/78 [04:05<02:41, 5.22s/it, bpd=5.2, g_l=5.2, gn=3.09, l=4.89, p_l=1.84e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 62% 48/78 [04:10<02:36, 5.22s/it, bpd=4.71, g_l=4.71, gn=3.55, l=4.44, p_l=1.69e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 63% 49/78 [04:16<02:31, 5.21s/it, bpd=4.63, g_l=4.63, gn=3.2, 
l=4.36, p_l=1.71e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 64% 50/78 [04:21<02:25, 5.21s/it, bpd=4.72, g_l=4.72, gn=3.91, l=4.44, p_l=1.68e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 65% 51/78 [04:26<02:20, 5.21s/it, bpd=4.98, g_l=4.98, gn=3.68, l=4.68, p_l=1.74e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 67% 52/78 [04:31<02:15, 5.21s/it, bpd=5.56, g_l=5.56, gn=3.11, l=5.23, p_l=1.86e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 68% 53/78 [04:36<02:10, 5.21s/it, bpd=3.75, g_l=3.75, gn=4.05, l=3.53, p_l=1.93e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 69% 54/78 [04:42<02:04, 5.21s/it, bpd=4.66, g_l=4.66, gn=3.33, l=4.39, p_l=2.14e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 71% 55/78 [04:47<01:59, 5.20s/it, bpd=4.19, g_l=4.19, gn=3.15, l=3.95, p_l=2.32e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 72% 56/78 [04:52<01:54, 5.21s/it, bpd=3.68, g_l=3.68, gn=4.06, l=3.46, p_l=2.64e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 73% 57/78 [04:57<01:49, 5.20s/it, bpd=4.32, g_l=4.32, gn=3.43, l=4.06, p_l=2.97e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 74% 58/78 [05:08<02:15, 6.76s/it, bpd=4.14, g_l=4.14, gn=4.63, l=3.9, p_l=2.93e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 76% 59/78 [05:13<01:59, 6.27s/it, bpd=3.79, g_l=3.79, gn=4.75, l=3.57, p_l=2.94e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 77% 60/78 [05:18<01:46, 5.94s/it, bpd=5.36, g_l=5.36, gn=3.61, l=5.05, p_l=3e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 78% 61/78 [05:23<01:37, 5.73s/it, bpd=4.01, g_l=4.01, gn=3.22, l=3.77, p_l=3.07e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 79% 62/78 [05:28<01:29, 5.58s/it, bpd=3.81, g_l=3.81, gn=3.03, l=3.59, p_l=3.44e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 81% 63/78 [05:34<01:22, 5.50s/it, bpd=4.06, g_l=4.06, gn=3.32, l=3.82, p_l=3.94e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 82% 64/78 [05:39<01:15, 5.42s/it, bpd=5.14, g_l=5.14, gn=3.06, l=4.84, 
p_l=4.58e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 83% 65/78 [05:44<01:09, 5.38s/it, bpd=5.86, g_l=5.86, gn=3.75, l=5.52, p_l=4.89e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 85% 66/78 [05:49<01:04, 5.34s/it, bpd=4.2, g_l=4.2, gn=3.9, l=3.95, p_l=5.28e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 86% 67/78 [05:55<00:58, 5.31s/it, bpd=4.57, g_l=4.57, gn=3.73, l=4.3, p_l=5.34e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 87% 68/78 [06:00<00:52, 5.28s/it, bpd=4.1, g_l=4.1, gn=4.58, l=3.86, p_l=5.04e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 88% 69/78 [06:05<00:47, 5.25s/it, bpd=4.43, g_l=4.43, gn=3.3, l=4.17, p_l=4.17e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 90% 70/78 [06:10<00:41, 5.21s/it, bpd=4.78, g_l=4.78, gn=5.56, l=4.5, p_l=3.85e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 91% 71/78 [06:15<00:36, 5.20s/it, bpd=4.56, g_l=4.56, gn=3.19, l=4.29, p_l=3.69e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 92% 72/78 [06:20<00:31, 5.18s/it, bpd=3.49, g_l=3.49, gn=3.34, l=3.29, p_l=3.45e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 94% 73/78 [06:26<00:25, 5.18s/it, bpd=3.48, g_l=3.48, gn=3.04, l=3.27, p_l=3.59e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 95% 74/78 [06:31<00:20, 5.17s/it, bpd=4.17, g_l=4.17, gn=2.79, l=3.92, p_l=3.68e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 96% 75/78 [06:36<00:15, 5.17s/it, bpd=3.83, g_l=3.83, gn=2.95, l=3.6, p_l=4.13e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n","100% 78/78 [06:52<00:00, 5.28s/it, bpd=5.59, g_l=5.59, gn=3.11, l=5.26, p_l=5.76e-7]\n","Train bpd: 4.3974 prime_loss: 0.0000 gen_loss: 4.3974 loss: 4.1387 gn: 3.5739 lr: 0.0003 lg_loss_scale: 16.7220 epoch: 33.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (6).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2720\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.06s/it, bpd=4.88, 
l=4.59]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:13, 1.93s/it, bpd=5.12, l=4.82]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 33% 3/9 [00:05<00:10, 1.77s/it, bpd=5.41, l=5.09]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 44% 4/9 [00:06<00:08, 1.66s/it, bpd=4.59, l=4.32]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.58s/it, bpd=4.74, l=4.46]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 67% 6/9 [00:09<00:04, 1.53s/it, bpd=4.67, l=4.4]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.52s/it, bpd=5.72, l=5.38]\n","Ema bpd: 5.0487 prime_loss: 0.0121 gen_loss: 5.0487 loss: 4.7520 epoch: 33.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (12).txt\n","/content/gdrive/MyDrive/slon/slon (13).txt\n","/content/gdrive/MyDrive/slon/slon (28).txt\n"," 1% 1/78 [00:05<07:07, 5.55s/it, bpd=4.18, g_l=4.18, gn=3.78, l=3.93, p_l=5.8e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 3% 2/78 [00:10<06:54, 5.45s/it, bpd=5.39, g_l=5.39, gn=2.84, l=5.07, p_l=6.08e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 4% 3/78 [00:16<06:44, 5.40s/it, bpd=3.34, g_l=3.34, gn=3.15, l=3.14, p_l=6.38e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 5% 4/78 [00:21<06:37, 5.38s/it, bpd=3.97, g_l=3.97, gn=3.11, l=3.74, p_l=6.75e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 6% 5/78 [00:26<06:30, 5.35s/it, bpd=4.73, g_l=4.73, gn=3.18, l=4.45, p_l=6.98e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 8% 6/78 [00:31<06:24, 5.34s/it, bpd=3.46, g_l=3.46, gn=3, l=3.25, p_l=6.9e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 9% 7/78 [00:37<06:17, 5.31s/it, bpd=3.54, g_l=3.54, gn=2.66, l=3.33, p_l=6.55e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 10% 8/78 [00:42<06:10, 5.29s/it, bpd=3.82, g_l=3.82, gn=4.3, l=3.6, p_l=5.64e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 12% 9/78 [00:47<06:03, 5.27s/it, bpd=3.49, g_l=3.49, gn=2.7, l=3.29, p_l=5.22e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 13% 
10/78 [00:52<05:57, 5.25s/it, bpd=3.5, g_l=3.5, gn=3.77, l=3.29, p_l=5.31e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 14% 11/78 [00:58<05:49, 5.22s/it, bpd=4.58, g_l=4.58, gn=3.74, l=4.31, p_l=5.09e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 15% 12/78 [01:03<05:43, 5.21s/it, bpd=5.27, g_l=5.27, gn=3.47, l=4.96, p_l=4.64e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 17% 13/78 [01:08<05:37, 5.19s/it, bpd=4.46, g_l=4.46, gn=4.22, l=4.19, p_l=4.47e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 18% 14/78 [01:13<05:31, 5.18s/it, bpd=4.21, g_l=4.21, gn=3.75, l=3.96, p_l=4.24e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 19% 15/78 [01:18<05:26, 5.18s/it, bpd=4.08, g_l=4.08, gn=4.09, l=3.84, p_l=3.94e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 21% 16/78 [01:23<05:21, 5.18s/it, bpd=3.66, g_l=3.66, gn=3.62, l=3.44, p_l=3.91e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 22% 17/78 [01:29<05:15, 5.18s/it, bpd=3.56, g_l=3.56, gn=3.47, l=3.35, p_l=3.96e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 23% 18/78 [01:34<05:11, 5.20s/it, bpd=4.59, g_l=4.59, gn=2.88, l=4.32, p_l=4.06e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 24% 19/78 [01:39<05:06, 5.20s/it, bpd=4.89, g_l=4.89, gn=4.6, l=4.6, p_l=4.38e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 26% 20/78 [01:44<05:02, 5.22s/it, bpd=4.75, g_l=4.75, gn=3.51, l=4.47, p_l=4.05e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 27% 21/78 [01:49<04:57, 5.21s/it, bpd=6.18, g_l=6.18, gn=3.52, l=5.82, p_l=3.83e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 28% 22/78 [01:55<04:52, 5.22s/it, bpd=4.94, g_l=4.94, gn=3.18, l=4.65, p_l=3.48e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 29% 23/78 [02:00<04:47, 5.22s/it, bpd=5.4, g_l=5.4, gn=3.64, l=5.08, p_l=2.96e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 31% 24/78 [02:05<04:41, 5.22s/it, bpd=4.39, g_l=4.39, gn=3.87, l=4.13, p_l=2.69e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 32% 25/78 [02:10<04:36, 5.21s/it, bpd=4.18, 
g_l=4.18, gn=3.59, l=3.93, p_l=2.81e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 33% 26/78 [02:16<04:31, 5.22s/it, bpd=4.01, g_l=4.01, gn=3.24, l=3.78, p_l=3.03e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 35% 27/78 [02:21<04:25, 5.21s/it, bpd=5.16, g_l=5.16, gn=2.95, l=4.85, p_l=3.57e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 36% 28/78 [02:26<04:20, 5.21s/it, bpd=4.43, g_l=4.43, gn=3.31, l=4.17, p_l=4.6e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 37% 29/78 [02:31<04:14, 5.20s/it, bpd=4.32, g_l=4.32, gn=6.25, l=4.07, p_l=5.5e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 38% 30/78 [02:36<04:09, 5.20s/it, bpd=4.23, g_l=4.23, gn=3.78, l=3.98, p_l=6.24e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 40% 31/78 [02:41<04:03, 5.19s/it, bpd=4.23, g_l=4.23, gn=3.81, l=3.98, p_l=6.26e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 41% 32/78 [02:47<03:58, 5.19s/it, bpd=3.77, g_l=3.77, gn=3.47, l=3.55, p_l=5.5e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 42% 33/78 [02:52<03:53, 5.19s/it, bpd=4.16, g_l=4.16, gn=3.36, l=3.92, p_l=4.6e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 44% 34/78 [02:57<03:48, 5.19s/it, bpd=5.42, g_l=5.42, gn=3.61, l=5.1, p_l=3.91e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 45% 35/78 [03:02<03:42, 5.18s/it, bpd=5, g_l=5, gn=4.56, l=4.71, p_l=3.87e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 46% 36/78 [03:07<03:37, 5.19s/it, bpd=5.58, g_l=5.58, gn=3.24, l=5.25, p_l=4.03e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 47% 37/78 [03:13<03:32, 5.18s/it, bpd=4.32, g_l=4.32, gn=8.11, l=4.07, p_l=4.02e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 49% 38/78 [03:18<03:27, 5.19s/it, bpd=3.93, g_l=3.93, gn=3.82, l=3.7, p_l=3.76e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 50% 39/78 [03:23<03:22, 5.18s/it, bpd=4.17, g_l=4.17, gn=4.32, l=3.93, p_l=3.27e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 51% 40/78 [03:28<03:17, 5.20s/it, bpd=5.22, g_l=5.22, gn=4.18, l=4.91, 
p_l=2.67e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 53% 41/78 [03:33<03:12, 5.19s/it, bpd=3.69, g_l=3.69, gn=3.04, l=3.47, p_l=2.41e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 54% 42/78 [03:39<03:07, 5.21s/it, bpd=4.5, g_l=4.5, gn=3.16, l=4.24, p_l=2.2e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 55% 43/78 [03:44<03:01, 5.20s/it, bpd=3.28, g_l=3.28, gn=4.55, l=3.09, p_l=2.15e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 56% 44/78 [03:49<02:57, 5.21s/it, bpd=4.74, g_l=4.74, gn=3.31, l=4.46, p_l=2.22e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 58% 45/78 [03:54<02:52, 5.21s/it, bpd=3.04, g_l=3.04, gn=3.12, l=2.86, p_l=2.06e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 59% 46/78 [03:59<02:47, 5.22s/it, bpd=5.05, g_l=5.05, gn=3.47, l=4.75, p_l=2.2e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 60% 47/78 [04:05<02:41, 5.22s/it, bpd=3.99, g_l=3.99, gn=3.56, l=3.75, p_l=2.09e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 62% 48/78 [04:10<02:36, 5.23s/it, bpd=4.9, g_l=4.9, gn=3.65, l=4.61, p_l=2.19e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 63% 49/78 [04:15<02:31, 5.22s/it, bpd=3.57, g_l=3.57, gn=3.47, l=3.36, p_l=2.03e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 64% 50/78 [04:20<02:26, 5.23s/it, bpd=4.11, g_l=4.11, gn=4.06, l=3.86, p_l=2e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 65% 51/78 [04:26<02:20, 5.22s/it, bpd=4.79, g_l=4.79, gn=4.08, l=4.51, p_l=1.99e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 67% 52/78 [04:31<02:15, 5.22s/it, bpd=4.15, g_l=4.15, gn=3.94, l=3.91, p_l=1.99e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 68% 53/78 [04:36<02:10, 5.21s/it, bpd=3.65, g_l=3.65, gn=3.51, l=3.43, p_l=1.78e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 69% 54/78 [04:41<02:05, 5.22s/it, bpd=3.84, g_l=3.84, gn=3.46, l=3.62, p_l=1.83e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 71% 55/78 [04:46<01:59, 5.21s/it, bpd=4.11, g_l=4.11, gn=3.44, l=3.87, p_l=1.95e-7]/content/gdrive/MyDrive/slon/slon 
(29).txt\n"," 72% 56/78 [04:52<01:54, 5.21s/it, bpd=4.59, g_l=4.59, gn=4.49, l=4.32, p_l=2.23e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 73% 57/78 [04:57<01:49, 5.21s/it, bpd=3.95, g_l=3.95, gn=3.35, l=3.72, p_l=2.59e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 74% 58/78 [05:02<01:44, 5.20s/it, bpd=2.91, g_l=2.91, gn=3.37, l=2.74, p_l=3.12e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 76% 59/78 [05:07<01:38, 5.20s/it, bpd=4.16, g_l=4.16, gn=4.09, l=3.92, p_l=3.51e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 77% 60/78 [05:12<01:33, 5.20s/it, bpd=4.04, g_l=4.04, gn=3.9, l=3.8, p_l=3.69e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 78% 61/78 [05:18<01:28, 5.20s/it, bpd=3.92, g_l=3.92, gn=3.74, l=3.69, p_l=3.59e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 79% 62/78 [05:23<01:23, 5.20s/it, bpd=4.19, g_l=4.19, gn=3.56, l=3.94, p_l=3.47e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 81% 63/78 [05:28<01:17, 5.20s/it, bpd=3.8, g_l=3.8, gn=3.5, l=3.58, p_l=3.13e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 82% 64/78 [05:33<01:12, 5.19s/it, bpd=3.03, g_l=3.03, gn=4.63, l=2.85, p_l=2.83e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 83% 65/78 [05:38<01:07, 5.19s/it, bpd=2.91, g_l=2.91, gn=3.46, l=2.74, p_l=2.38e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 85% 66/78 [05:44<01:02, 5.19s/it, bpd=3.88, g_l=3.88, gn=3.44, l=3.66, p_l=2.1e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 86% 67/78 [05:49<00:57, 5.19s/it, bpd=4.59, g_l=4.59, gn=3.29, l=4.32, p_l=1.76e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 87% 68/78 [05:54<00:51, 5.19s/it, bpd=5.27, g_l=5.27, gn=3.66, l=4.96, p_l=1.55e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 88% 69/78 [05:59<00:46, 5.19s/it, bpd=4.39, g_l=4.39, gn=3.4, l=4.14, p_l=1.46e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 90% 70/78 [06:04<00:41, 5.19s/it, bpd=3.24, g_l=3.24, gn=3.08, l=3.04, p_l=1.38e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 91% 71/78 [06:10<00:36, 
5.19s/it, bpd=3.74, g_l=3.74, gn=3.75, l=3.52, p_l=1.4e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 92% 72/78 [06:15<00:31, 5.19s/it, bpd=5.58, g_l=5.58, gn=3.31, l=5.25, p_l=1.44e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 94% 73/78 [06:20<00:25, 5.19s/it, bpd=4.76, g_l=4.76, gn=2.91, l=4.48, p_l=1.44e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 95% 74/78 [06:25<00:20, 5.18s/it, bpd=5.99, g_l=5.99, gn=3.35, l=5.64, p_l=1.36e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 96% 75/78 [06:30<00:15, 5.18s/it, bpd=4.64, g_l=4.64, gn=3.25, l=4.37, p_l=1.25e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n","100% 78/78 [06:46<00:00, 5.21s/it, bpd=3.21, g_l=3.21, gn=3.54, l=3.02, p_l=6.63e-8]\n","Train bpd: 4.2753 prime_loss: 0.0000 gen_loss: 4.2753 loss: 4.0238 gn: 3.6571 lr: 0.0003 lg_loss_scale: 17.0340 epoch: 34.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (6).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2798\u001b[0m\n"," 11% 1/9 [00:01<00:14, 1.76s/it, bpd=3.89, l=3.66]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 22% 2/9 [00:03<00:11, 1.66s/it, bpd=4.92, l=4.63]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 33% 3/9 [00:04<00:09, 1.58s/it, bpd=5.19, l=4.88]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 44% 4/9 [00:05<00:07, 1.53s/it, bpd=5.42, l=5.1]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:05, 1.49s/it, bpd=5.68, l=5.34]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 67% 6/9 [00:08<00:04, 1.46s/it, bpd=4.37, l=4.12]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.46s/it, bpd=4.75, l=4.47]\n","Ema bpd: 4.9745 prime_loss: 0.0121 gen_loss: 4.9745 loss: 4.6822 epoch: 34.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (2).txt\n","/content/gdrive/MyDrive/slon/slon (1).txt\n","/content/gdrive/MyDrive/slon/slon (16).txt\n"," 1% 1/78 [00:05<06:59, 5.45s/it, bpd=3.9, 
g_l=3.9, gn=4.31, l=3.67, p_l=5.96e-8]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 3% 2/78 [00:15<08:46, 6.93s/it, bpd=3.72, g_l=3.72, gn=3.16, l=3.5, p_l=5.15e-8]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 4% 3/78 [00:21<08:01, 6.41s/it, bpd=3.91, g_l=3.91, gn=3.23, l=3.68, p_l=4.7e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 5% 4/78 [00:26<07:29, 6.07s/it, bpd=3, g_l=3, gn=3.3, l=2.82, p_l=5.02e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 6% 5/78 [00:31<07:05, 5.82s/it, bpd=6.4, g_l=6.4, gn=2.97, l=6.02, p_l=5.11e-8]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 8% 6/78 [00:36<06:47, 5.66s/it, bpd=4.07, g_l=4.07, gn=3.83, l=3.83, p_l=5.42e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 9% 7/78 [00:42<06:33, 5.54s/it, bpd=3.81, g_l=3.81, gn=3.38, l=3.58, p_l=5.55e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 10% 8/78 [00:47<06:21, 5.45s/it, bpd=5.25, g_l=5.25, gn=3.63, l=4.95, p_l=5.78e-8]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 12% 9/78 [00:52<06:11, 5.38s/it, bpd=3.35, g_l=3.35, gn=3.59, l=3.16, p_l=6.63e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 13% 10/78 [00:57<06:03, 5.35s/it, bpd=4.09, g_l=4.09, gn=3.45, l=3.85, p_l=7.66e-8]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 14% 11/78 [01:03<05:55, 5.30s/it, bpd=4.84, g_l=4.84, gn=3.84, l=4.56, p_l=8.33e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 15% 12/78 [01:08<05:48, 5.28s/it, bpd=3.89, g_l=3.89, gn=3.87, l=3.66, p_l=7.97e-8]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 17% 13/78 [01:13<05:41, 5.25s/it, bpd=4.9, g_l=4.9, gn=3.66, l=4.61, p_l=7.3e-8]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 18% 14/78 [01:18<05:35, 5.24s/it, bpd=4.45, g_l=4.45, gn=2.94, l=4.19, p_l=6.94e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 19% 15/78 [01:23<05:28, 5.21s/it, bpd=4.02, g_l=4.02, gn=3.07, l=3.79, p_l=7.08e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 21% 16/78 [01:28<05:22, 5.20s/it, bpd=4.2, g_l=4.2, gn=3.21, l=3.96, 
p_l=7.93e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 22% 17/78 [01:34<05:16, 5.19s/it, bpd=4.39, g_l=4.39, gn=3.16, l=4.13, p_l=9.41e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 23% 18/78 [01:39<05:11, 5.20s/it, bpd=3.46, g_l=3.46, gn=3.92, l=3.26, p_l=1.14e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 24% 19/78 [01:44<05:06, 5.19s/it, bpd=4.93, g_l=4.93, gn=3.37, l=4.64, p_l=1.31e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 26% 20/78 [01:49<05:01, 5.20s/it, bpd=4.37, g_l=4.37, gn=3.24, l=4.11, p_l=1.47e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 27% 21/78 [01:54<04:56, 5.20s/it, bpd=4.02, g_l=4.02, gn=3.14, l=3.78, p_l=1.66e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 28% 22/78 [02:00<04:51, 5.20s/it, bpd=3.85, g_l=3.85, gn=3.66, l=3.62, p_l=1.67e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 29% 23/78 [02:05<04:45, 5.20s/it, bpd=4.38, g_l=4.38, gn=3.29, l=4.13, p_l=1.52e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 31% 24/78 [02:10<04:40, 5.20s/it, bpd=3.88, g_l=3.88, gn=3.38, l=3.65, p_l=1.4e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 32% 25/78 [02:15<04:35, 5.20s/it, bpd=3.79, g_l=3.79, gn=3.85, l=3.56, p_l=1.46e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 33% 26/78 [02:20<04:30, 5.20s/it, bpd=6.11, g_l=6.11, gn=3.01, l=5.76, p_l=1.49e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 35% 27/78 [02:26<04:25, 5.20s/it, bpd=4.64, g_l=4.64, gn=3.24, l=4.37, p_l=1.55e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 36% 28/78 [02:31<04:20, 5.20s/it, bpd=4.36, g_l=4.36, gn=4.07, l=4.11, p_l=1.76e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 37% 29/78 [02:36<04:14, 5.20s/it, bpd=4.42, g_l=4.42, gn=3.39, l=4.16, p_l=2.18e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 38% 30/78 [02:41<04:09, 5.20s/it, bpd=5.56, g_l=5.56, gn=3.2, l=5.24, p_l=2.71e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 40% 31/78 [02:46<04:04, 5.20s/it, bpd=5.06, g_l=5.06, gn=3.31, l=4.76, 
p_l=3.16e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 41% 32/78 [02:52<03:59, 5.20s/it, bpd=4.22, g_l=4.22, gn=6.14, l=3.98, p_l=3.35e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 42% 33/78 [02:57<03:54, 5.20s/it, bpd=4.73, g_l=4.73, gn=3.52, l=4.45, p_l=3.74e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 44% 34/78 [03:02<03:48, 5.20s/it, bpd=4.69, g_l=4.69, gn=3.63, l=4.41, p_l=3.73e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 45% 35/78 [03:07<03:43, 5.19s/it, bpd=4.25, g_l=4.25, gn=3.6, l=4, p_l=3.95e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n","\n","Overflow in backward. Loss 2.9198899269104004, grad norm inf, lgscale 17.332000000000416, new lgscale 16.332000000000416\n"," 46% 36/78 [03:12<03:28, 4.96s/it, bpd=4.25, g_l=4.25, gn=3.6, l=4, p_l=3.95e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 47% 37/78 [03:17<03:25, 5.02s/it, bpd=3.93, g_l=3.93, gn=3.22, l=3.7, p_l=4.3e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 49% 38/78 [03:22<03:22, 5.07s/it, bpd=3.82, g_l=3.82, gn=3.22, l=3.6, p_l=4.89e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 50% 39/78 [03:27<03:19, 5.11s/it, bpd=2.75, g_l=2.75, gn=4.47, l=2.59, p_l=5.11e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 51% 40/78 [03:32<03:15, 5.14s/it, bpd=3.81, g_l=3.81, gn=4.66, l=3.59, p_l=5.32e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 53% 41/78 [03:38<03:10, 5.15s/it, bpd=4.13, g_l=4.13, gn=3.25, l=3.89, p_l=5.11e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 54% 42/78 [03:43<03:05, 5.16s/it, bpd=4.73, g_l=4.73, gn=3.07, l=4.46, p_l=4.88e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 55% 43/78 [03:48<03:00, 5.16s/it, bpd=4.11, g_l=4.11, gn=3.25, l=3.87, p_l=4.48e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 56% 44/78 [03:53<02:55, 5.17s/it, bpd=3.22, g_l=3.22, gn=3.26, l=3.03, p_l=3.98e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 58% 45/78 [03:58<02:50, 5.18s/it, bpd=4.48, g_l=4.48, gn=3.37, l=4.22, p_l=3.82e-7]/content/gdrive/MyDrive/slon/slon 
(2).txt\n"," 59% 46/78 [04:04<02:46, 5.19s/it, bpd=4.04, g_l=4.04, gn=3, l=3.81, p_l=3.61e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 60% 47/78 [04:09<02:41, 5.20s/it, bpd=5.49, g_l=5.49, gn=3.16, l=5.17, p_l=3.78e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 62% 48/78 [04:14<02:36, 5.21s/it, bpd=4.19, g_l=4.19, gn=3.15, l=3.94, p_l=3.62e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 63% 49/78 [04:19<02:30, 5.21s/it, bpd=3.92, g_l=3.92, gn=3.98, l=3.69, p_l=3.68e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 64% 50/78 [04:24<02:25, 5.21s/it, bpd=4.43, g_l=4.43, gn=3.24, l=4.17, p_l=3.63e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 65% 51/78 [04:30<02:20, 5.21s/it, bpd=3.84, g_l=3.84, gn=3.26, l=3.62, p_l=3.51e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 67% 52/78 [04:35<02:15, 5.21s/it, bpd=5.51, g_l=5.51, gn=2.94, l=5.19, p_l=3.27e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 68% 53/78 [04:40<02:10, 5.21s/it, bpd=5.09, g_l=5.09, gn=3.57, l=4.79, p_l=3.25e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 69% 54/78 [04:45<02:04, 5.21s/it, bpd=4.49, g_l=4.49, gn=3.19, l=4.22, p_l=3.48e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 71% 55/78 [04:50<01:59, 5.21s/it, bpd=4.92, g_l=4.92, gn=3.02, l=4.63, p_l=4.08e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 72% 56/78 [04:56<01:54, 5.22s/it, bpd=4.52, g_l=4.52, gn=4.53, l=4.26, p_l=4.85e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 73% 57/78 [05:01<01:49, 5.23s/it, bpd=3.67, g_l=3.67, gn=3.3, l=3.45, p_l=5.8e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 74% 58/78 [05:06<01:44, 5.22s/it, bpd=3.88, g_l=3.88, gn=3.18, l=3.65, p_l=6.79e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 76% 59/78 [05:11<01:39, 5.22s/it, bpd=3.6, g_l=3.6, gn=3.12, l=3.39, p_l=7.03e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2857\u001b[0m\n"," 77% 60/78 [05:50<04:34, 15.28s/it, bpd=4.66, g_l=4.66, gn=3.18, l=4.39, 
p_l=6.67e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 78% 61/78 [05:55<03:27, 12.23s/it, bpd=5.64, g_l=5.64, gn=3.45, l=5.31, p_l=6.04e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 79% 62/78 [06:00<02:41, 10.07s/it, bpd=4.92, g_l=4.92, gn=3.98, l=4.63, p_l=5.17e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 81% 63/78 [06:05<02:08, 8.59s/it, bpd=3.98, g_l=3.98, gn=4.28, l=3.75, p_l=4.2e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 82% 64/78 [06:10<01:45, 7.53s/it, bpd=4.35, g_l=4.35, gn=3.05, l=4.09, p_l=4.04e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 83% 65/78 [06:16<01:28, 6.80s/it, bpd=4.52, g_l=4.52, gn=2.99, l=4.25, p_l=4.66e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 85% 66/78 [06:21<01:15, 6.29s/it, bpd=4.78, g_l=4.78, gn=3.28, l=4.5, p_l=5.43e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 86% 67/78 [06:26<01:05, 5.95s/it, bpd=3.84, g_l=3.84, gn=3.25, l=3.61, p_l=5.68e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 87% 68/78 [06:31<00:57, 5.70s/it, bpd=5.94, g_l=5.94, gn=4.25, l=5.59, p_l=5.8e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 88% 69/78 [06:36<00:50, 5.56s/it, bpd=4.52, g_l=4.52, gn=7.08, l=4.25, p_l=5.34e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 90% 70/78 [06:41<00:43, 5.44s/it, bpd=3.94, g_l=3.94, gn=3.1, l=3.7, p_l=4.77e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 91% 71/78 [06:47<00:37, 5.37s/it, bpd=3.31, g_l=3.31, gn=3.58, l=3.11, p_l=4.61e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 92% 72/78 [06:52<00:31, 5.32s/it, bpd=3.14, g_l=3.14, gn=3.36, l=2.95, p_l=4.55e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 94% 73/78 [06:57<00:26, 5.30s/it, bpd=3.81, g_l=3.81, gn=4.14, l=3.58, p_l=4.6e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 95% 74/78 [07:02<00:21, 5.29s/it, bpd=4.55, g_l=4.55, gn=3.55, l=4.28, p_l=4.58e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 96% 75/78 [07:07<00:15, 5.27s/it, bpd=4.09, g_l=4.09, gn=3.38, l=3.85, 
p_l=4.53e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n","100% 78/78 [07:24<00:00, 5.70s/it, bpd=4.01, g_l=4.01, gn=3.27, l=3.77, p_l=3.61e-7]\n","Train bpd: 4.3139 prime_loss: 0.0000 gen_loss: 4.3139 loss: 4.0601 gn: 3.5277 lr: 0.0003 lg_loss_scale: 16.7985 epoch: 35.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (6).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (6).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2875\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.07s/it, bpd=5.31, l=5]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:13, 1.94s/it, bpd=5.15, l=4.84]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 33% 3/9 [00:05<00:10, 1.78s/it, bpd=5.46, l=5.14]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 44% 4/9 [00:06<00:08, 1.67s/it, bpd=3.97, l=3.74]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.59s/it, bpd=5.11, l=4.81]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.54s/it, bpd=5.42, l=5.1]/content/gdrive/MyDrive/slon/slon (5).txt\n","100% 9/9 [00:13<00:00, 1.52s/it, bpd=4.84, l=4.55]\n","Ema bpd: 5.1395 prime_loss: 0.0119 gen_loss: 5.1395 loss: 4.8375 epoch: 35.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (17).txt\n","/content/gdrive/MyDrive/slon/slon (27).txt\n","/content/gdrive/MyDrive/slon/slon (15).txt\n"," 1% 1/78 [00:05<06:53, 5.37s/it, bpd=3.61, g_l=3.61, gn=3.49, l=3.4, p_l=3.11e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 3% 2/78 [00:10<06:44, 5.32s/it, bpd=4.08, g_l=4.08, gn=2.93, l=3.84, p_l=2.71e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 4% 3/78 [00:15<06:36, 5.29s/it, bpd=4.71, g_l=4.71, gn=3.32, l=4.43, p_l=2.43e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 5% 4/78 [00:21<06:29, 5.27s/it, bpd=4.11, g_l=4.11, gn=3.83, l=3.87, p_l=2.23e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 6% 5/78 [00:26<06:24, 5.27s/it, bpd=3.36, g_l=3.36, gn=3.08, l=3.16, 
p_l=1.96e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 8% 6/78 [00:31<06:19, 5.27s/it, bpd=3.81, g_l=3.81, gn=4.87, l=3.59, p_l=1.64e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 9% 7/78 [00:36<06:14, 5.27s/it, bpd=5.97, g_l=5.97, gn=2.87, l=5.62, p_l=1.46e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 10% 8/78 [00:42<06:07, 5.25s/it, bpd=3.96, g_l=3.96, gn=3.63, l=3.73, p_l=1.29e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 12% 9/78 [00:47<06:02, 5.25s/it, bpd=3.74, g_l=3.74, gn=3.06, l=3.52, p_l=1.29e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 13% 10/78 [00:52<05:56, 5.24s/it, bpd=4.01, g_l=4.01, gn=4.1, l=3.78, p_l=1.3e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [00:57<05:50, 5.24s/it, bpd=4.03, g_l=4.03, gn=3.12, l=3.79, p_l=1.24e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 15% 12/78 [01:02<05:44, 5.22s/it, bpd=3.49, g_l=3.49, gn=5.2, l=3.29, p_l=1.12e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 17% 13/78 [01:08<05:39, 5.22s/it, bpd=3.64, g_l=3.64, gn=3.31, l=3.43, p_l=1.04e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 18% 14/78 [01:13<05:33, 5.21s/it, bpd=4.11, g_l=4.11, gn=3.33, l=3.87, p_l=9.99e-8]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 19% 15/78 [01:18<05:28, 5.21s/it, bpd=3.82, g_l=3.82, gn=3.28, l=3.6, p_l=9.85e-8]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 21% 16/78 [01:23<05:22, 5.20s/it, bpd=5, g_l=5, gn=4.32, l=4.71, p_l=1.01e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 22% 17/78 [01:28<05:17, 5.20s/it, bpd=4.26, g_l=4.26, gn=3.36, l=4.01, p_l=1.17e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 23% 18/78 [01:34<05:11, 5.20s/it, bpd=4.95, g_l=4.95, gn=3.56, l=4.66, p_l=1.48e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 24% 19/78 [01:39<05:06, 5.20s/it, bpd=4.36, g_l=4.36, gn=2.94, l=4.11, p_l=1.85e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 26% 20/78 [01:44<05:00, 5.18s/it, bpd=5.31, g_l=5.31, gn=3.81, l=5, p_l=2.06e-7]/content/gdrive/MyDrive/slon/slon 
(16).txt\n"," 27% 21/78 [01:49<04:55, 5.19s/it, bpd=3.31, g_l=3.31, gn=3.32, l=3.11, p_l=2.17e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 28% 22/78 [01:54<04:50, 5.19s/it, bpd=5.1, g_l=5.1, gn=3.33, l=4.8, p_l=2.33e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n","\n","Overflow in backward. Loss 4.544325828552246, grad norm nan, lgscale 16.588000000000427, new lgscale 15.588000000000426\n"," 29% 23/78 [01:59<04:32, 4.96s/it, bpd=5.1, g_l=5.1, gn=3.33, l=4.8, p_l=2.33e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 31% 24/78 [02:04<04:31, 5.02s/it, bpd=4.88, g_l=4.88, gn=2.99, l=4.59, p_l=2.41e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 32% 25/78 [02:09<04:29, 5.08s/it, bpd=4.59, g_l=4.59, gn=3.4, l=4.32, p_l=2.44e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 33% 26/78 [02:20<05:51, 6.77s/it, bpd=4.22, g_l=4.22, gn=3.25, l=3.97, p_l=2.59e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 35% 27/78 [02:25<05:19, 6.26s/it, bpd=4.02, g_l=4.02, gn=3.65, l=3.79, p_l=2.45e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 36% 28/78 [02:30<04:56, 5.94s/it, bpd=4.32, g_l=4.32, gn=3.1, l=4.07, p_l=2.32e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 37% 29/78 [02:35<04:39, 5.71s/it, bpd=5.29, g_l=5.29, gn=3.01, l=4.98, p_l=2.21e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 38% 30/78 [02:41<04:27, 5.58s/it, bpd=4.21, g_l=4.21, gn=3.45, l=3.96, p_l=2.12e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 40% 31/78 [02:46<04:18, 5.49s/it, bpd=2.8, g_l=2.8, gn=3.92, l=2.64, p_l=2.06e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 41% 32/78 [02:51<04:10, 5.44s/it, bpd=3.93, g_l=3.93, gn=3.69, l=3.7, p_l=2.17e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 42% 33/78 [02:56<04:02, 5.38s/it, bpd=4.38, g_l=4.38, gn=3.86, l=4.12, p_l=2.3e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 44% 34/78 [03:02<03:55, 5.34s/it, bpd=4.84, g_l=4.84, gn=3.92, l=4.56, p_l=2.36e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 45% 35/78 [03:07<03:48, 5.31s/it, 
bpd=5.06, g_l=5.06, gn=3.5, l=4.76, p_l=2.42e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 46% 36/78 [03:12<03:41, 5.27s/it, bpd=5.38, g_l=5.38, gn=4.27, l=5.06, p_l=2.46e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 47% 37/78 [03:17<03:34, 5.24s/it, bpd=3.6, g_l=3.6, gn=3.65, l=3.39, p_l=2.33e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 49% 38/78 [03:22<03:28, 5.21s/it, bpd=3.68, g_l=3.68, gn=3.05, l=3.47, p_l=1.99e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 50% 39/78 [03:28<03:22, 5.19s/it, bpd=3.63, g_l=3.63, gn=3.47, l=3.42, p_l=1.83e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 51% 40/78 [03:33<03:16, 5.17s/it, bpd=3.87, g_l=3.87, gn=5.64, l=3.64, p_l=1.67e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 53% 41/78 [03:38<03:10, 5.16s/it, bpd=4.85, g_l=4.85, gn=3.48, l=4.56, p_l=1.61e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 54% 42/78 [03:43<03:05, 5.16s/it, bpd=4.99, g_l=4.99, gn=3.69, l=4.69, p_l=1.62e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 55% 43/78 [03:48<03:00, 5.15s/it, bpd=4.61, g_l=4.61, gn=3.2, l=4.34, p_l=1.58e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 56% 44/78 [03:53<02:55, 5.16s/it, bpd=3.9, g_l=3.9, gn=3.87, l=3.67, p_l=1.61e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 58% 45/78 [03:58<02:50, 5.17s/it, bpd=4.77, g_l=4.77, gn=4.64, l=4.49, p_l=1.68e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 59% 46/78 [04:04<02:45, 5.17s/it, bpd=4.69, g_l=4.69, gn=3.5, l=4.41, p_l=1.48e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 60% 47/78 [04:09<02:40, 5.18s/it, bpd=4.35, g_l=4.35, gn=6.07, l=4.1, p_l=1.29e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 62% 48/78 [04:14<02:35, 5.19s/it, bpd=4.01, g_l=4.01, gn=3.63, l=3.77, p_l=1.08e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 63% 49/78 [04:19<02:30, 5.20s/it, bpd=5.56, g_l=5.56, gn=3.64, l=5.23, p_l=9.99e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 64% 50/78 [04:24<02:25, 5.21s/it, bpd=4.67, g_l=4.67, gn=3.84, l=4.39, 
p_l=8.96e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 65% 51/78 [04:30<02:21, 5.22s/it, bpd=3.27, g_l=3.27, gn=3.32, l=3.08, p_l=8.87e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 67% 52/78 [04:35<02:15, 5.22s/it, bpd=3.9, g_l=3.9, gn=3.36, l=3.67, p_l=9.81e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 68% 53/78 [04:40<02:10, 5.23s/it, bpd=4.19, g_l=4.19, gn=3.49, l=3.95, p_l=1.25e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 69% 54/78 [04:45<02:05, 5.22s/it, bpd=3.06, g_l=3.06, gn=3.41, l=2.88, p_l=1.63e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 71% 55/78 [04:51<02:00, 5.23s/it, bpd=4.08, g_l=4.08, gn=3.25, l=3.84, p_l=2.08e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 72% 56/78 [04:56<01:54, 5.22s/it, bpd=4.07, g_l=4.07, gn=3.44, l=3.83, p_l=2.63e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 73% 57/78 [05:01<01:49, 5.22s/it, bpd=4.14, g_l=4.14, gn=3.44, l=3.9, p_l=3.33e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 74% 58/78 [05:06<01:44, 5.20s/it, bpd=4.56, g_l=4.56, gn=3.89, l=4.29, p_l=3.82e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 76% 59/78 [05:11<01:38, 5.20s/it, bpd=5.1, g_l=5.1, gn=3.15, l=4.8, p_l=4.16e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 77% 60/78 [05:17<01:33, 5.20s/it, bpd=4.84, g_l=4.84, gn=3.51, l=4.56, p_l=4.16e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 78% 61/78 [05:22<01:28, 5.20s/it, bpd=3.9, g_l=3.9, gn=3.28, l=3.67, p_l=4.34e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 79% 62/78 [05:27<01:23, 5.19s/it, bpd=4.27, g_l=4.27, gn=4.27, l=4.02, p_l=4.16e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 81% 63/78 [05:32<01:17, 5.20s/it, bpd=4.47, g_l=4.47, gn=3.05, l=4.2, p_l=3.66e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 82% 64/78 [05:37<01:12, 5.19s/it, bpd=4.55, g_l=4.55, gn=3.04, l=4.28, p_l=3.45e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 83% 65/78 [05:43<01:07, 5.19s/it, bpd=4.25, g_l=4.25, gn=3.23, l=4, p_l=3.51e-7]/content/gdrive/MyDrive/slon/slon 
(17).txt\n"," 85% 66/78 [05:48<01:02, 5.18s/it, bpd=3.84, g_l=3.84, gn=3.08, l=3.61, p_l=3.86e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 86% 67/78 [05:53<00:57, 5.18s/it, bpd=4.39, g_l=4.39, gn=3.36, l=4.13, p_l=4.07e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 87% 68/78 [05:58<00:51, 5.18s/it, bpd=3.83, g_l=3.83, gn=3.2, l=3.6, p_l=4.12e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 88% 69/78 [06:03<00:46, 5.19s/it, bpd=3.96, g_l=3.96, gn=3.17, l=3.73, p_l=4.28e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 90% 70/78 [06:08<00:41, 5.18s/it, bpd=5.47, g_l=5.47, gn=3.37, l=5.15, p_l=4.28e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 91% 71/78 [06:14<00:36, 5.19s/it, bpd=3.94, g_l=3.94, gn=4.94, l=3.71, p_l=4.34e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 92% 72/78 [06:19<00:31, 5.19s/it, bpd=4.41, g_l=4.41, gn=3.41, l=4.15, p_l=4.13e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 94% 73/78 [06:24<00:25, 5.18s/it, bpd=4.2, g_l=4.2, gn=3.98, l=3.96, p_l=3.88e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n","\n","Overflow in backward. 
Loss 4.100964546203613, grad norm nan, lgscale 15.788000000000434, new lgscale 14.788000000000434\n"," 95% 74/78 [06:28<00:19, 4.95s/it, bpd=4.2, g_l=4.2, gn=3.98, l=3.96, p_l=3.88e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 96% 75/78 [06:34<00:15, 5.01s/it, bpd=4.16, g_l=4.16, gn=3.36, l=3.92, p_l=4.05e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n","100% 78/78 [06:49<00:00, 5.26s/it, bpd=5.91, g_l=5.91, gn=3.15, l=5.57, p_l=5.47e-7]\n","Train bpd: 4.3087 prime_loss: 0.0000 gen_loss: 4.3087 loss: 4.0553 gn: 3.5755 lr: 0.0003 lg_loss_scale: 15.8868 epoch: 36.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (6).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:2951\u001b[0m\n"," 11% 1/9 [00:01<00:15, 1.97s/it, bpd=5.16, l=4.86]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 22% 2/9 [00:03<00:13, 1.87s/it, bpd=5.9, l=5.55]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 33% 3/9 [00:04<00:10, 1.73s/it, bpd=4, l=3.77]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 44% 4/9 [00:06<00:08, 1.63s/it, bpd=4.97, l=4.68]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:07<00:06, 1.56s/it, bpd=5.28, l=4.97]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 67% 6/9 [00:09<00:04, 1.51s/it, bpd=4.6, l=4.33]/content/gdrive/MyDrive/slon/slon (5).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=4.93, l=4.64]\n","Ema bpd: 5.0274 prime_loss: 0.0116 gen_loss: 5.0274 loss: 4.7319 epoch: 36.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (35).txt\n","/content/gdrive/MyDrive/slon/slon (13).txt\n","/content/gdrive/MyDrive/slon/slon (24).txt\n"," 1% 1/78 [00:05<07:06, 5.54s/it, bpd=4.47, g_l=4.47, gn=3.27, l=4.21, p_l=5.41e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 3% 2/78 [00:10<06:54, 5.45s/it, bpd=4.72, g_l=4.72, gn=2.82, l=4.44, p_l=5.5e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 4% 3/78 [00:16<06:44, 5.39s/it, bpd=4.79, g_l=4.79, 
gn=3.51, l=4.51, p_l=5.58e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 5% 4/78 [00:21<06:37, 5.37s/it, bpd=4.84, g_l=4.84, gn=3.14, l=4.55, p_l=5.9e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 6% 5/78 [00:26<06:29, 5.34s/it, bpd=4.04, g_l=4.04, gn=2.94, l=3.8, p_l=5.73e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 8% 6/78 [00:31<06:23, 5.32s/it, bpd=3.93, g_l=3.93, gn=4.67, l=3.7, p_l=6.37e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 9% 7/78 [00:37<06:16, 5.30s/it, bpd=4.79, g_l=4.79, gn=3.16, l=4.51, p_l=6.28e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 10% 8/78 [00:42<06:10, 5.29s/it, bpd=4.99, g_l=4.99, gn=3.48, l=4.7, p_l=6.28e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 12% 9/78 [00:47<06:03, 5.27s/it, bpd=5.27, g_l=5.27, gn=3.51, l=4.96, p_l=6.16e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 13% 10/78 [00:52<05:56, 5.25s/it, bpd=3.92, g_l=3.92, gn=3.65, l=3.69, p_l=6.29e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [00:57<05:49, 5.22s/it, bpd=4.37, g_l=4.37, gn=3.76, l=4.11, p_l=6.71e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 15% 12/78 [01:03<05:43, 5.20s/it, bpd=3.51, g_l=3.51, gn=3.18, l=3.31, p_l=7.14e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 17% 13/78 [01:08<05:36, 5.18s/it, bpd=3.8, g_l=3.8, gn=3.74, l=3.58, p_l=8.22e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 18% 14/78 [01:13<05:30, 5.17s/it, bpd=4.36, g_l=4.36, gn=4.29, l=4.1, p_l=1.03e-6]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 19% 15/78 [01:18<05:25, 5.17s/it, bpd=4.41, g_l=4.41, gn=3.24, l=4.15, p_l=1.2e-6]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 21% 16/78 [01:23<05:20, 5.17s/it, bpd=3.9, g_l=3.9, gn=3.26, l=3.67, p_l=1.26e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 22% 17/78 [01:28<05:16, 5.19s/it, bpd=4.15, g_l=4.15, gn=3.37, l=3.9, p_l=1.16e-6]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 23% 18/78 [01:34<05:11, 5.20s/it, bpd=4.76, g_l=4.76, gn=3.4, l=4.48, p_l=1e-6]/content/gdrive/MyDrive/slon/slon 
(2).txt\n"," 24% 19/78 [01:39<05:07, 5.21s/it, bpd=4.56, g_l=4.56, gn=3.62, l=4.3, p_l=8.14e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 26% 20/78 [01:44<05:02, 5.21s/it, bpd=4.39, g_l=4.39, gn=4.85, l=4.14, p_l=6.57e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 27% 21/78 [01:49<04:57, 5.22s/it, bpd=3.87, g_l=3.87, gn=3.52, l=3.64, p_l=5.31e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 28% 22/78 [01:55<04:52, 5.22s/it, bpd=3.02, g_l=3.02, gn=6, l=2.85, p_l=4.55e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 29% 23/78 [02:00<04:47, 5.22s/it, bpd=4.57, g_l=4.57, gn=3.49, l=4.3, p_l=4.07e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 31% 24/78 [02:05<04:41, 5.22s/it, bpd=3.9, g_l=3.9, gn=3.36, l=3.67, p_l=3.6e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 32% 25/78 [02:10<04:36, 5.22s/it, bpd=5.05, g_l=5.05, gn=3.5, l=4.75, p_l=3.46e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 33% 26/78 [02:15<04:30, 5.21s/it, bpd=4.65, g_l=4.65, gn=3.32, l=4.38, p_l=3.39e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 35% 27/78 [02:21<04:25, 5.21s/it, bpd=2.92, g_l=2.92, gn=3.05, l=2.75, p_l=3.45e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 36% 28/78 [02:26<04:20, 5.21s/it, bpd=3.52, g_l=3.52, gn=4.56, l=3.31, p_l=3.43e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 37% 29/78 [02:31<04:15, 5.21s/it, bpd=6.24, g_l=6.24, gn=4.15, l=5.87, p_l=3.55e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 38% 30/78 [02:36<04:09, 5.20s/it, bpd=3.96, g_l=3.96, gn=3.22, l=3.73, p_l=3.87e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 40% 31/78 [02:41<04:04, 5.20s/it, bpd=5.58, g_l=5.58, gn=2.98, l=5.26, p_l=3.91e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 41% 32/78 [02:47<03:58, 5.20s/it, bpd=3.98, g_l=3.98, gn=3.46, l=3.74, p_l=3.95e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 42% 33/78 [02:52<03:53, 5.19s/it, bpd=2.89, g_l=2.89, gn=4.08, l=2.72, p_l=3.73e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 44% 34/78 [02:57<03:48, 
5.19s/it, bpd=4.91, g_l=4.91, gn=3.98, l=4.62, p_l=3.91e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 45% 35/78 [03:02<03:42, 5.18s/it, bpd=4.14, g_l=4.14, gn=3.64, l=3.9, p_l=4.23e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 46% 36/78 [03:07<03:37, 5.18s/it, bpd=5.02, g_l=5.02, gn=3.52, l=4.72, p_l=4.63e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 47% 37/78 [03:13<03:32, 5.18s/it, bpd=3.79, g_l=3.79, gn=5.05, l=3.57, p_l=4.38e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 49% 38/78 [03:18<03:26, 5.17s/it, bpd=4.83, g_l=4.83, gn=3.15, l=4.54, p_l=4.42e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 50% 39/78 [03:23<03:21, 5.18s/it, bpd=4.04, g_l=4.04, gn=3.32, l=3.8, p_l=4.37e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 51% 40/78 [03:28<03:16, 5.18s/it, bpd=4.91, g_l=4.91, gn=3.35, l=4.62, p_l=4.3e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 53% 41/78 [03:33<03:11, 5.17s/it, bpd=4.77, g_l=4.77, gn=3.08, l=4.49, p_l=3.99e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 54% 42/78 [03:38<03:06, 5.19s/it, bpd=4.51, g_l=4.51, gn=5.86, l=4.25, p_l=4.32e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 55% 43/78 [03:44<03:01, 5.19s/it, bpd=4.3, g_l=4.3, gn=3.34, l=4.04, p_l=4.39e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 56% 44/78 [03:49<02:56, 5.20s/it, bpd=4.63, g_l=4.63, gn=3.31, l=4.36, p_l=4.77e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 58% 45/78 [03:54<02:51, 5.20s/it, bpd=4.48, g_l=4.48, gn=3.9, l=4.21, p_l=5.66e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 59% 46/78 [03:59<02:46, 5.21s/it, bpd=4.81, g_l=4.81, gn=3.01, l=4.53, p_l=6.34e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 60% 47/78 [04:05<02:41, 5.21s/it, bpd=3.76, g_l=3.76, gn=3.09, l=3.54, p_l=7.17e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 62% 48/78 [04:10<02:36, 5.21s/it, bpd=3, g_l=3, gn=3.02, l=2.82, p_l=8.13e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 63% 49/78 [04:20<03:18, 6.85s/it, bpd=4.54, g_l=4.54, gn=2.82, l=4.28, 
p_l=9.07e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 64% 50/78 [04:26<02:57, 6.34s/it, bpd=3.51, g_l=3.51, gn=3.23, l=3.3, p_l=1.04e-6]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 65% 51/78 [04:31<02:42, 6.00s/it, bpd=3.91, g_l=3.91, gn=5.74, l=3.68, p_l=1.16e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 67% 52/78 [04:36<02:29, 5.76s/it, bpd=3.91, g_l=3.91, gn=2.98, l=3.68, p_l=1.24e-6]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 68% 53/78 [04:41<02:20, 5.61s/it, bpd=4.45, g_l=4.45, gn=3.42, l=4.19, p_l=1.21e-6]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 69% 54/78 [04:47<02:12, 5.51s/it, bpd=6.36, g_l=6.36, gn=3.09, l=5.98, p_l=1.06e-6]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 71% 55/78 [04:52<02:05, 5.44s/it, bpd=4.19, g_l=4.19, gn=3.29, l=3.94, p_l=8.46e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 72% 56/78 [04:57<01:58, 5.38s/it, bpd=5.43, g_l=5.43, gn=3.81, l=5.11, p_l=6.53e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 73% 57/78 [05:02<01:51, 5.33s/it, bpd=3.56, g_l=3.56, gn=3.13, l=3.35, p_l=5.07e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 74% 58/78 [05:07<01:46, 5.30s/it, bpd=3.86, g_l=3.86, gn=6.94, l=3.63, p_l=4.48e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 76% 59/78 [05:13<01:40, 5.26s/it, bpd=4.84, g_l=4.84, gn=5.12, l=4.56, p_l=4.34e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 77% 60/78 [05:18<01:34, 5.24s/it, bpd=4.18, g_l=4.18, gn=3.74, l=3.93, p_l=3.93e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 78% 61/78 [05:23<01:28, 5.22s/it, bpd=4.14, g_l=4.14, gn=3.88, l=3.89, p_l=3.79e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 79% 62/78 [05:28<01:23, 5.20s/it, bpd=4.38, g_l=4.38, gn=3.43, l=4.12, p_l=3.79e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 81% 63/78 [05:33<01:17, 5.18s/it, bpd=5.04, g_l=5.04, gn=3.52, l=4.75, p_l=3.76e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 82% 64/78 [05:38<01:12, 5.18s/it, bpd=5.06, g_l=5.06, gn=3.09, l=4.76, 
p_l=3.69e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 83% 65/78 [05:44<01:07, 5.19s/it, bpd=3.9, g_l=3.9, gn=3.19, l=3.67, p_l=3.26e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 85% 66/78 [05:49<01:02, 5.20s/it, bpd=4.89, g_l=4.89, gn=3.1, l=4.6, p_l=2.73e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 86% 67/78 [05:54<00:57, 5.20s/it, bpd=5.01, g_l=5.01, gn=3.06, l=4.71, p_l=2.19e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 87% 68/78 [05:59<00:52, 5.20s/it, bpd=3.49, g_l=3.49, gn=3.59, l=3.29, p_l=1.76e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 88% 69/78 [06:05<00:46, 5.20s/it, bpd=3.78, g_l=3.78, gn=3.01, l=3.56, p_l=1.31e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 90% 70/78 [06:10<00:41, 5.20s/it, bpd=3.85, g_l=3.85, gn=2.94, l=3.63, p_l=1.1e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 91% 71/78 [06:15<00:36, 5.21s/it, bpd=4.14, g_l=4.14, gn=4.08, l=3.9, p_l=9.76e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 92% 72/78 [06:20<00:31, 5.21s/it, bpd=3.6, g_l=3.6, gn=3.92, l=3.39, p_l=9.18e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 94% 73/78 [06:25<00:26, 5.22s/it, bpd=5.15, g_l=5.15, gn=3.17, l=4.85, p_l=8.96e-8]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 95% 74/78 [06:31<00:20, 5.21s/it, bpd=5.1, g_l=5.1, gn=3.22, l=4.8, p_l=8.11e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 96% 75/78 [06:36<00:15, 5.22s/it, bpd=4.17, g_l=4.17, gn=3.63, l=3.92, p_l=8.2e-8]/content/gdrive/MyDrive/slon/slon (32).txt\n","100% 78/78 [06:52<00:00, 5.28s/it, bpd=4.83, g_l=4.83, gn=5.32, l=4.55, p_l=6.09e-8]\n","Train bpd: 4.3410 prime_loss: 0.0000 gen_loss: 4.3410 loss: 4.0856 gn: 3.6457 lr: 0.0003 lg_loss_scale: 14.9580 epoch: 37.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (9).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:3029\u001b[0m\n"," 11% 1/9 [00:01<00:15, 1.90s/it, bpd=5.08, 
l=4.78]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 22% 2/9 [00:03<00:13, 1.92s/it, bpd=6.01, l=5.66]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 33% 3/9 [00:05<00:10, 1.76s/it, bpd=5.19, l=4.89]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 44% 4/9 [00:06<00:08, 1.65s/it, bpd=4.89, l=4.6]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 56% 5/9 [00:08<00:06, 1.57s/it, bpd=4.75, l=4.47]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=4.58, l=4.31]/content/gdrive/MyDrive/slon/slon (6).txt\n","100% 9/9 [00:13<00:00, 1.53s/it, bpd=5.47, l=5.15]\n","Ema bpd: 5.2534 prime_loss: 0.0113 gen_loss: 5.2534 loss: 4.9447 epoch: 37.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (30).txt\n","/content/gdrive/MyDrive/slon/slon (12).txt\n","/content/gdrive/MyDrive/slon/slon (16).txt\n"," 1% 1/78 [00:05<06:53, 5.38s/it, bpd=5.78, g_l=5.78, gn=3.45, l=5.44, p_l=5.73e-8]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 3% 2/78 [00:10<06:44, 5.32s/it, bpd=4.32, g_l=4.32, gn=3.52, l=4.06, p_l=5.55e-8]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 4% 3/78 [00:15<06:36, 5.28s/it, bpd=4.73, g_l=4.73, gn=3.16, l=4.45, p_l=5.46e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 5% 4/78 [00:21<06:31, 5.29s/it, bpd=4.65, g_l=4.65, gn=3.98, l=4.37, p_l=5.46e-8]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 6% 5/78 [00:26<06:25, 5.28s/it, bpd=4.71, g_l=4.71, gn=3.31, l=4.43, p_l=5.87e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 8% 6/78 [00:31<06:21, 5.29s/it, bpd=3.95, g_l=3.95, gn=3.35, l=3.71, p_l=6.14e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 9% 7/78 [00:36<06:14, 5.28s/it, bpd=6.38, g_l=6.38, gn=3.36, l=6.01, p_l=6.94e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 10% 8/78 [00:42<06:09, 5.28s/it, bpd=3.81, g_l=3.81, gn=2.87, l=3.59, p_l=7.03e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 12% 9/78 [00:47<06:03, 5.26s/it, bpd=4.33, g_l=4.33, gn=3.98, l=4.07, p_l=7.35e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 
13% 10/78 [00:52<05:57, 5.26s/it, bpd=3.91, g_l=3.91, gn=3.32, l=3.68, p_l=7.08e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 14% 11/78 [00:57<05:50, 5.23s/it, bpd=4.75, g_l=4.75, gn=3.34, l=4.47, p_l=7.57e-8]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 15% 12/78 [01:02<05:43, 5.21s/it, bpd=3.18, g_l=3.18, gn=3.71, l=2.99, p_l=8.02e-8]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 17% 13/78 [01:08<05:37, 5.19s/it, bpd=4.24, g_l=4.24, gn=3.09, l=3.99, p_l=8.46e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 18% 14/78 [01:13<05:34, 5.22s/it, bpd=4.81, g_l=4.81, gn=3.16, l=4.52, p_l=8.55e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 19% 15/78 [01:18<05:27, 5.20s/it, bpd=3.95, g_l=3.95, gn=3.55, l=3.72, p_l=9.18e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 21% 16/78 [01:23<05:21, 5.18s/it, bpd=2.72, g_l=2.72, gn=3.96, l=2.56, p_l=9e-8]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 22% 17/78 [01:28<05:16, 5.19s/it, bpd=3.96, g_l=3.96, gn=3.88, l=3.73, p_l=8.29e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 23% 18/78 [01:34<05:10, 5.18s/it, bpd=3.89, g_l=3.89, gn=3.14, l=3.66, p_l=7.3e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 24% 19/78 [01:39<05:06, 5.19s/it, bpd=4.2, g_l=4.2, gn=4.2, l=3.95, p_l=6.45e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 26% 20/78 [01:44<05:01, 5.19s/it, bpd=3.71, g_l=3.71, gn=3.02, l=3.49, p_l=5.24e-8]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 27% 21/78 [01:49<04:56, 5.20s/it, bpd=4.51, g_l=4.51, gn=3.68, l=4.24, p_l=4.57e-8]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 28% 22/78 [01:54<04:51, 5.20s/it, bpd=4.57, g_l=4.57, gn=3.54, l=4.3, p_l=4.48e-8]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 29% 23/78 [02:00<04:46, 5.21s/it, bpd=2.94, g_l=2.94, gn=3.4, l=2.77, p_l=4.43e-8]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 31% 24/78 [02:05<04:41, 5.21s/it, bpd=4.11, g_l=4.11, gn=6.3, l=3.87, p_l=4.66e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 32% 25/78 [02:10<04:36, 5.22s/it, bpd=5.69, 
g_l=5.69, gn=3.21, l=5.35, p_l=4.75e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 33% 26/78 [02:15<04:31, 5.22s/it, bpd=3.86, g_l=3.86, gn=4.11, l=3.63, p_l=4.79e-8]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 35% 27/78 [02:20<04:25, 5.21s/it, bpd=4.3, g_l=4.3, gn=4.98, l=4.04, p_l=4.75e-8]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 36% 28/78 [02:26<04:20, 5.21s/it, bpd=3.97, g_l=3.97, gn=3.28, l=3.74, p_l=4.39e-8]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 37% 29/78 [02:31<04:14, 5.20s/it, bpd=3.18, g_l=3.18, gn=3.17, l=2.99, p_l=4.17e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 38% 30/78 [02:36<04:10, 5.21s/it, bpd=5.36, g_l=5.36, gn=3.4, l=5.05, p_l=3.45e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 40% 31/78 [02:41<04:04, 5.21s/it, bpd=4.23, g_l=4.23, gn=4.24, l=3.98, p_l=2.82e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 41% 32/78 [02:47<03:59, 5.21s/it, bpd=4.07, g_l=4.07, gn=3.3, l=3.83, p_l=2.64e-8]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 42% 33/78 [02:52<03:54, 5.21s/it, bpd=4.76, g_l=4.76, gn=3.1, l=4.48, p_l=2.42e-8]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 44% 34/78 [02:57<03:49, 5.21s/it, bpd=3.58, g_l=3.58, gn=4.53, l=3.37, p_l=2.78e-8]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 45% 35/78 [03:02<03:43, 5.20s/it, bpd=4.96, g_l=4.96, gn=4.27, l=4.66, p_l=3.22e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 46% 36/78 [03:07<03:38, 5.20s/it, bpd=4.96, g_l=4.96, gn=4.11, l=4.67, p_l=3.4e-8]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 47% 37/78 [03:12<03:32, 5.19s/it, bpd=4.61, g_l=4.61, gn=4.1, l=4.34, p_l=3.9e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 49% 38/78 [03:18<03:27, 5.18s/it, bpd=4.16, g_l=4.16, gn=3.82, l=3.92, p_l=4.39e-8]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 50% 39/78 [03:23<03:22, 5.19s/it, bpd=4.8, g_l=4.8, gn=3.41, l=4.52, p_l=4.97e-8]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 51% 40/78 [03:28<03:17, 5.19s/it, bpd=3.94, g_l=3.94, gn=3.29, l=3.71, 
p_l=5.73e-8]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 53% 41/78 [03:33<03:11, 5.18s/it, bpd=4.09, g_l=4.09, gn=4.22, l=3.85, p_l=6.18e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 54% 42/78 [03:38<03:06, 5.18s/it, bpd=4.41, g_l=4.41, gn=3.97, l=4.15, p_l=6.58e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 55% 43/78 [03:44<03:01, 5.18s/it, bpd=5.39, g_l=5.39, gn=3.73, l=5.07, p_l=7.17e-8]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 56% 44/78 [03:49<02:55, 5.18s/it, bpd=4.06, g_l=4.06, gn=3.23, l=3.82, p_l=7.52e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 58% 45/78 [03:54<02:50, 5.18s/it, bpd=3.98, g_l=3.98, gn=4.71, l=3.75, p_l=7.75e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 59% 46/78 [03:59<02:45, 5.17s/it, bpd=3.04, g_l=3.04, gn=3.13, l=2.86, p_l=7.43e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 60% 47/78 [04:04<02:40, 5.17s/it, bpd=3.96, g_l=3.96, gn=3.26, l=3.73, p_l=7.52e-8]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 62% 48/78 [04:09<02:35, 5.17s/it, bpd=3.64, g_l=3.64, gn=2.95, l=3.42, p_l=7.08e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 63% 49/78 [04:15<02:29, 5.17s/it, bpd=3.55, g_l=3.55, gn=2.94, l=3.34, p_l=7.03e-8]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 64% 50/78 [04:20<02:25, 5.18s/it, bpd=5.43, g_l=5.43, gn=2.99, l=5.11, p_l=7.39e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 65% 51/78 [04:25<02:19, 5.18s/it, bpd=3.21, g_l=3.21, gn=4.07, l=3.02, p_l=7.35e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 67% 52/78 [04:30<02:15, 5.19s/it, bpd=4.53, g_l=4.53, gn=2.92, l=4.27, p_l=7.97e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 68% 53/78 [04:35<02:09, 5.19s/it, bpd=4.02, g_l=4.02, gn=3.06, l=3.79, p_l=8.46e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 69% 54/78 [04:41<02:04, 5.20s/it, bpd=4.91, g_l=4.91, gn=3.06, l=4.62, p_l=8.6e-8]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 71% 55/78 [04:46<01:59, 5.20s/it, bpd=4.5, g_l=4.5, gn=3.65, l=4.24, 
p_l=8.38e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 72% 56/78 [04:51<01:54, 5.19s/it, bpd=3.95, g_l=3.95, gn=3.42, l=3.72, p_l=6.99e-8]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 73% 57/78 [04:56<01:49, 5.20s/it, bpd=4.04, g_l=4.04, gn=3.32, l=3.8, p_l=5.87e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 74% 58/78 [05:01<01:44, 5.20s/it, bpd=4.2, g_l=4.2, gn=2.99, l=3.96, p_l=4.97e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 76% 59/78 [05:07<01:39, 5.22s/it, bpd=4.45, g_l=4.45, gn=4.88, l=4.19, p_l=4.43e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 77% 60/78 [05:12<01:33, 5.21s/it, bpd=4.64, g_l=4.64, gn=3.09, l=4.37, p_l=4.03e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 78% 61/78 [05:17<01:28, 5.22s/it, bpd=4.29, g_l=4.29, gn=3.37, l=4.04, p_l=3.85e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 79% 62/78 [05:22<01:23, 5.21s/it, bpd=3.83, g_l=3.83, gn=3.07, l=3.61, p_l=3.94e-8]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 81% 63/78 [05:27<01:18, 5.22s/it, bpd=4.09, g_l=4.09, gn=7.17, l=3.85, p_l=4.21e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 82% 64/78 [05:33<01:12, 5.21s/it, bpd=4.11, g_l=4.11, gn=3.31, l=3.87, p_l=4.39e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 83% 65/78 [05:38<01:07, 5.20s/it, bpd=4.58, g_l=4.58, gn=8.51, l=4.31, p_l=4.48e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:3095\u001b[0m\n"," 85% 66/78 [06:19<03:11, 15.94s/it, bpd=3.88, g_l=3.88, gn=4.13, l=3.65, p_l=4.57e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 86% 67/78 [06:24<02:20, 12.80s/it, bpd=4.34, g_l=4.34, gn=3.31, l=4.08, p_l=4.25e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 87% 68/78 [06:29<01:45, 10.50s/it, bpd=4.67, g_l=4.67, gn=3.2, l=4.39, p_l=4.08e-8]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 88% 69/78 [06:34<01:19, 8.85s/it, bpd=5.1, g_l=5.1, gn=3.14, l=4.8, p_l=4.12e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 90% 70/78 [06:40<01:01, 7.75s/it, bpd=3.75, 
g_l=3.75, gn=3.41, l=3.53, p_l=4.12e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 91% 71/78 [06:48<00:54, 7.81s/it, bpd=4.24, g_l=4.24, gn=3.62, l=3.99, p_l=4.7e-8]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 92% 72/78 [06:53<00:41, 6.99s/it, bpd=3.61, g_l=3.61, gn=2.85, l=3.4, p_l=5.46e-8]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 94% 73/78 [06:58<00:32, 6.45s/it, bpd=4.47, g_l=4.47, gn=3.18, l=4.2, p_l=6.09e-8]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 95% 74/78 [07:03<00:24, 6.04s/it, bpd=5.48, g_l=5.48, gn=3.58, l=5.16, p_l=6.94e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 96% 75/78 [07:08<00:17, 5.81s/it, bpd=3.55, g_l=3.55, gn=3.63, l=3.34, p_l=7.97e-8]/content/gdrive/MyDrive/slon/slon (20).txt\n","100% 78/78 [07:24<00:00, 5.70s/it, bpd=3.78, g_l=3.78, gn=3.42, l=3.56, p_l=1.22e-7]\n","Train bpd: 4.2519 prime_loss: 0.0000 gen_loss: 4.2519 loss: 4.0017 gn: 3.7218 lr: 0.0003 lg_loss_scale: 15.2700 epoch: 38.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (9).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:3107\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.10s/it, bpd=5.24, l=4.93]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 22% 2/9 [00:03<00:13, 1.99s/it, bpd=5.24, l=4.93]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 33% 3/9 [00:05<00:10, 1.81s/it, bpd=4.81, l=4.53]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 44% 4/9 [00:06<00:08, 1.69s/it, bpd=5.69, l=5.36]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:08<00:06, 1.61s/it, bpd=5.28, l=4.97]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 67% 6/9 [00:09<00:04, 1.55s/it, bpd=5.73, l=5.4]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.53s/it, bpd=4.21, l=3.96]\n","Ema bpd: 5.1350 prime_loss: 0.0109 gen_loss: 5.1350 loss: 4.8332 epoch: 38.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon 
(17).txt\n","/content/gdrive/MyDrive/slon/slon (32).txt\n","/content/gdrive/MyDrive/slon/slon (3).txt\n"," 1% 1/78 [00:05<07:09, 5.58s/it, bpd=4.19, g_l=4.19, gn=3.62, l=3.94, p_l=1.5e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 3% 2/78 [00:10<06:55, 5.46s/it, bpd=4.67, g_l=4.67, gn=3.3, l=4.4, p_l=1.47e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 4% 3/78 [00:16<06:46, 5.42s/it, bpd=3.91, g_l=3.91, gn=5.83, l=3.68, p_l=1.52e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 5% 4/78 [00:21<06:35, 5.35s/it, bpd=3.95, g_l=3.95, gn=4.79, l=3.71, p_l=1.67e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 6% 5/78 [00:26<06:28, 5.32s/it, bpd=4.56, g_l=4.56, gn=3.05, l=4.29, p_l=1.81e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 8% 6/78 [00:31<06:24, 5.34s/it, bpd=3.96, g_l=3.96, gn=3.54, l=3.72, p_l=1.99e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 9% 7/78 [00:37<06:17, 5.32s/it, bpd=5.88, g_l=5.88, gn=3.02, l=5.54, p_l=2.28e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 10% 8/78 [00:42<06:14, 5.35s/it, bpd=3.88, g_l=3.88, gn=2.96, l=3.65, p_l=2.31e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 12% 9/78 [00:47<06:07, 5.32s/it, bpd=5.77, g_l=5.77, gn=3.7, l=5.43, p_l=2.23e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 13% 10/78 [00:53<06:01, 5.31s/it, bpd=4.97, g_l=4.97, gn=4.29, l=4.68, p_l=2.08e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 14% 11/78 [00:58<05:53, 5.28s/it, bpd=4.54, g_l=4.54, gn=3.55, l=4.27, p_l=1.78e-7]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 15% 12/78 [01:03<05:46, 5.26s/it, bpd=3.71, g_l=3.71, gn=3.35, l=3.49, p_l=1.63e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 17% 13/78 [01:08<05:41, 5.25s/it, bpd=4.41, g_l=4.41, gn=3.52, l=4.15, p_l=1.47e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 18% 14/78 [01:13<05:34, 5.23s/it, bpd=5, g_l=5, gn=4.3, l=4.71, p_l=1.25e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 19% 15/78 [01:19<05:28, 5.22s/it, bpd=4.73, g_l=4.73, gn=3.12, l=4.45, 
p_l=1.11e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 21% 16/78 [01:24<05:23, 5.22s/it, bpd=3.97, g_l=3.97, gn=3.97, l=3.73, p_l=9.99e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 22% 17/78 [01:29<05:17, 5.20s/it, bpd=3.87, g_l=3.87, gn=3.25, l=3.65, p_l=1.03e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 23% 18/78 [01:34<05:12, 5.20s/it, bpd=4.3, g_l=4.3, gn=3.51, l=4.05, p_l=1.07e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 24% 19/78 [01:39<05:06, 5.20s/it, bpd=4.29, g_l=4.29, gn=3.6, l=4.04, p_l=9.76e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 26% 20/78 [01:45<05:01, 5.20s/it, bpd=4.61, g_l=4.61, gn=3.29, l=4.34, p_l=8.78e-8]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 27% 21/78 [01:50<04:56, 5.20s/it, bpd=3.74, g_l=3.74, gn=2.96, l=3.52, p_l=8.46e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 28% 22/78 [01:55<04:51, 5.20s/it, bpd=4.89, g_l=4.89, gn=3.04, l=4.61, p_l=8.29e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 29% 23/78 [02:00<04:45, 5.20s/it, bpd=3.54, g_l=3.54, gn=3.21, l=3.33, p_l=8.2e-8]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 31% 24/78 [02:05<04:40, 5.19s/it, bpd=3.63, g_l=3.63, gn=3.41, l=3.42, p_l=7.97e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 32% 25/78 [02:11<04:35, 5.21s/it, bpd=4.18, g_l=4.18, gn=3.12, l=3.94, p_l=7.35e-8]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 33% 26/78 [02:16<04:30, 5.20s/it, bpd=4.72, g_l=4.72, gn=3.36, l=4.44, p_l=6.85e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 35% 27/78 [02:21<04:26, 5.22s/it, bpd=3.63, g_l=3.63, gn=3.03, l=3.42, p_l=6e-8]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 36% 28/78 [02:26<04:20, 5.22s/it, bpd=2.94, g_l=2.94, gn=3.54, l=2.77, p_l=5.73e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 37% 29/78 [02:32<04:15, 5.22s/it, bpd=3.87, g_l=3.87, gn=3.19, l=3.64, p_l=5.46e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 38% 30/78 [02:37<04:10, 5.22s/it, bpd=3.87, g_l=3.87, gn=3.25, l=3.64, 
p_l=5.28e-8]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 40% 31/78 [02:42<04:04, 5.21s/it, bpd=4.82, g_l=4.82, gn=3.2, l=4.53, p_l=5.6e-8]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 41% 32/78 [02:47<03:59, 5.21s/it, bpd=4.68, g_l=4.68, gn=3.23, l=4.4, p_l=5.6e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 42% 33/78 [02:52<03:54, 5.21s/it, bpd=4.39, g_l=4.39, gn=3.19, l=4.13, p_l=5.91e-8]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 44% 34/78 [02:58<03:49, 5.23s/it, bpd=4.79, g_l=4.79, gn=3.25, l=4.51, p_l=6.36e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 45% 35/78 [03:03<03:44, 5.23s/it, bpd=4.19, g_l=4.19, gn=3.34, l=3.94, p_l=7.61e-8]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 46% 36/78 [03:08<03:39, 5.23s/it, bpd=5.47, g_l=5.47, gn=4.68, l=5.15, p_l=8.87e-8]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 47% 37/78 [03:13<03:34, 5.23s/it, bpd=4.86, g_l=4.86, gn=3.13, l=4.58, p_l=9.54e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 49% 38/78 [03:19<03:28, 5.22s/it, bpd=4.3, g_l=4.3, gn=4.1, l=4.05, p_l=1e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 50% 39/78 [03:24<03:23, 5.23s/it, bpd=2.52, g_l=2.52, gn=3.12, l=2.37, p_l=1.07e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 51% 40/78 [03:29<03:18, 5.22s/it, bpd=4.21, g_l=4.21, gn=3.07, l=3.96, p_l=1.12e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 53% 41/78 [03:34<03:13, 5.23s/it, bpd=4.5, g_l=4.5, gn=3.43, l=4.23, p_l=9.85e-8]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 54% 42/78 [03:39<03:07, 5.22s/it, bpd=3.81, g_l=3.81, gn=3.4, l=3.59, p_l=8.42e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 55% 43/78 [03:45<03:02, 5.21s/it, bpd=4.74, g_l=4.74, gn=6.6, l=4.46, p_l=7.39e-8]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 56% 44/78 [03:50<02:57, 5.22s/it, bpd=3.88, g_l=3.88, gn=5.26, l=3.65, p_l=6.36e-8]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 58% 45/78 [03:55<02:51, 5.21s/it, bpd=5.29, g_l=5.29, gn=3.07, l=4.98, p_l=5.64e-8]/content/gdrive/MyDrive/slon/slon 
(16).txt\n"," 59% 46/78 [04:00<02:47, 5.22s/it, bpd=3.96, g_l=3.96, gn=3.52, l=3.73, p_l=5.37e-8]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 60% 47/78 [04:05<02:41, 5.21s/it, bpd=5.4, g_l=5.4, gn=3.34, l=5.08, p_l=5.73e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 62% 48/78 [04:11<02:36, 5.22s/it, bpd=4.09, g_l=4.09, gn=3.25, l=3.85, p_l=6.09e-8]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 63% 49/78 [04:16<02:31, 5.22s/it, bpd=5.51, g_l=5.51, gn=3.66, l=5.19, p_l=6.27e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 64% 50/78 [04:21<02:25, 5.21s/it, bpd=3.72, g_l=3.72, gn=4.43, l=3.51, p_l=6.94e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 65% 51/78 [04:26<02:20, 5.21s/it, bpd=4.13, g_l=4.13, gn=3.08, l=3.88, p_l=7.75e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 67% 52/78 [04:32<02:15, 5.20s/it, bpd=3.61, g_l=3.61, gn=3.55, l=3.4, p_l=8.69e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 68% 53/78 [04:37<02:10, 5.21s/it, bpd=3.66, g_l=3.66, gn=3.16, l=3.44, p_l=9.14e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 69% 54/78 [04:42<02:05, 5.21s/it, bpd=3.52, g_l=3.52, gn=3.15, l=3.31, p_l=9.76e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 71% 55/78 [04:47<01:59, 5.21s/it, bpd=4.34, g_l=4.34, gn=3.06, l=4.08, p_l=1.01e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 72% 56/78 [04:52<01:54, 5.22s/it, bpd=4.74, g_l=4.74, gn=3.6, l=4.46, p_l=1.01e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 73% 57/78 [04:58<01:49, 5.20s/it, bpd=3.56, g_l=3.56, gn=4.23, l=3.36, p_l=1.11e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 74% 58/78 [05:03<01:44, 5.21s/it, bpd=3.64, g_l=3.64, gn=3.19, l=3.43, p_l=1.11e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 76% 59/78 [05:08<01:38, 5.20s/it, bpd=4.64, g_l=4.64, gn=3.82, l=4.36, p_l=1.09e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 77% 60/78 [05:13<01:33, 5.21s/it, bpd=3.71, g_l=3.71, gn=2.86, l=3.49, p_l=1.14e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 78% 61/78 [05:18<01:28, 
5.21s/it, bpd=4.57, g_l=4.57, gn=3.61, l=4.3, p_l=1.29e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 79% 62/78 [05:24<01:23, 5.20s/it, bpd=3.88, g_l=3.88, gn=5.66, l=3.65, p_l=1.62e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 81% 63/78 [05:29<01:18, 5.21s/it, bpd=4.94, g_l=4.94, gn=3.61, l=4.65, p_l=1.97e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 82% 64/78 [05:34<01:12, 5.20s/it, bpd=4.04, g_l=4.04, gn=4.2, l=3.8, p_l=2.23e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 83% 65/78 [05:39<01:07, 5.22s/it, bpd=3.46, g_l=3.46, gn=4.8, l=3.26, p_l=2.36e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 85% 66/78 [05:44<01:02, 5.21s/it, bpd=3.87, g_l=3.87, gn=3.66, l=3.64, p_l=2.43e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 86% 67/78 [05:50<00:57, 5.19s/it, bpd=4.96, g_l=4.96, gn=3, l=4.66, p_l=2.57e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 87% 68/78 [05:55<00:51, 5.20s/it, bpd=4.28, g_l=4.28, gn=3.01, l=4.02, p_l=2.54e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 88% 69/78 [06:00<00:46, 5.20s/it, bpd=3.33, g_l=3.33, gn=3.37, l=3.13, p_l=2.66e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 90% 70/78 [06:05<00:41, 5.21s/it, bpd=5.63, g_l=5.63, gn=3.12, l=5.3, p_l=2.92e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 91% 71/78 [06:10<00:36, 5.20s/it, bpd=4.87, g_l=4.87, gn=3.66, l=4.58, p_l=3.26e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 92% 72/78 [06:16<00:31, 5.20s/it, bpd=5.09, g_l=5.09, gn=3.41, l=4.79, p_l=3.56e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 94% 73/78 [06:21<00:26, 5.20s/it, bpd=3.77, g_l=3.77, gn=3.47, l=3.55, p_l=3.7e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 95% 74/78 [06:26<00:20, 5.20s/it, bpd=3.91, g_l=3.91, gn=3.06, l=3.68, p_l=3.7e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 96% 75/78 [06:31<00:15, 5.21s/it, bpd=3.89, g_l=3.89, gn=3.04, l=3.66, p_l=3.38e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n","100% 78/78 [06:47<00:00, 5.22s/it, bpd=2.74, g_l=2.74, gn=3.47, 
l=2.58, p_l=3.27e-7]\n","Train bpd: 4.2462 prime_loss: 0.0000 gen_loss: 4.2462 loss: 3.9964 gn: 3.5703 lr: 0.0003 lg_loss_scale: 15.5820 epoch: 39.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (6).txt\n","/content/gdrive/MyDrive/slon/slon (6).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:3185\u001b[0m\n"," 11% 1/9 [00:01<00:15, 1.99s/it, bpd=4.81, l=4.53]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:13, 1.88s/it, bpd=3.94, l=3.71]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:04<00:10, 1.73s/it, bpd=5.11, l=4.81]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 4/9 [00:06<00:08, 1.63s/it, bpd=4.74, l=4.47]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:07<00:06, 1.56s/it, bpd=3.94, l=3.71]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 67% 6/9 [00:09<00:04, 1.51s/it, bpd=4.76, l=4.48]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.50s/it, bpd=5.31, l=4.99]\n","Ema bpd: 4.8517 prime_loss: 0.0109 gen_loss: 4.8517 loss: 4.5666 epoch: 39.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (15).txt\n","/content/gdrive/MyDrive/slon/slon (24).txt\n","/content/gdrive/MyDrive/slon/slon (4).txt\n"," 1% 1/78 [00:05<06:57, 5.42s/it, bpd=4.22, g_l=4.22, gn=3.73, l=3.97, p_l=3.32e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 3% 2/78 [00:10<06:48, 5.37s/it, bpd=5.4, g_l=5.4, gn=2.95, l=5.08, p_l=3.19e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 4% 3/78 [00:15<06:40, 5.34s/it, bpd=4.38, g_l=4.38, gn=4.57, l=4.12, p_l=3.05e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 5% 4/78 [00:21<06:33, 5.32s/it, bpd=3.51, g_l=3.51, gn=2.79, l=3.3, p_l=2.43e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 6% 5/78 [00:26<06:27, 5.31s/it, bpd=4.22, g_l=4.22, gn=3.35, l=3.97, p_l=1.9e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 8% 6/78 [00:31<06:21, 5.30s/it, bpd=3.82, g_l=3.82, gn=3.18, l=3.59, 
p_l=1.5e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 9% 7/78 [00:37<06:15, 5.29s/it, bpd=3.54, g_l=3.54, gn=3.59, l=3.33, p_l=1.18e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 10% 8/78 [00:42<06:09, 5.28s/it, bpd=5.38, g_l=5.38, gn=3.58, l=5.06, p_l=9.05e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 12% 9/78 [00:47<06:03, 5.27s/it, bpd=5.78, g_l=5.78, gn=4.44, l=5.44, p_l=7.48e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 13% 10/78 [00:52<05:56, 5.24s/it, bpd=5.44, g_l=5.44, gn=2.9, l=5.12, p_l=6.81e-8]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 14% 11/78 [00:57<05:50, 5.23s/it, bpd=4.72, g_l=4.72, gn=3.35, l=4.44, p_l=6.05e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 15% 12/78 [01:03<05:44, 5.22s/it, bpd=3.93, g_l=3.93, gn=3.01, l=3.7, p_l=5.69e-8]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 17% 13/78 [01:08<05:38, 5.21s/it, bpd=3.09, g_l=3.09, gn=3.83, l=2.91, p_l=5.11e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 18% 14/78 [01:13<05:32, 5.19s/it, bpd=3.26, g_l=3.26, gn=3.12, l=3.07, p_l=4.79e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 19% 15/78 [01:23<07:05, 6.75s/it, bpd=5.12, g_l=5.12, gn=3.66, l=4.82, p_l=4.93e-8]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 21% 16/78 [01:28<06:27, 6.25s/it, bpd=3.84, g_l=3.84, gn=3.34, l=3.61, p_l=4.3e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 22% 17/78 [01:34<06:01, 5.93s/it, bpd=4.14, g_l=4.14, gn=2.92, l=3.89, p_l=3.81e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 23% 18/78 [01:39<05:42, 5.71s/it, bpd=4.23, g_l=4.23, gn=3.59, l=3.98, p_l=3.27e-8]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 24% 19/78 [01:44<05:28, 5.58s/it, bpd=3.47, g_l=3.47, gn=3.85, l=3.26, p_l=2.78e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 26% 20/78 [01:49<05:19, 5.50s/it, bpd=3.77, g_l=3.77, gn=3.46, l=3.55, p_l=2.64e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 27% 21/78 [01:55<05:10, 5.44s/it, bpd=3.54, g_l=3.54, gn=2.92, l=3.33, 
p_l=2.51e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 28% 22/78 [02:00<05:02, 5.39s/it, bpd=4.38, g_l=4.38, gn=3.17, l=4.13, p_l=2.87e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 29% 23/78 [02:05<04:53, 5.34s/it, bpd=3.8, g_l=3.8, gn=3.41, l=3.57, p_l=3.05e-8]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 31% 24/78 [02:10<04:46, 5.30s/it, bpd=3.88, g_l=3.88, gn=4.53, l=3.65, p_l=3.14e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 32% 25/78 [02:16<04:39, 5.27s/it, bpd=4.17, g_l=4.17, gn=3.59, l=3.92, p_l=2.87e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 33% 26/78 [02:21<04:32, 5.24s/it, bpd=3.6, g_l=3.6, gn=3.53, l=3.39, p_l=2.51e-8]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 35% 27/78 [02:26<04:26, 5.23s/it, bpd=4.41, g_l=4.41, gn=3.34, l=4.15, p_l=2.19e-8]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 36% 28/78 [02:31<04:20, 5.20s/it, bpd=3.8, g_l=3.8, gn=4.05, l=3.58, p_l=2.19e-8]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 37% 29/78 [02:36<04:14, 5.18s/it, bpd=5.07, g_l=5.07, gn=3.09, l=4.77, p_l=2.33e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 38% 30/78 [02:41<04:08, 5.18s/it, bpd=5.52, g_l=5.52, gn=3.52, l=5.19, p_l=3e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 40% 31/78 [02:47<04:03, 5.18s/it, bpd=3.82, g_l=3.82, gn=4.21, l=3.6, p_l=3.63e-8]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 41% 32/78 [02:52<03:58, 5.19s/it, bpd=4.01, g_l=4.01, gn=4.05, l=3.77, p_l=4.21e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 42% 33/78 [02:57<03:53, 5.19s/it, bpd=4.26, g_l=4.26, gn=3.98, l=4.01, p_l=4.61e-8]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 44% 34/78 [03:02<03:48, 5.18s/it, bpd=4.73, g_l=4.73, gn=4.09, l=4.45, p_l=4.88e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 45% 35/78 [03:07<03:43, 5.20s/it, bpd=4.82, g_l=4.82, gn=3.87, l=4.54, p_l=6.23e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 46% 36/78 [03:13<03:38, 5.20s/it, bpd=2.27, g_l=2.27, gn=2.96, l=2.13, p_l=7.84e-8]/content/gdrive/MyDrive/slon/slon 
(22).txt\n"," 47% 37/78 [03:18<03:33, 5.21s/it, bpd=3.83, g_l=3.83, gn=4.67, l=3.61, p_l=1.08e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 49% 38/78 [03:23<03:28, 5.21s/it, bpd=3.43, g_l=3.43, gn=3.31, l=3.23, p_l=1.4e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 50% 39/78 [03:28<03:23, 5.21s/it, bpd=4.07, g_l=4.07, gn=5.14, l=3.83, p_l=1.7e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 51% 40/78 [03:34<03:18, 5.22s/it, bpd=4.94, g_l=4.94, gn=3.23, l=4.65, p_l=2.03e-7]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 53% 41/78 [03:39<03:12, 5.21s/it, bpd=4.61, g_l=4.61, gn=3.29, l=4.34, p_l=2.21e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 54% 42/78 [03:44<03:07, 5.22s/it, bpd=3.83, g_l=3.83, gn=3.16, l=3.6, p_l=2.25e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 55% 43/78 [03:49<03:02, 5.22s/it, bpd=4.28, g_l=4.28, gn=3.35, l=4.03, p_l=2.36e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 56% 44/78 [03:54<02:57, 5.21s/it, bpd=3.3, g_l=3.3, gn=3.14, l=3.11, p_l=2.41e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 58% 45/78 [04:00<02:52, 5.22s/it, bpd=4.32, g_l=4.32, gn=4.3, l=4.07, p_l=2.53e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 59% 46/78 [04:05<02:46, 5.22s/it, bpd=4.1, g_l=4.1, gn=3.16, l=3.86, p_l=2.78e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 60% 47/78 [04:10<02:41, 5.22s/it, bpd=4.76, g_l=4.76, gn=3.34, l=4.48, p_l=3.36e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 62% 48/78 [04:15<02:36, 5.22s/it, bpd=5.82, g_l=5.82, gn=3.24, l=5.48, p_l=4.1e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 63% 49/78 [04:20<02:31, 5.21s/it, bpd=3.69, g_l=3.69, gn=3, l=3.47, p_l=4.84e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 64% 50/78 [04:26<02:26, 5.22s/it, bpd=4.09, g_l=4.09, gn=2.96, l=3.85, p_l=5.98e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 65% 51/78 [04:31<02:20, 5.22s/it, bpd=5.16, g_l=5.16, gn=3.22, l=4.86, p_l=7.75e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 67% 52/78 [04:36<02:15, 5.23s/it, 
bpd=4.27, g_l=4.27, gn=3.25, l=4.01, p_l=9.32e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 68% 53/78 [04:41<02:10, 5.22s/it, bpd=5.98, g_l=5.98, gn=3.07, l=5.63, p_l=1.05e-6]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 69% 54/78 [04:47<02:05, 5.21s/it, bpd=5.03, g_l=5.03, gn=3.21, l=4.74, p_l=1.04e-6]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 71% 55/78 [04:52<02:00, 5.23s/it, bpd=3.75, g_l=3.75, gn=3.55, l=3.53, p_l=1e-6]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 72% 56/78 [04:57<01:54, 5.22s/it, bpd=4.92, g_l=4.92, gn=3.04, l=4.63, p_l=9.46e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 73% 57/78 [05:02<01:49, 5.22s/it, bpd=4.49, g_l=4.49, gn=4.34, l=4.22, p_l=8.59e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 74% 58/78 [05:07<01:44, 5.21s/it, bpd=5.14, g_l=5.14, gn=2.81, l=4.84, p_l=8.32e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 76% 59/78 [05:13<01:39, 5.21s/it, bpd=4.89, g_l=4.89, gn=3.15, l=4.6, p_l=8.11e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 77% 60/78 [05:18<01:34, 5.22s/it, bpd=3.93, g_l=3.93, gn=3.53, l=3.7, p_l=8.29e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 78% 61/78 [05:23<01:28, 5.22s/it, bpd=3.74, g_l=3.74, gn=3.42, l=3.52, p_l=7.83e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 79% 62/78 [05:28<01:23, 5.22s/it, bpd=2.5, g_l=2.5, gn=3.39, l=2.35, p_l=7.73e-7]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 81% 63/78 [05:34<01:18, 5.21s/it, bpd=4.31, g_l=4.31, gn=6.23, l=4.05, p_l=7.57e-7]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 82% 64/78 [05:39<01:12, 5.21s/it, bpd=4.73, g_l=4.73, gn=3.85, l=4.45, p_l=7.77e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 83% 65/78 [05:44<01:07, 5.22s/it, bpd=4.16, g_l=4.16, gn=4.8, l=3.92, p_l=7.57e-7]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 85% 66/78 [05:49<01:02, 5.22s/it, bpd=3.59, g_l=3.59, gn=3.77, l=3.38, p_l=7.64e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 86% 67/78 [05:54<00:57, 5.22s/it, bpd=4.56, g_l=4.56, gn=3.16, l=4.29, 
p_l=8.33e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 87% 68/78 [06:00<00:52, 5.22s/it, bpd=5.1, g_l=5.1, gn=3.37, l=4.8, p_l=8.56e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 88% 69/78 [06:05<00:46, 5.21s/it, bpd=3.58, g_l=3.58, gn=3.26, l=3.37, p_l=8.73e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 90% 70/78 [06:10<00:41, 5.21s/it, bpd=3.83, g_l=3.83, gn=3.37, l=3.6, p_l=8.64e-7]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 91% 71/78 [06:15<00:36, 5.21s/it, bpd=3.61, g_l=3.61, gn=4.73, l=3.39, p_l=8.1e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 92% 72/78 [06:20<00:31, 5.21s/it, bpd=4.43, g_l=4.43, gn=4.68, l=4.17, p_l=7.32e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 94% 73/78 [06:26<00:26, 5.20s/it, bpd=4.09, g_l=4.09, gn=3.38, l=3.85, p_l=5.84e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 95% 74/78 [06:31<00:20, 5.20s/it, bpd=3.83, g_l=3.83, gn=4.25, l=3.6, p_l=4.65e-7]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 96% 75/78 [06:36<00:15, 5.21s/it, bpd=3.3, g_l=3.3, gn=3.63, l=3.1, p_l=3.86e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n","100% 78/78 [06:52<00:00, 5.29s/it, bpd=4.13, g_l=4.13, gn=3.83, l=3.88, p_l=2.54e-7]\n","Train bpd: 4.2046 prime_loss: 0.0000 gen_loss: 4.2046 loss: 3.9572 gn: 3.6338 lr: 0.0003 lg_loss_scale: 15.8940 epoch: 40.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:3263\u001b[0m\n"," 11% 1/9 [00:02<00:16, 2.04s/it, bpd=5.83, l=5.49]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:13, 1.90s/it, bpd=4.76, l=4.48]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 33% 3/9 [00:05<00:10, 1.75s/it, bpd=5.72, l=5.39]/content/gdrive/MyDrive/slon/slon (7).txt\n"," 44% 4/9 [00:06<00:08, 1.65s/it, bpd=3.97, l=3.74]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:07<00:06, 1.57s/it, bpd=5.38, 
l=5.07]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 67% 6/9 [00:09<00:04, 1.52s/it, bpd=5.03, l=4.73]/content/gdrive/MyDrive/slon/slon (9).txt\n","100% 9/9 [00:13<00:00, 1.51s/it, bpd=4.63, l=4.35]\n","Ema bpd: 5.0195 prime_loss: 0.0106 gen_loss: 5.0195 loss: 4.7245 epoch: 40.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (25).txt\n","/content/gdrive/MyDrive/slon/slon (17).txt\n","/content/gdrive/MyDrive/slon/slon (22).txt\n"," 1% 1/78 [00:05<06:55, 5.40s/it, bpd=4.07, g_l=4.07, gn=3.04, l=3.83, p_l=2.19e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 3% 2/78 [00:10<06:45, 5.33s/it, bpd=3.22, g_l=3.22, gn=3.16, l=3.03, p_l=1.92e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 4% 3/78 [00:15<06:37, 5.30s/it, bpd=4.11, g_l=4.11, gn=4.34, l=3.86, p_l=1.72e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 5% 4/78 [00:21<06:31, 5.29s/it, bpd=4.65, g_l=4.65, gn=4.07, l=4.38, p_l=1.5e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 6% 5/78 [00:26<06:25, 5.28s/it, bpd=3.99, g_l=3.99, gn=3.74, l=3.76, p_l=1.39e-7]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 8% 6/78 [00:31<06:20, 5.29s/it, bpd=3.94, g_l=3.94, gn=4.32, l=3.71, p_l=1.3e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 9% 7/78 [00:36<06:13, 5.27s/it, bpd=6.08, g_l=6.08, gn=3.14, l=5.72, p_l=1.21e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 10% 8/78 [00:42<06:07, 5.25s/it, bpd=4.61, g_l=4.61, gn=3.14, l=4.34, p_l=1.08e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 12% 9/78 [00:47<06:01, 5.24s/it, bpd=3.73, g_l=3.73, gn=3.43, l=3.51, p_l=1.08e-7]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 13% 10/78 [00:52<05:54, 5.21s/it, bpd=4.25, g_l=4.25, gn=3.35, l=4, p_l=1.11e-7]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 14% 11/78 [00:57<05:48, 5.21s/it, bpd=4.58, g_l=4.58, gn=3.21, l=4.31, p_l=1.17e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 15% 12/78 [01:02<05:42, 5.19s/it, bpd=4.5, g_l=4.5, gn=3.06, l=4.24, p_l=1.41e-7]/content/gdrive/MyDrive/slon/slon 
(12).txt\n"," 17% 13/78 [01:07<05:36, 5.18s/it, bpd=3.48, g_l=3.48, gn=3.92, l=3.28, p_l=1.8e-7]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 18% 14/78 [01:13<05:31, 5.18s/it, bpd=4.03, g_l=4.03, gn=4.11, l=3.79, p_l=1.93e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 19% 15/78 [01:18<05:26, 5.18s/it, bpd=4, g_l=4, gn=3.49, l=3.76, p_l=2e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 21% 16/78 [01:23<05:21, 5.19s/it, bpd=5.4, g_l=5.4, gn=3.3, l=5.08, p_l=1.77e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 22% 17/78 [01:28<05:16, 5.18s/it, bpd=5.62, g_l=5.62, gn=2.98, l=5.29, p_l=1.42e-7]/content/gdrive/MyDrive/slon/slon (10).txt\n"," 23% 18/78 [01:33<05:10, 5.18s/it, bpd=3.75, g_l=3.75, gn=4.71, l=3.53, p_l=1.12e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 24% 19/78 [01:39<05:06, 5.19s/it, bpd=3.91, g_l=3.91, gn=3.74, l=3.68, p_l=9.45e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 26% 20/78 [01:44<05:01, 5.20s/it, bpd=3.92, g_l=3.92, gn=3.3, l=3.69, p_l=8.69e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 27% 21/78 [01:49<04:57, 5.21s/it, bpd=5.68, g_l=5.68, gn=3.22, l=5.35, p_l=8.46e-8]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 28% 22/78 [01:54<04:51, 5.21s/it, bpd=3.76, g_l=3.76, gn=3.86, l=3.54, p_l=8.64e-8]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 29% 23/78 [01:59<04:46, 5.20s/it, bpd=3.09, g_l=3.09, gn=6.64, l=2.9, p_l=8.82e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 31% 24/78 [02:05<04:41, 5.21s/it, bpd=4.17, g_l=4.17, gn=3.66, l=3.93, p_l=9.9e-8]/content/gdrive/MyDrive/slon/slon (24).txt\n"," 32% 25/78 [02:10<04:36, 5.21s/it, bpd=4.59, g_l=4.59, gn=4.38, l=4.32, p_l=1.08e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 33% 26/78 [02:15<04:31, 5.22s/it, bpd=4, g_l=4, gn=3.39, l=3.76, p_l=1.07e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 35% 27/78 [02:20<04:25, 5.21s/it, bpd=4.85, g_l=4.85, gn=3.08, l=4.57, p_l=1.05e-7]/content/gdrive/MyDrive/slon/slon (20).txt\n"," 36% 28/78 [02:25<04:20, 5.20s/it, 
bpd=3.84, g_l=3.84, gn=3.69, l=3.61, p_l=9.45e-8]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 37% 29/78 [02:31<04:15, 5.21s/it, bpd=3.57, g_l=3.57, gn=2.97, l=3.36, p_l=9.58e-8]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 38% 30/78 [02:36<04:09, 5.20s/it, bpd=4.02, g_l=4.02, gn=3.43, l=3.78, p_l=9.23e-8]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 40% 31/78 [02:41<04:04, 5.20s/it, bpd=4.03, g_l=4.03, gn=3.5, l=3.79, p_l=9.14e-8]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 41% 32/78 [02:46<03:59, 5.20s/it, bpd=3.26, g_l=3.26, gn=7.04, l=3.06, p_l=8.55e-8]/content/gdrive/MyDrive/slon/slon (1).txt\n"," 42% 33/78 [02:51<03:53, 5.19s/it, bpd=4.59, g_l=4.59, gn=3.6, l=4.32, p_l=8.06e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 44% 34/78 [02:57<03:49, 5.20s/it, bpd=5.07, g_l=5.07, gn=3.14, l=4.77, p_l=8.73e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 45% 35/78 [03:02<03:43, 5.20s/it, bpd=3.83, g_l=3.83, gn=3.18, l=3.61, p_l=8.87e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 46% 36/78 [03:07<03:38, 5.19s/it, bpd=4.37, g_l=4.37, gn=3.18, l=4.11, p_l=8.82e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 47% 37/78 [03:18<04:39, 6.82s/it, bpd=4.98, g_l=4.98, gn=3.63, l=4.69, p_l=8.69e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 49% 38/78 [03:23<04:12, 6.31s/it, bpd=4.04, g_l=4.04, gn=3.22, l=3.81, p_l=8.38e-8]/content/gdrive/MyDrive/slon/slon (32).txt\n"," 50% 39/78 [03:28<03:52, 5.97s/it, bpd=4.09, g_l=4.09, gn=3.37, l=3.85, p_l=7.52e-8]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 51% 40/78 [03:33<03:37, 5.73s/it, bpd=4.21, g_l=4.21, gn=3.3, l=3.96, p_l=7.35e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 53% 41/78 [03:38<03:26, 5.59s/it, bpd=4.57, g_l=4.57, gn=3.11, l=4.3, p_l=6.81e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 54% 42/78 [03:44<03:17, 5.50s/it, bpd=3.82, g_l=3.82, gn=4.56, l=3.6, p_l=7.21e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 55% 43/78 [03:49<03:10, 5.43s/it, bpd=4.34, g_l=4.34, gn=3.4, l=4.09, 
p_l=8.64e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 56% 44/78 [03:54<03:03, 5.38s/it, bpd=4.74, g_l=4.74, gn=3.28, l=4.46, p_l=1.03e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 58% 45/78 [03:59<02:56, 5.34s/it, bpd=4.34, g_l=4.34, gn=2.92, l=4.09, p_l=1.17e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 59% 46/78 [04:05<02:49, 5.31s/it, bpd=3.8, g_l=3.8, gn=3.36, l=3.57, p_l=1.31e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 60% 47/78 [04:10<02:43, 5.28s/it, bpd=4.6, g_l=4.6, gn=3.24, l=4.33, p_l=1.7e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 62% 48/78 [04:15<02:37, 5.24s/it, bpd=4.01, g_l=4.01, gn=3.24, l=3.77, p_l=2.28e-7]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 63% 49/78 [04:20<02:31, 5.23s/it, bpd=3.98, g_l=3.98, gn=3.2, l=3.75, p_l=2.96e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 64% 50/78 [04:25<02:25, 5.21s/it, bpd=3.62, g_l=3.62, gn=3.13, l=3.41, p_l=3.61e-7]/content/gdrive/MyDrive/slon/slon (35).txt\n"," 65% 51/78 [04:31<02:20, 5.19s/it, bpd=3.91, g_l=3.91, gn=3.8, l=3.68, p_l=4.15e-7]/content/gdrive/MyDrive/slon/slon (15).txt\n"," 67% 52/78 [04:36<02:14, 5.17s/it, bpd=3.46, g_l=3.46, gn=2.96, l=3.26, p_l=4.65e-7]/content/gdrive/MyDrive/slon/slon (23).txt\n"," 68% 53/78 [04:41<02:09, 5.16s/it, bpd=5.01, g_l=5.01, gn=3.47, l=4.71, p_l=5.28e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 69% 54/78 [04:46<02:04, 5.18s/it, bpd=4.06, g_l=4.06, gn=6.15, l=3.82, p_l=5.5e-7]/content/gdrive/MyDrive/slon/slon (12).txt\n"," 71% 55/78 [04:51<01:59, 5.18s/it, bpd=4.48, g_l=4.48, gn=3.2, l=4.22, p_l=5.67e-7]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 72% 56/78 [04:56<01:54, 5.18s/it, bpd=3.93, g_l=3.93, gn=3.39, l=3.7, p_l=5.58e-7]/content/gdrive/MyDrive/slon/slon (33).txt\n"," 73% 57/78 [05:02<01:48, 5.18s/it, bpd=3.93, g_l=3.93, gn=3.63, l=3.7, p_l=4.86e-7]/content/gdrive/MyDrive/slon/slon (29).txt\n"," 74% 58/78 [05:07<01:43, 5.19s/it, bpd=4.76, g_l=4.76, gn=3.09, l=4.48, p_l=4.18e-7]/content/gdrive/MyDrive/slon/slon 
(25).txt\n"," 76% 59/78 [05:12<01:38, 5.20s/it, bpd=3.86, g_l=3.86, gn=3.36, l=3.63, p_l=3.58e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 77% 60/78 [05:17<01:33, 5.21s/it, bpd=4.01, g_l=4.01, gn=3.26, l=3.78, p_l=3.17e-7]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 78% 61/78 [05:22<01:28, 5.21s/it, bpd=4.1, g_l=4.1, gn=3.88, l=3.86, p_l=2.32e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 79% 62/78 [05:28<01:23, 5.22s/it, bpd=3.77, g_l=3.77, gn=4.52, l=3.55, p_l=1.85e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 81% 63/78 [05:33<01:18, 5.21s/it, bpd=2.64, g_l=2.64, gn=4.55, l=2.48, p_l=1.64e-7]/content/gdrive/MyDrive/slon/slon (3).txt\n"," 82% 64/78 [05:38<01:13, 5.22s/it, bpd=4.53, g_l=4.53, gn=4.47, l=4.26, p_l=1.64e-7]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 83% 65/78 [05:43<01:07, 5.21s/it, bpd=3.87, g_l=3.87, gn=5.21, l=3.65, p_l=1.59e-7]/content/gdrive/MyDrive/slon/slon (30).txt\n"," 85% 66/78 [05:49<01:02, 5.20s/it, bpd=4.49, g_l=4.49, gn=4.3, l=4.22, p_l=1.46e-7]/content/gdrive/MyDrive/slon/slon (13).txt\n"," 86% 67/78 [05:54<00:57, 5.20s/it, bpd=3.47, g_l=3.47, gn=3.23, l=3.27, p_l=1.31e-7]/content/gdrive/MyDrive/slon/slon (4).txt\n"," 87% 68/78 [05:59<00:51, 5.19s/it, bpd=5.69, g_l=5.69, gn=3.35, l=5.36, p_l=1.23e-7]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 88% 69/78 [06:04<00:46, 5.19s/it, bpd=5.07, g_l=5.07, gn=3.22, l=4.77, p_l=1.02e-7]/content/gdrive/MyDrive/slon/slon (2).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:3333\u001b[0m\n"," 90% 70/78 [06:42<02:00, 15.12s/it, bpd=3.81, g_l=3.81, gn=4.81, l=3.59, p_l=8.46e-8]/content/gdrive/MyDrive/slon/slon (28).txt\n"," 91% 71/78 [06:47<01:24, 12.11s/it, bpd=4.52, g_l=4.52, gn=3.53, l=4.25, p_l=6.85e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 92% 72/78 [06:53<01:00, 10.02s/it, bpd=4.02, g_l=4.02, gn=3.48, l=3.79, p_l=5.87e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 94% 73/78 [06:58<00:42, 8.54s/it, bpd=2.85, g_l=2.85, gn=3.11, l=2.68, 
p_l=5.02e-8]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 95% 74/78 [07:03<00:30, 7.53s/it, bpd=3.57, g_l=3.57, gn=2.82, l=3.36, p_l=4.57e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 96% 75/78 [07:08<00:20, 6.80s/it, bpd=3.64, g_l=3.64, gn=3.76, l=3.43, p_l=4.79e-8]/content/gdrive/MyDrive/slon/slon (15).txt\n","100% 78/78 [07:24<00:00, 5.69s/it, bpd=3.43, g_l=3.43, gn=3.27, l=3.23, p_l=7.08e-8]\n","Train bpd: 4.1769 prime_loss: 0.0000 gen_loss: 4.1769 loss: 3.9312 gn: 3.6639 lr: 0.0003 lg_loss_scale: 16.2060 epoch: 41.0000\n"," 0% 0/9 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (5).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","/content/gdrive/MyDrive/slon/slon (7).txt\n","Logging train inputs/ouputs\n","\u001b[35msteps:3341\u001b[0m\n"," 11% 1/9 [00:02<00:17, 2.24s/it, bpd=4.83, l=4.55]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 22% 2/9 [00:03<00:14, 2.08s/it, bpd=5.76, l=5.42]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 33% 3/9 [00:05<00:11, 1.87s/it, bpd=5.22, l=4.92]/content/gdrive/MyDrive/slon/slon (5).txt\n"," 44% 4/9 [00:06<00:08, 1.72s/it, bpd=5.18, l=4.88]/content/gdrive/MyDrive/slon/slon (9).txt\n"," 56% 5/9 [00:08<00:06, 1.62s/it, bpd=4.58, l=4.31]/content/gdrive/MyDrive/slon/slon (6).txt\n"," 67% 6/9 [00:09<00:04, 1.55s/it, bpd=4.83, l=4.54]/content/gdrive/MyDrive/slon/slon (7).txt\n","100% 9/9 [00:13<00:00, 1.53s/it, bpd=5.81, l=5.47]\n","Ema bpd: 5.2046 prime_loss: 0.0103 gen_loss: 5.2046 loss: 4.8987 epoch: 41.0000\n"," 0% 0/78 [00:00, ?it/s]/content/gdrive/MyDrive/slon/slon (16).txt\n","/content/gdrive/MyDrive/slon/slon (25).txt\n","/content/gdrive/MyDrive/slon/slon (32).txt\n"," 1% 1/78 [00:05<06:57, 5.42s/it, bpd=4.67, g_l=4.67, gn=3.13, l=4.4, p_l=7.84e-8]/content/gdrive/MyDrive/slon/slon (31).txt\n"," 3% 2/78 [00:10<06:44, 5.33s/it, bpd=4.44, g_l=4.44, gn=3.7, l=4.17, p_l=8.69e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 4% 3/78 [00:15<06:37, 5.29s/it, bpd=4.47, g_l=4.47, gn=3.77, l=4.21, 
p_l=8.91e-8]/content/gdrive/MyDrive/slon/slon (16).txt\n"," 5% 4/78 [00:20<06:28, 5.25s/it, bpd=4.14, g_l=4.14, gn=6.43, l=3.9, p_l=8.33e-8]/content/gdrive/MyDrive/slon/slon (27).txt\n"," 6% 5/78 [00:26<06:21, 5.22s/it, bpd=3.95, g_l=3.95, gn=3.36, l=3.71, p_l=7.84e-8]/content/gdrive/MyDrive/slon/slon (26).txt\n"," 8% 6/78 [00:31<06:16, 5.23s/it, bpd=4.23, g_l=4.23, gn=3.44, l=3.98, p_l=7.39e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 9% 7/78 [00:36<06:11, 5.23s/it, bpd=4.8, g_l=4.8, gn=4.21, l=4.51, p_l=6.45e-8]/content/gdrive/MyDrive/slon/slon (21).txt\n"," 10% 8/78 [00:41<06:07, 5.26s/it, bpd=5.01, g_l=5.01, gn=3.47, l=4.72, p_l=6.18e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 12% 9/78 [00:47<06:02, 5.26s/it, bpd=4.11, g_l=4.11, gn=3.86, l=3.87, p_l=6.4e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 13% 10/78 [00:52<05:56, 5.25s/it, bpd=3.98, g_l=3.98, gn=3.28, l=3.75, p_l=7.17e-8]/content/gdrive/MyDrive/slon/slon (17).txt\n"," 14% 11/78 [00:57<05:54, 5.29s/it, bpd=3.8, g_l=3.8, gn=3.73, l=3.57, p_l=7.43e-8]/content/gdrive/MyDrive/slon/slon (19).txt\n"," 15% 12/78 [01:02<05:48, 5.28s/it, bpd=3.89, g_l=3.89, gn=3.14, l=3.66, p_l=7.48e-8]/content/gdrive/MyDrive/slon/slon (14).txt\n"," 17% 13/78 [01:08<05:42, 5.26s/it, bpd=3.56, g_l=3.56, gn=2.8, l=3.35, p_l=7.57e-8]/content/gdrive/MyDrive/slon/slon (34).txt\n"," 18% 14/78 [01:13<05:38, 5.29s/it, bpd=4.7, g_l=4.7, gn=4.8, l=4.42, p_l=8.06e-8]/content/gdrive/MyDrive/slon/slon (25).txt\n"," 19% 15/78 [01:18<05:31, 5.27s/it, bpd=4.91, g_l=4.91, gn=2.98, l=4.62, p_l=8.29e-8]/content/gdrive/MyDrive/slon/slon (2).txt\n"," 21% 16/78 [01:24<05:28, 5.30s/it, bpd=4.1, g_l=4.1, gn=3.92, l=3.86, p_l=7.79e-8]/content/gdrive/MyDrive/slon/slon (22).txt\n"," 22% 17/78 [01:29<05:20, 5.25s/it, bpd=4.59, g_l=4.59, gn=3.75, l=4.32, p_l=7.03e-8]/content/gdrive/MyDrive/slon/slon (11).txt\n"," 23% 18/78 [01:34<05:13, 5.22s/it, bpd=3.71, g_l=3.71, gn=3.33, l=3.49, p_l=7.03e-8]/content/gdrive/MyDrive/slon/slon 
(16).txt\n"]}]},{"cell_type":"markdown","metadata":{"id":"G2XtTS4tVqB8"},"source":[" ๐ด๏ธโโ๏ธ "]}]}
\ No newline at end of file