diff --git "a/experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/Benchmark-V5headsize2x.ipynb" "b/experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/Benchmark-V5headsize2x.ipynb" deleted file mode 100644--- "a/experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/Benchmark-V5headsize2x.ipynb" +++ /dev/null @@ -1,19376 +0,0 @@ -{ - "cells": [ - { - "cell_type": "markdown", - "id": "bd243115", - "metadata": { - "papermill": { - "duration": 0.003152, - "end_time": "2023-08-30T19:28:18.604602", - "exception": false, - "start_time": "2023-08-30T19:28:18.601450", - "status": "completed" - }, - "tags": [] - }, - "source": [ - "## Custom Experimental Memory benchmarking\n", - "\n", - "The following is meant to observe the memory performance in a more verbose CSV logging mode, for the baseline raven models" - ] - }, - { - "cell_type": "code", - "execution_count": 1, - "id": "9f03f5a0", - "metadata": { - "execution": { - "iopub.execute_input": "2023-08-30T19:28:18.611545Z", - "iopub.status.busy": "2023-08-30T19:28:18.611261Z", - "iopub.status.idle": "2023-08-30T19:35:58.624824Z", - "shell.execute_reply": "2023-08-30T19:35:58.624025Z" - }, - "papermill": { - "duration": 460.019656, - "end_time": "2023-08-30T19:35:58.627171", - "exception": false, - "start_time": "2023-08-30T19:28:18.607515", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "--2023-08-30 19:28:18-- https://huggingface.co/rwkv-x-dev/rwkv-x-playground/resolve/main/experiment/rwkv-x-exp/v5-headsize2x/v5-hs2x-L6-D4096-E0_1-mem-ctx-8k.pth\r\n", - "Resolving huggingface.co (huggingface.co)... 13.33.33.55, 13.33.33.110, 13.33.33.102, ...\r\n", - "Connecting to huggingface.co (huggingface.co)|13.33.33.55|:443... connected.\r\n", - "HTTP request sent, awaiting response... " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "302 Found\r\n", - "Location: https://cdn-lfs.huggingface.co/repos/2e/f7/2ef78555202aa92abdbdf476ce3d0fd5a8b15f7245edf0b80d4d30572355f30d/fae9799e56fd469c6c1694dae6ae77f78130c06d340e945a3dc8e8ea2bd4e5bb?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-hs2x-L6-D4096-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-hs2x-L6-D4096-E0_1-mem-ctx-8k.pth%22%3B&Expires=1693682899&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5MzY4Mjg5OX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy8yZS9mNy8yZWY3ODU1NTIwMmFhOTJhYmRiZGY0NzZjZTNkMGZkNWE4YjE1ZjcyNDVlZGYwYjgwZDRkMzA1NzIzNTVmMzBkL2ZhZTk3OTllNTZmZDQ2OWM2YzE2OTRkYWU2YWU3N2Y3ODEzMGMwNmQzNDBlOTQ1YTNkYzhlOGVhMmJkNGU1YmI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=M1ZkwkjY8Vf2G5qv1yOEa%7EDz6gDhVDvKvGeLWVHwxMY4MX4wy1NnV3LeOkO2lkiQ2yaMAH0tMPVROOpY7sDQCLbGnXeWwtqlbxTKm5jDzp57jEe6vj4-vRtUxlG%7E1Mwc8aBI9-3AIH6D%7Es3B21iA0XkQnPrbLK1KdIf3wzJvzgs6ihrF49CjXqJEPAKUKQtk8jxpC9qeKv0Sk7LNk5Qz9NK8TpYhDYVCGXhO-4Cm93em053DF%7E-uxiMELYY8uEnZt3sjpYgQihYsGQtJipqa3RzBO0fTpzNHSj751FBfy6BkbWsqltQUZICixOu96pHXXasi-BH-QXmrZJK1nKpTvQ__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", - "--2023-08-30 19:28:19-- https://cdn-lfs.huggingface.co/repos/2e/f7/2ef78555202aa92abdbdf476ce3d0fd5a8b15f7245edf0b80d4d30572355f30d/fae9799e56fd469c6c1694dae6ae77f78130c06d340e945a3dc8e8ea2bd4e5bb?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-hs2x-L6-D4096-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-hs2x-L6-D4096-E0_1-mem-ctx-8k.pth%22%3B&Expires=1693682899&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5MzY4Mjg5OX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy8yZS9mNy8yZWY3ODU1NTIwMmFhOTJhYmRiZGY0NzZjZTNkMGZkNWE4YjE1ZjcyNDVlZGYwYjgwZDRkMzA1NzIzNTVmMzBkL2ZhZTk3OTllNTZmZDQ2OWM2YzE2OTRkYWU2YWU3N2Y3ODEzMGMwNmQzNDBlOTQ1YTNkYzhlOGVhMmJkNGU1YmI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=M1ZkwkjY8Vf2G5qv1yOEa%7EDz6gDhVDvKvGeLWVHwxMY4MX4wy1NnV3LeOkO2lkiQ2yaMAH0tMPVROOpY7sDQCLbGnXeWwtqlbxTKm5jDzp57jEe6vj4-vRtUxlG%7E1Mwc8aBI9-3AIH6D%7Es3B21iA0XkQnPrbLK1KdIf3wzJvzgs6ihrF49CjXqJEPAKUKQtk8jxpC9qeKv0Sk7LNk5Qz9NK8TpYhDYVCGXhO-4Cm93em053DF%7E-uxiMELYY8uEnZt3sjpYgQihYsGQtJipqa3RzBO0fTpzNHSj751FBfy6BkbWsqltQUZICixOu96pHXXasi-BH-QXmrZJK1nKpTvQ__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", - "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "18.155.68.128, 18.155.68.73, 18.155.68.98, ...\r\n", - "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|18.155.68.128|:443... connected.\r\n", - "HTTP request sent, awaiting response... " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "200 OK\r\n", - "Length: 3441599109 (3.2G) [binary/octet-stream]\r\n", - "Saving to: ‘v5-hs2x-L6-D4096-E0_1-mem-ctx-8k.pth’\r\n", - "\r\n", - "\r", - " v5-hs2x-L 0%[ ] 0 --.-KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 0%[ ] 8.00K 32.6KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 0%[ ] 41.37K 84.2KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 0%[ ] 107.84K 146KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 0%[ ] 226.84K 231KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 0%[ ] 447.84K 365KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 0%[ ] 923.84K 627KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 0%[ ] 1.81M 1.06MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 0%[ ] 3.63M 1.88MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 0%[ ] 7.29M 3.29MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 0%[ ] 10.71M 4.35MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 0%[ ] 13.51M 4.97MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 0%[ ] 14.04M 4.74MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 0%[ ] 17.88M 5.58MB/s eta 9m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 0%[ ] 21.09M 6.11MB/s eta 9m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 0%[ ] 24.96M 6.74MB/s eta 9m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 0%[ ] 28.71M 7.27MB/s eta 9m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 0%[ ] 32.51M 7.74MB/s eta 7m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 1%[ ] 36.29M 8.16MB/s eta 7m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 1%[ ] 40.49M 8.62MB/s eta 7m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 1%[ ] 44.46M 9.46MB/s eta 7m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 1%[ ] 48.23M 10.2MB/s eta 5m 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 1%[ ] 52.17M 11.1MB/s eta 5m 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 1%[ ] 56.03M 11.9MB/s eta 5m 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 1%[ ] 59.78M 12.6MB/s eta 5m 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 1%[ ] 63.49M 13.3MB/s eta 5m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 2%[ ] 67.31M 13.9MB/s eta 5m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 2%[ ] 71.46M 14.2MB/s eta 5m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 2%[ ] 75.20M 14.1MB/s eta 5m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 2%[ ] 78.28M 13.7MB/s eta 4m 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 2%[ ] 82.21M 14.4MB/s eta 4m 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 2%[ ] 85.99M 14.6MB/s eta 4m 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 2%[ ] 89.96M 15.3MB/s eta 4m 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 2%[ ] 93.96M 15.3MB/s eta 4m 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 2%[ ] 97.84M 15.4MB/s eta 4m 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 3%[ ] 101.71M 15.4MB/s eta 4m 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 3%[ ] 102.88M 14.9MB/s eta 4m 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 3%[ ] 105.49M 14.6MB/s eta 4m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 3%[ ] 109.32M 14.6MB/s eta 4m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 3%[ ] 113.12M 14.6MB/s eta 4m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 3%[ ] 116.85M 14.5MB/s eta 4m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 3%[ ] 120.56M 14.5MB/s eta 4m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 3%[ ] 124.46M 14.5MB/s eta 4m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 3%[ ] 128.28M 14.5MB/s eta 4m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 4%[ ] 132.01M 14.5MB/s eta 4m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 4%[ ] 135.81M 14.5MB/s eta 4m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 4%[ ] 139.56M 14.5MB/s eta 4m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 4%[ ] 142.81M 14.3MB/s eta 4m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 4%[ ] 145.63M 14.1MB/s eta 4m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 4%[ ] 148.32M 14.1MB/s eta 4m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 4%[ ] 148.49M 13.3MB/s eta 4m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 4%[ ] 152.31M 13.3MB/s eta 4m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 4%[ ] 155.17M 13.1MB/s eta 4m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 4%[ ] 158.04M 12.9MB/s eta 4m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 4%[ ] 160.78M 12.7MB/s eta 4m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 4%[ ] 163.76M 12.5MB/s eta 4m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 5%[> ] 166.79M 12.9MB/s eta 4m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 5%[> ] 169.45M 12.9MB/s eta 4m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 5%[> ] 172.54M 12.8MB/s eta 4m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 5%[> ] 175.67M 12.6MB/s eta 4m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 5%[> ] 178.59M 12.5MB/s eta 4m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 5%[> ] 181.76M 12.4MB/s eta 4m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 5%[> ] 184.96M 12.2MB/s eta 4m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 5%[> ] 188.20M 12.1MB/s eta 4m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 5%[> ] 191.43M 12.0MB/s eta 4m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 5%[> ] 194.67M 11.9MB/s eta 4m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 6%[> ] 197.96M 11.8MB/s eta 4m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 6%[> ] 201.26M 11.9MB/s eta 4m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 6%[> ] 204.57M 12.0MB/s eta 4m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 6%[> ] 207.93M 12.1MB/s eta 4m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 6%[> ] 211.28M 12.7MB/s eta 4m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 6%[> ] 214.34M 12.5MB/s eta 4m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 6%[> ] 217.71M 12.6MB/s eta 4m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 6%[> ] 221.09M 12.7MB/s eta 4m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 6%[> ] 224.49M 12.9MB/s eta 4m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 6%[> ] 227.88M 13.0MB/s eta 4m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 7%[> ] 231.31M 13.0MB/s eta 4m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 7%[> ] 234.67M 13.2MB/s eta 4m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 7%[> ] 238.10M 13.3MB/s eta 4m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 7%[> ] 241.46M 13.3MB/s eta 4m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 7%[> ] 244.35M 13.3MB/s eta 4m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 7%[> ] 247.49M 13.3MB/s eta 4m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 7%[> ] 250.90M 13.3MB/s eta 4m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 7%[> ] 254.35M 13.4MB/s eta 4m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 7%[> ] 257.81M 13.4MB/s eta 4m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 7%[> ] 261.26M 13.5MB/s eta 4m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 8%[> ] 264.60M 13.5MB/s eta 4m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 8%[> ] 267.99M 13.5MB/s eta 4m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 8%[> ] 271.38M 13.5MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 8%[> ] 274.73M 13.5MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 8%[> ] 278.17M 13.5MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 8%[> ] 281.59M 13.7MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 8%[> ] 284.93M 13.7MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 8%[> ] 288.37M 13.0MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 8%[> ] 292.15M 13.1MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 8%[> ] 294.57M 12.9MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 9%[> ] 297.09M 12.7MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 9%[> ] 299.67M 12.6MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 9%[> ] 302.31M 12.4MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 9%[> ] 304.99M 12.3MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 9%[> ] 307.71M 12.3MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 9%[> ] 310.49M 12.2MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 9%[> ] 313.32M 12.1MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 9%[> ] 316.10M 11.9MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 9%[> ] 319.03M 11.8MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 9%[> ] 321.87M 11.7MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 9%[> ] 324.82M 11.6MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 9%[> ] 327.38M 11.4MB/s eta 4m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 10%[=> ] 330.43M 11.4MB/s eta 4m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 10%[=> ] 333.53M 11.3MB/s eta 4m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 10%[=> ] 336.63M 11.3MB/s eta 4m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 10%[=> ] 339.78M 11.2MB/s eta 4m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 10%[=> ] 342.26M 11.0MB/s eta 4m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 10%[=> ] 345.45M 11.5MB/s eta 4m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 10%[=> ] 348.67M 11.4MB/s eta 4m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 10%[=> ] 351.88M 11.6MB/s eta 4m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 10%[=> ] 355.17M 11.7MB/s eta 4m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 10%[=> ] 358.42M 11.9MB/s eta 4m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 11%[=> ] 361.70M 12.0MB/s eta 3m 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 11%[=> ] 365.03M 12.1MB/s eta 3m 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 11%[=> ] 368.35M 12.3MB/s eta 3m 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 11%[=> ] 371.71M 12.4MB/s eta 3m 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 11%[=> ] 375.09M 12.5MB/s eta 3m 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 11%[=> ] 378.43M 12.7MB/s eta 3m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 11%[=> ] 381.82M 12.8MB/s eta 3m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 11%[=> ] 385.21M 12.9MB/s eta 3m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 11%[=> ] 388.59M 12.9MB/s eta 3m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 11%[=> ] 392.01M 13.1MB/s eta 3m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 12%[=> ] 394.96M 13.0MB/s eta 3m 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 12%[=> ] 398.26M 13.0MB/s eta 3m 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 12%[=> ] 401.68M 13.1MB/s eta 3m 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 12%[=> ] 405.04M 13.1MB/s eta 3m 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 12%[=> ] 408.45M 13.3MB/s eta 3m 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 12%[=> ] 411.87M 13.4MB/s eta 3m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 12%[=> ] 415.23M 13.4MB/s eta 3m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 12%[=> ] 418.68M 13.5MB/s eta 3m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 12%[=> ] 422.01M 13.5MB/s eta 3m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 12%[=> ] 425.48M 13.5MB/s eta 3m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 13%[=> ] 428.92M 13.5MB/s eta 3m 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 13%[=> ] 432.38M 13.6MB/s eta 3m 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 13%[=> ] 435.82M 13.6MB/s eta 3m 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 13%[=> ] 439.29M 13.6MB/s eta 3m 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 13%[=> ] 442.63M 13.6MB/s eta 3m 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 13%[=> ] 446.10M 13.6MB/s eta 3m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 13%[=> ] 449.54M 13.6MB/s eta 3m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 13%[=> ] 452.92M 13.6MB/s eta 3m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 13%[=> ] 456.37M 13.6MB/s eta 3m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 14%[=> ] 459.74M 13.6MB/s eta 3m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 14%[=> ] 463.20M 13.9MB/s eta 3m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 14%[=> ] 466.57M 13.9MB/s eta 3m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 14%[=> ] 469.10M 13.7MB/s eta 3m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 14%[=> ] 472.45M 13.7MB/s eta 3m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 14%[=> ] 475.84M 13.7MB/s eta 3m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 14%[=> ] 479.18M 13.7MB/s eta 3m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 14%[=> ] 482.59M 13.7MB/s eta 3m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 14%[=> ] 485.96M 13.7MB/s eta 3m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 14%[=> ] 489.43M 13.7MB/s eta 3m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 15%[==> ] 492.92M 13.7MB/s eta 3m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 15%[==> ] 496.34M 13.7MB/s eta 3m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 15%[==> ] 499.74M 13.7MB/s eta 3m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 15%[==> ] 503.21M 13.7MB/s eta 3m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 15%[==> ] 506.71M 13.7MB/s eta 3m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 15%[==> ] 509.53M 13.4MB/s eta 3m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 15%[==> ] 512.95M 13.4MB/s eta 3m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 15%[==> ] 516.48M 13.4MB/s eta 3m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 15%[==> ] 519.88M 13.4MB/s eta 3m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 15%[==> ] 523.37M 13.4MB/s eta 3m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 15%[==> ] 524.68M 12.9MB/s eta 3m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 16%[==> ] 527.68M 12.9MB/s eta 3m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 16%[==> ] 530.18M 12.7MB/s eta 3m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 16%[==> ] 532.76M 12.7MB/s eta 3m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 16%[==> ] 535.40M 12.7MB/s eta 3m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 16%[==> ] 538.10M 12.5MB/s eta 3m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 16%[==> ] 540.87M 12.3MB/s eta 3m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 16%[==> ] 543.67M 12.2MB/s eta 3m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 16%[==> ] 546.53M 12.2MB/s eta 3m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 16%[==> ] 549.45M 12.0MB/s eta 3m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 16%[==> ] 552.40M 11.9MB/s eta 3m 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 16%[==> ] 555.38M 11.8MB/s eta 3m 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 17%[==> ] 558.43M 11.7MB/s eta 3m 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 17%[==> ] 561.48M 11.7MB/s eta 3m 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 17%[==> ] 564.56M 11.6MB/s eta 3m 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 17%[==> ] 567.70M 11.8MB/s eta 3m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 17%[==> ] 570.88M 11.8MB/s eta 3m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 17%[==> ] 574.09M 11.7MB/s eta 3m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 17%[==> ] 577.32M 11.7MB/s eta 3m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 17%[==> ] 580.59M 11.6MB/s eta 3m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 17%[==> ] 583.88M 12.1MB/s eta 3m 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 17%[==> ] 587.21M 12.1MB/s eta 3m 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 17%[==> ] 590.56M 12.3MB/s eta 3m 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 18%[==> ] 593.93M 12.4MB/s eta 3m 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 18%[==> ] 597.31M 12.5MB/s eta 3m 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 18%[==> ] 600.09M 12.4MB/s eta 3m 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 18%[==> ] 603.70M 12.6MB/s eta 3m 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 18%[==> ] 606.09M 12.6MB/s eta 3m 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 18%[==> ] 608.54M 12.4MB/s eta 3m 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 18%[==> ] 611.03M 12.4MB/s eta 3m 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 18%[==> ] 613.54M 12.3MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 18%[==> ] 616.09M 12.2MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 18%[==> ] 618.63M 12.2MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 18%[==> ] 621.24M 12.2MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 19%[==> ] 623.88M 12.1MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 19%[==> ] 626.54M 12.0MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 19%[==> ] 629.21M 11.9MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 19%[==> ] 631.92M 11.8MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 19%[==> ] 634.63M 11.7MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 19%[==> ] 637.38M 11.5MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 19%[==> ] 640.15M 11.3MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 19%[==> ] 642.92M 11.3MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 19%[==> ] 645.71M 11.1MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 19%[==> ] 648.53M 11.0MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 19%[==> ] 651.32M 10.9MB/s eta 3m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 19%[==> ] 654.13M 11.1MB/s eta 3m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 20%[===> ] 656.96M 10.7MB/s eta 3m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 20%[===> ] 659.81M 10.8MB/s eta 3m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 20%[===> ] 662.65M 10.8MB/s eta 3m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 20%[===> ] 665.53M 10.9MB/s eta 3m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 20%[===> ] 668.38M 11.0MB/s eta 3m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 20%[===> ] 671.26M 11.0MB/s eta 3m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 20%[===> ] 674.12M 11.1MB/s eta 3m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 20%[===> ] 677.01M 11.1MB/s eta 3m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 20%[===> ] 679.59M 11.1MB/s eta 3m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 20%[===> ] 682.48M 11.2MB/s eta 3m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 20%[===> ] 685.37M 11.2MB/s eta 3m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 20%[===> ] 687.90M 11.2MB/s eta 3m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 21%[===> ] 690.81M 11.2MB/s eta 3m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 21%[===> ] 693.57M 11.2MB/s eta 3m 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 21%[===> ] 696.45M 11.3MB/s eta 3m 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 21%[===> ] 699.03M 11.2MB/s eta 3m 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 21%[===> ] 701.92M 11.3MB/s eta 3m 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 21%[===> ] 704.82M 11.3MB/s eta 3m 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 21%[===> ] 707.54M 11.3MB/s eta 3m 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 21%[===> ] 710.42M 11.3MB/s eta 3m 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 21%[===> ] 713.31M 11.4MB/s eta 3m 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 21%[===> ] 716.23M 11.5MB/s eta 3m 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 21%[===> ] 718.74M 11.4MB/s eta 3m 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 21%[===> ] 721.65M 11.4MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 22%[===> ] 724.54M 11.4MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 22%[===> ] 727.46M 11.4MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 22%[===> ] 730.09M 11.4MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 22%[===> ] 732.99M 11.4MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 22%[===> ] 735.68M 11.4MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 22%[===> ] 736.71M 11.0MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 22%[===> ] 740.40M 11.1MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 22%[===> ] 742.43M 11.0MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 22%[===> ] 744.57M 10.9MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 22%[===> ] 746.74M 10.8MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 22%[===> ] 748.98M 10.6MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 22%[===> ] 751.26M 10.6MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 22%[===> ] 753.57M 10.5MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 23%[===> ] 755.93M 10.4MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 23%[===> ] 758.34M 10.3MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 23%[===> ] 760.78M 10.2MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 23%[===> ] 763.24M 10.1MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 23%[===> ] 765.73M 10.0MB/s eta 3m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 23%[===> ] 768.28M 10.0MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 23%[===> ] 770.82M 9.96MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 23%[===> ] 773.40M 9.90MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 23%[===> ] 776.01M 9.84MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 23%[===> ] 778.67M 9.85MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 23%[===> ] 781.31M 9.79MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 23%[===> ] 784.01M 9.80MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 23%[===> ] 786.73M 10.2MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 24%[===> ] 789.45M 9.98MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 24%[===> ] 792.20M 10.1MB/s eta 3m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 24%[===> ] 794.96M 10.2MB/s eta 3m 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 24%[===> ] 797.76M 10.4MB/s eta 3m 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 24%[===> ] 800.54M 10.5MB/s eta 3m 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 24%[===> ] 803.37M 10.6MB/s eta 3m 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 24%[===> ] 806.18M 10.7MB/s eta 3m 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 24%[===> ] 809.03M 10.8MB/s eta 3m 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 24%[===> ] 811.87M 10.9MB/s eta 3m 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 24%[===> ] 814.73M 11.0MB/s eta 3m 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 24%[===> ] 817.57M 11.0MB/s eta 3m 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 24%[===> ] 820.40M 11.1MB/s eta 3m 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 25%[====> ] 823.26M 11.2MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 25%[====> ] 826.13M 11.3MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 25%[====> ] 829.03M 11.3MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 25%[====> ] 831.92M 11.4MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 25%[====> ] 833.13M 11.0MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 25%[====> ] 835.60M 11.1MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 25%[====> ] 837.65M 10.8MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 25%[====> ] 839.73M 10.8MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 25%[====> ] 841.84M 10.6MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 25%[====> ] 843.98M 10.3MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 25%[====> ] 846.15M 10.3MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 25%[====> ] 848.35M 10.1MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 25%[====> ] 850.57M 9.82MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 25%[====> ] 852.81M 9.56MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 26%[====> ] 855.07M 9.41MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 26%[====> ] 857.35M 9.12MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 26%[====> ] 859.67M 8.87MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 26%[====> ] 861.99M 8.95MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 26%[====> ] 864.32M 8.67MB/s eta 3m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 26%[====> ] 866.68M 9.03MB/s eta 3m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 26%[====> ] 869.04M 8.99MB/s eta 3m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 26%[====> ] 871.42M 8.88MB/s eta 3m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 26%[====> ] 873.81M 9.31MB/s eta 3m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 26%[====> ] 876.21M 9.02MB/s eta 3m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 26%[====> ] 878.62M 9.29MB/s eta 3m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 26%[====> ] 881.03M 9.14MB/s eta 3m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 26%[====> ] 883.46M 9.41MB/s eta 3m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 26%[====> ] 885.88M 9.24MB/s eta 3m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 27%[====> ] 888.32M 9.69MB/s eta 3m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 27%[====> ] 890.76M 9.33MB/s eta 3m 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 27%[====> ] 893.21M 9.59MB/s eta 3m 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 27%[====> ] 895.67M 9.38MB/s eta 3m 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 27%[====> ] 898.12M 9.66MB/s eta 3m 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 27%[====> ] 900.57M 9.47MB/s eta 3m 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 27%[====> ] 903.04M 9.71MB/s eta 3m 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 27%[====> ] 905.51M 9.48MB/s eta 3m 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 27%[====> ] 907.96M 9.75MB/s eta 3m 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 27%[====> ] 910.42M 9.55MB/s eta 3m 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 27%[====> ] 912.88M 9.78MB/s eta 3m 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 27%[====> ] 915.35M 9.54MB/s eta 3m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 27%[====> ] 917.82M 9.99MB/s eta 3m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 28%[====> ] 920.29M 9.57MB/s eta 3m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 28%[====> ] 922.76M 9.82MB/s eta 3m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 28%[====> ] 925.21M 9.61MB/s eta 3m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 28%[====> ] 927.68M 9.84MB/s eta 3m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 28%[====> ] 930.13M 9.61MB/s eta 3m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 28%[====> ] 932.62M 9.83MB/s eta 3m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 28%[====> ] 935.07M 9.61MB/s eta 3m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 28%[====> ] 937.54M 10.0MB/s eta 3m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 28%[====> ] 939.99M 9.65MB/s eta 3m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 28%[====> ] 942.43M 10.2MB/s eta 3m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 28%[====> ] 944.90M 9.75MB/s eta 3m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 28%[====> ] 947.37M 10.2MB/s eta 3m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 28%[====> ] 949.85M 9.77MB/s eta 3m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 29%[====> ] 952.32M 10.2MB/s eta 3m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 29%[====> ] 954.79M 9.78MB/s eta 3m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 29%[====> ] 957.28M 10.2MB/s eta 3m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 29%[====> ] 959.76M 9.79MB/s eta 3m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 29%[====> ] 962.10M 10.3MB/s eta 3m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 29%[====> ] 964.59M 10.2MB/s eta 3m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 29%[====> ] 967.09M 9.91MB/s eta 3m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 29%[====> ] 969.59M 10.2MB/s eta 3m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 29%[====> ] 972.10M 10.0MB/s eta 3m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 29%[====> ] 974.62M 10.5MB/s eta 3m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 29%[====> ] 975.68M 10.1MB/s eta 3m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 29%[====> ] 977.38M 10.1MB/s eta 3m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 29%[====> ] 979.92M 10.1MB/s eta 3m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 29%[====> ] 982.28M 9.93MB/s eta 3m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 30%[=====> ] 984.84M 10.2MB/s eta 3m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 30%[=====> ] 987.43M 9.99MB/s eta 3m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 30%[=====> ] 990.03M 10.5MB/s eta 3m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 30%[=====> ] 992.62M 10.3MB/s eta 3m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 30%[=====> ] 993.74M 10.4MB/s eta 3m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 30%[=====> ] 995.62M 10.2MB/s eta 3m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 30%[=====> ] 998.13M 10.2MB/s eta 3m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 30%[=====> ] 1001M 10.6MB/s eta 3m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 30%[=====> ] 1003M 10.5MB/s eta 3m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 30%[=====> ] 1006M 10.6MB/s eta 3m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 30%[=====> ] 1009M 11.0MB/s eta 3m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 30%[=====> ] 1010M 10.6MB/s eta 3m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 30%[=====> ] 1012M 10.3MB/s eta 3m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 30%[=====> ] 1015M 10.9MB/s eta 3m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 30%[=====> ] 1017M 10.3MB/s eta 3m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 31%[=====> ] 1020M 10.8MB/s eta 3m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 31%[=====> ] 1023M 10.8MB/s eta 3m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 31%[=====> ] 1.00G 10.2MB/s eta 3m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 31%[=====> ] 1.00G 10.4MB/s eta 3m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 31%[=====> ] 1.00G 10.2MB/s eta 3m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 31%[=====> ] 1.01G 9.86MB/s eta 3m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 31%[=====> ] 1.01G 10.1MB/s eta 3m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 31%[=====> ] 1.01G 9.91MB/s eta 3m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 31%[=====> ] 1.01G 9.61MB/s eta 3m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 31%[=====> ] 1.01G 9.89MB/s eta 3m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 31%[=====> ] 1.02G 9.72MB/s eta 3m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 31%[=====> ] 1.02G 9.47MB/s eta 3m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 31%[=====> ] 1.02G 9.76MB/s eta 3m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 31%[=====> ] 1.02G 9.61MB/s eta 3m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 32%[=====> ] 1.03G 9.39MB/s eta 3m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 32%[=====> ] 1.03G 9.69MB/s eta 3m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 32%[=====> ] 1.03G 9.57MB/s eta 3m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 32%[=====> ] 1.03G 9.36MB/s eta 3m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 32%[=====> ] 1.04G 9.67MB/s eta 3m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 32%[=====> ] 1.04G 9.74MB/s eta 3m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 32%[=====> ] 1.04G 9.69MB/s eta 3m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 32%[=====> ] 1.04G 9.66MB/s eta 3m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 32%[=====> ] 1.05G 9.89MB/s eta 3m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 32%[=====> ] 1.05G 10.3MB/s eta 3m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 32%[=====> ] 1.05G 10.2MB/s eta 3m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 32%[=====> ] 1.06G 10.3MB/s eta 3m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 33%[=====> ] 1.06G 10.5MB/s eta 3m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 33%[=====> ] 1.06G 10.7MB/s eta 3m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 33%[=====> ] 1.06G 10.8MB/s eta 3m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 33%[=====> ] 1.07G 10.8MB/s eta 3m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 33%[=====> ] 1.07G 10.9MB/s eta 3m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 33%[=====> ] 1.07G 11.0MB/s eta 3m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 33%[=====> ] 1.08G 11.1MB/s eta 3m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 33%[=====> ] 1.08G 11.2MB/s eta 3m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 33%[=====> ] 1.08G 11.3MB/s eta 3m 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 33%[=====> ] 1.08G 11.3MB/s eta 3m 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 33%[=====> ] 1.09G 11.4MB/s eta 3m 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 34%[=====> ] 1.09G 11.5MB/s eta 3m 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 34%[=====> ] 1.09G 11.5MB/s eta 3m 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 34%[=====> ] 1.09G 11.6MB/s eta 3m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 34%[=====> ] 1.10G 11.6MB/s eta 3m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 34%[=====> ] 1.10G 11.7MB/s eta 3m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 34%[=====> ] 1.10G 11.7MB/s eta 3m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 34%[=====> ] 1.11G 11.8MB/s eta 3m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 34%[=====> ] 1.11G 11.7MB/s eta 3m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 34%[=====> ] 1.11G 11.5MB/s eta 3m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 34%[=====> ] 1.12G 11.4MB/s eta 3m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 34%[=====> ] 1.12G 11.8MB/s eta 3m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 34%[=====> ] 1.12G 11.8MB/s eta 3m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 35%[======> ] 1.12G 11.9MB/s eta 3m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 35%[======> ] 1.13G 11.9MB/s eta 3m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 35%[======> ] 1.13G 11.9MB/s eta 3m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 35%[======> ] 1.13G 11.9MB/s eta 3m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 35%[======> ] 1.14G 11.9MB/s eta 3m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 35%[======> ] 1.14G 11.9MB/s eta 3m 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 35%[======> ] 1.14G 11.9MB/s eta 3m 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 35%[======> ] 1.14G 11.9MB/s eta 3m 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 35%[======> ] 1.15G 11.9MB/s eta 3m 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 35%[======> ] 1.15G 11.9MB/s eta 3m 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 35%[======> ] 1.15G 11.9MB/s eta 3m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 36%[======> ] 1.16G 11.9MB/s eta 3m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 36%[======> ] 1.16G 11.9MB/s eta 3m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 36%[======> ] 1.16G 11.9MB/s eta 3m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 36%[======> ] 1.16G 11.9MB/s eta 3m 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 36%[======> ] 1.17G 12.0MB/s eta 3m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 36%[======> ] 1.17G 12.0MB/s eta 3m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 36%[======> ] 1.17G 12.0MB/s eta 3m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 36%[======> ] 1.18G 12.0MB/s eta 3m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 36%[======> ] 1.18G 12.0MB/s eta 3m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 36%[======> ] 1.18G 12.0MB/s eta 3m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 36%[======> ] 1.18G 12.0MB/s eta 3m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 37%[======> ] 1.19G 12.0MB/s eta 3m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 37%[======> ] 1.19G 12.0MB/s eta 3m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 37%[======> ] 1.19G 12.0MB/s eta 2m 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 37%[======> ] 1.20G 12.0MB/s eta 2m 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 37%[======> ] 1.20G 12.1MB/s eta 2m 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 37%[======> ] 1.20G 12.2MB/s eta 2m 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 37%[======> ] 1.21G 12.2MB/s eta 2m 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 37%[======> ] 1.21G 12.2MB/s eta 2m 57s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 37%[======> ] 1.21G 12.2MB/s eta 2m 57s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 37%[======> ] 1.21G 12.1MB/s eta 2m 57s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 38%[======> ] 1.22G 12.2MB/s eta 2m 57s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 38%[======> ] 1.22G 12.2MB/s eta 2m 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 38%[======> ] 1.22G 12.3MB/s eta 2m 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 38%[======> ] 1.23G 12.3MB/s eta 2m 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 38%[======> ] 1.23G 12.3MB/s eta 2m 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 38%[======> ] 1.23G 12.5MB/s eta 2m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 38%[======> ] 1.24G 12.4MB/s eta 2m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 38%[======> ] 1.24G 12.4MB/s eta 2m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 38%[======> ] 1.24G 12.5MB/s eta 2m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 38%[======> ] 1.25G 12.4MB/s eta 2m 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 38%[======> ] 1.25G 12.5MB/s eta 2m 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 39%[======> ] 1.25G 12.6MB/s eta 2m 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 39%[======> ] 1.25G 12.7MB/s eta 2m 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 39%[======> ] 1.26G 12.8MB/s eta 2m 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 39%[======> ] 1.26G 12.9MB/s eta 2m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 39%[======> ] 1.27G 13.0MB/s eta 2m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 39%[======> ] 1.27G 13.1MB/s eta 2m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 39%[======> ] 1.27G 13.3MB/s eta 2m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 39%[======> ] 1.28G 13.2MB/s eta 2m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 39%[======> ] 1.28G 13.5MB/s eta 2m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 40%[=======> ] 1.28G 13.6MB/s eta 2m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 40%[=======> ] 1.29G 13.7MB/s eta 2m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 40%[=======> ] 1.29G 13.8MB/s eta 2m 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 40%[=======> ] 1.29G 13.8MB/s eta 2m 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 40%[=======> ] 1.30G 13.9MB/s eta 2m 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 40%[=======> ] 1.30G 13.9MB/s eta 2m 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 40%[=======> ] 1.30G 14.1MB/s eta 2m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 40%[=======> ] 1.31G 14.3MB/s eta 2m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 40%[=======> ] 1.31G 14.4MB/s eta 2m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 41%[=======> ] 1.32G 14.5MB/s eta 2m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 41%[=======> ] 1.32G 14.6MB/s eta 2m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 41%[=======> ] 1.32G 14.7MB/s eta 2m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 41%[=======> ] 1.32G 14.2MB/s eta 2m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 41%[=======> ] 1.33G 14.2MB/s eta 2m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 41%[=======> ] 1.33G 14.2MB/s eta 2m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 41%[=======> ] 1.33G 14.1MB/s eta 2m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 41%[=======> ] 1.34G 14.1MB/s eta 2m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 41%[=======> ] 1.34G 13.6MB/s eta 2m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 41%[=======> ] 1.34G 13.7MB/s eta 2m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 41%[=======> ] 1.34G 13.4MB/s eta 2m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 42%[=======> ] 1.35G 13.2MB/s eta 2m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 42%[=======> ] 1.35G 12.9MB/s eta 2m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 42%[=======> ] 1.35G 12.7MB/s eta 2m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 42%[=======> ] 1.36G 12.7MB/s eta 2m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 42%[=======> ] 1.36G 12.5MB/s eta 2m 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 42%[=======> ] 1.36G 12.3MB/s eta 2m 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 42%[=======> ] 1.36G 12.1MB/s eta 2m 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 42%[=======> ] 1.37G 11.9MB/s eta 2m 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 42%[=======> ] 1.37G 11.7MB/s eta 2m 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 42%[=======> ] 1.37G 11.5MB/s eta 2m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 42%[=======> ] 1.37G 11.4MB/s eta 2m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 42%[=======> ] 1.38G 11.2MB/s eta 2m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 43%[=======> ] 1.38G 11.3MB/s eta 2m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 43%[=======> ] 1.38G 11.2MB/s eta 2m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 43%[=======> ] 1.38G 11.1MB/s eta 2m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 43%[=======> ] 1.39G 11.0MB/s eta 2m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 43%[=======> ] 1.39G 10.8MB/s eta 2m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 43%[=======> ] 1.39G 11.1MB/s eta 2m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 43%[=======> ] 1.40G 11.0MB/s eta 2m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 43%[=======> ] 1.40G 11.1MB/s eta 2m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 43%[=======> ] 1.40G 11.2MB/s eta 2m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 43%[=======> ] 1.40G 11.3MB/s eta 2m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 43%[=======> ] 1.41G 11.3MB/s eta 2m 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 44%[=======> ] 1.41G 11.4MB/s eta 2m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 44%[=======> ] 1.41G 11.5MB/s eta 2m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 44%[=======> ] 1.42G 11.5MB/s eta 2m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 44%[=======> ] 1.42G 11.6MB/s eta 2m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 44%[=======> ] 1.42G 11.6MB/s eta 2m 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 44%[=======> ] 1.42G 11.6MB/s eta 2m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 44%[=======> ] 1.43G 11.7MB/s eta 2m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 44%[=======> ] 1.43G 11.6MB/s eta 2m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 44%[=======> ] 1.43G 11.7MB/s eta 2m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 44%[=======> ] 1.44G 11.8MB/s eta 2m 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 44%[=======> ] 1.44G 11.9MB/s eta 2m 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 45%[========> ] 1.44G 12.0MB/s eta 2m 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 45%[========> ] 1.45G 12.0MB/s eta 2m 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 45%[========> ] 1.45G 12.1MB/s eta 2m 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 45%[========> ] 1.45G 12.1MB/s eta 2m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 45%[========> ] 1.45G 12.1MB/s eta 2m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 45%[========> ] 1.46G 12.2MB/s eta 2m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 45%[========> ] 1.46G 12.0MB/s eta 2m 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 45%[========> ] 1.46G 12.1MB/s eta 2m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 45%[========> ] 1.46G 11.9MB/s eta 2m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 45%[========> ] 1.47G 11.8MB/s eta 2m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 45%[========> ] 1.47G 11.6MB/s eta 2m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 45%[========> ] 1.47G 11.5MB/s eta 2m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 45%[========> ] 1.47G 11.4MB/s eta 2m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 46%[========> ] 1.48G 11.2MB/s eta 2m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 46%[========> ] 1.48G 11.1MB/s eta 2m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 46%[========> ] 1.48G 11.0MB/s eta 2m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 46%[========> ] 1.48G 10.9MB/s eta 2m 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 46%[========> ] 1.49G 10.8MB/s eta 2m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 46%[========> ] 1.49G 10.8MB/s eta 2m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 46%[========> ] 1.49G 10.7MB/s eta 2m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 46%[========> ] 1.49G 10.6MB/s eta 2m 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 46%[========> ] 1.50G 10.5MB/s eta 2m 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 46%[========> ] 1.50G 10.4MB/s eta 2m 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 46%[========> ] 1.50G 10.4MB/s eta 2m 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 46%[========> ] 1.50G 10.3MB/s eta 2m 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 47%[========> ] 1.51G 10.3MB/s eta 2m 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 47%[========> ] 1.51G 10.5MB/s eta 2m 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 47%[========> ] 1.51G 10.3MB/s eta 2m 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 47%[========> ] 1.51G 10.4MB/s eta 2m 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 47%[========> ] 1.52G 10.5MB/s eta 2m 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 47%[========> ] 1.52G 10.7MB/s eta 2m 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 47%[========> ] 1.52G 10.8MB/s eta 2m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 47%[========> ] 1.53G 10.9MB/s eta 2m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 47%[========> ] 1.53G 11.0MB/s eta 2m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 47%[========> ] 1.53G 11.1MB/s eta 2m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 47%[========> ] 1.53G 11.2MB/s eta 2m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 47%[========> ] 1.54G 11.2MB/s eta 2m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 48%[========> ] 1.54G 11.3MB/s eta 2m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 48%[========> ] 1.54G 11.4MB/s eta 2m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 48%[========> ] 1.55G 11.4MB/s eta 2m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 48%[========> ] 1.55G 11.5MB/s eta 2m 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 48%[========> ] 1.55G 11.5MB/s eta 2m 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 48%[========> ] 1.55G 11.6MB/s eta 2m 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 48%[========> ] 1.56G 11.6MB/s eta 2m 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 48%[========> ] 1.56G 11.7MB/s eta 2m 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 48%[========> ] 1.56G 11.7MB/s eta 2m 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 48%[========> ] 1.57G 11.8MB/s eta 2m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 48%[========> ] 1.57G 11.8MB/s eta 2m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 49%[========> ] 1.57G 11.8MB/s eta 2m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 49%[========> ] 1.58G 11.9MB/s eta 2m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 49%[========> ] 1.58G 11.9MB/s eta 2m 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 49%[========> ] 1.58G 11.9MB/s eta 2m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 49%[========> ] 1.58G 11.9MB/s eta 2m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 49%[========> ] 1.59G 11.9MB/s eta 2m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 49%[========> ] 1.59G 12.0MB/s eta 2m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 49%[========> ] 1.59G 12.0MB/s eta 2m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 49%[========> ] 1.60G 12.1MB/s eta 2m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 49%[========> ] 1.60G 12.1MB/s eta 2m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 49%[========> ] 1.60G 12.1MB/s eta 2m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 50%[=========> ] 1.60G 12.2MB/s eta 2m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 50%[=========> ] 1.61G 12.2MB/s eta 2m 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 50%[=========> ] 1.61G 12.2MB/s eta 2m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 50%[=========> ] 1.61G 12.2MB/s eta 2m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 50%[=========> ] 1.62G 12.2MB/s eta 2m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 50%[=========> ] 1.62G 12.2MB/s eta 2m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 50%[=========> ] 1.62G 11.9MB/s eta 2m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 50%[=========> ] 1.62G 12.0MB/s eta 2m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 50%[=========> ] 1.62G 11.6MB/s eta 2m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 50%[=========> ] 1.63G 11.4MB/s eta 2m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 50%[=========> ] 1.63G 11.3MB/s eta 2m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 50%[=========> ] 1.63G 11.1MB/s eta 2m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 50%[=========> ] 1.63G 11.0MB/s eta 2m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 51%[=========> ] 1.64G 10.8MB/s eta 2m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 51%[=========> ] 1.64G 10.7MB/s eta 2m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 51%[=========> ] 1.64G 10.6MB/s eta 2m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 51%[=========> ] 1.64G 10.5MB/s eta 2m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 51%[=========> ] 1.65G 10.3MB/s eta 2m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 51%[=========> ] 1.65G 10.3MB/s eta 2m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 51%[=========> ] 1.65G 10.2MB/s eta 2m 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 51%[=========> ] 1.65G 9.65MB/s eta 2m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 51%[=========> ] 1.66G 9.79MB/s eta 2m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 51%[=========> ] 1.66G 9.53MB/s eta 2m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 51%[=========> ] 1.66G 9.30MB/s eta 2m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 51%[=========> ] 1.66G 8.89MB/s eta 2m 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 51%[=========> ] 1.66G 9.08MB/s eta 2m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 51%[=========> ] 1.66G 9.06MB/s eta 2m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 51%[=========> ] 1.67G 9.26MB/s eta 2m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 52%[=========> ] 1.67G 8.99MB/s eta 2m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 52%[=========> ] 1.67G 8.96MB/s eta 2m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 52%[=========> ] 1.67G 8.94MB/s eta 2m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 52%[=========> ] 1.67G 8.90MB/s eta 2m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 52%[=========> ] 1.68G 8.86MB/s eta 2m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 52%[=========> ] 1.68G 8.81MB/s eta 2m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 52%[=========> ] 1.68G 8.76MB/s eta 2m 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 52%[=========> ] 1.68G 8.70MB/s eta 2m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 52%[=========> ] 1.68G 8.63MB/s eta 2m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 52%[=========> ] 1.69G 8.56MB/s eta 2m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 52%[=========> ] 1.69G 8.39MB/s eta 2m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 52%[=========> ] 1.69G 8.80MB/s eta 2m 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 52%[=========> ] 1.69G 8.55MB/s eta 2m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 52%[=========> ] 1.70G 8.71MB/s eta 2m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 52%[=========> ] 1.70G 8.84MB/s eta 2m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 53%[=========> ] 1.70G 8.94MB/s eta 2m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 53%[=========> ] 1.70G 9.06MB/s eta 2m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 53%[=========> ] 1.70G 8.77MB/s eta 2m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 53%[=========> ] 1.70G 8.82MB/s eta 2m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 53%[=========> ] 1.71G 8.85MB/s eta 2m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 53%[=========> ] 1.71G 8.92MB/s eta 2m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 53%[=========> ] 1.71G 8.95MB/s eta 2m 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 53%[=========> ] 1.71G 9.07MB/s eta 2m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 53%[=========> ] 1.71G 9.01MB/s eta 2m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 53%[=========> ] 1.72G 8.94MB/s eta 2m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 53%[=========> ] 1.72G 8.98MB/s eta 2m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 53%[=========> ] 1.72G 9.30MB/s eta 2m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 53%[=========> ] 1.72G 9.12MB/s eta 2m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 53%[=========> ] 1.72G 8.97MB/s eta 2m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 53%[=========> ] 1.73G 8.83MB/s eta 2m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 53%[=========> ] 1.73G 8.83MB/s eta 2m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 53%[=========> ] 1.73G 9.01MB/s eta 2m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 54%[=========> ] 1.73G 9.05MB/s eta 2m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 54%[=========> ] 1.73G 9.40MB/s eta 2m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 54%[=========> ] 1.74G 9.38MB/s eta 2m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 54%[=========> ] 1.74G 8.72MB/s eta 2m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 54%[=========> ] 1.74G 9.12MB/s eta 2m 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 54%[=========> ] 1.74G 8.92MB/s eta 2m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 54%[=========> ] 1.74G 9.17MB/s eta 2m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 54%[=========> ] 1.75G 9.24MB/s eta 2m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 54%[=========> ] 1.75G 9.13MB/s eta 2m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 54%[=========> ] 1.75G 9.14MB/s eta 2m 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 54%[=========> ] 1.75G 9.29MB/s eta 2m 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 54%[=========> ] 1.75G 8.75MB/s eta 2m 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 54%[=========> ] 1.75G 9.24MB/s eta 2m 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 54%[=========> ] 1.76G 8.87MB/s eta 2m 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 54%[=========> ] 1.76G 9.25MB/s eta 2m 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 54%[=========> ] 1.76G 8.89MB/s eta 2m 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 55%[==========> ] 1.76G 9.32MB/s eta 2m 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 55%[==========> ] 1.77G 9.25MB/s eta 2m 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 55%[==========> ] 1.77G 9.16MB/s eta 2m 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 55%[==========> ] 1.77G 9.34MB/s eta 2m 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 55%[==========> ] 1.77G 8.80MB/s eta 2m 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 55%[==========> ] 1.77G 9.28MB/s eta 2m 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 55%[==========> ] 1.77G 9.01MB/s eta 2m 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 55%[==========> ] 1.78G 9.06MB/s eta 2m 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 55%[==========> ] 1.78G 9.47MB/s eta 2m 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 55%[==========> ] 1.78G 9.32MB/s eta 2m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 55%[==========> ] 1.78G 9.57MB/s eta 2m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 55%[==========> ] 1.78G 8.98MB/s eta 2m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 55%[==========> ] 1.79G 9.11MB/s eta 2m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 55%[==========> ] 1.79G 9.16MB/s eta 2m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 55%[==========> ] 1.79G 9.27MB/s eta 2m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 55%[==========> ] 1.79G 9.64MB/s eta 2m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 56%[==========> ] 1.79G 9.53MB/s eta 2m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 56%[==========> ] 1.80G 9.82MB/s eta 2m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 56%[==========> ] 1.80G 9.21MB/s eta 2m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 56%[==========> ] 1.80G 9.33MB/s eta 2m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 56%[==========> ] 1.80G 9.43MB/s eta 2m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 56%[==========> ] 1.80G 9.87MB/s eta 2m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 56%[==========> ] 1.81G 9.99MB/s eta 2m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 56%[==========> ] 1.81G 9.90MB/s eta 2m 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 56%[==========> ] 1.81G 10.2MB/s eta 2m 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 56%[==========> ] 1.81G 9.61MB/s eta 2m 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 56%[==========> ] 1.81G 9.79MB/s eta 2m 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 56%[==========> ] 1.82G 9.92MB/s eta 2m 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 56%[==========> ] 1.82G 10.1MB/s eta 2m 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 56%[==========> ] 1.82G 10.5MB/s eta 2m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 56%[==========> ] 1.83G 10.7MB/s eta 2m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 57%[==========> ] 1.83G 10.9MB/s eta 2m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 57%[==========> ] 1.83G 10.2MB/s eta 2m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 57%[==========> ] 1.83G 10.3MB/s eta 2m 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 57%[==========> ] 1.83G 10.6MB/s eta 2m 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 57%[==========> ] 1.84G 10.5MB/s eta 2m 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 57%[==========> ] 1.84G 10.5MB/s eta 2m 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 57%[==========> ] 1.84G 10.8MB/s eta 2m 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 57%[==========> ] 1.84G 10.7MB/s eta 2m 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 57%[==========> ] 1.85G 11.0MB/s eta 2m 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 57%[==========> ] 1.85G 11.3MB/s eta 2m 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 57%[==========> ] 1.85G 11.2MB/s eta 2m 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 57%[==========> ] 1.86G 11.3MB/s eta 2m 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 58%[==========> ] 1.86G 11.7MB/s eta 2m 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 58%[==========> ] 1.86G 11.7MB/s eta 2m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 58%[==========> ] 1.87G 12.0MB/s eta 2m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 58%[==========> ] 1.87G 12.2MB/s eta 2m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 58%[==========> ] 1.87G 12.3MB/s eta 2m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 58%[==========> ] 1.88G 12.7MB/s eta 2m 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 58%[==========> ] 1.88G 12.7MB/s eta 1m 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 58%[==========> ] 1.89G 12.7MB/s eta 1m 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 58%[==========> ] 1.89G 13.1MB/s eta 1m 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 59%[==========> ] 1.89G 13.3MB/s eta 1m 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 59%[==========> ] 1.90G 13.3MB/s eta 1m 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 59%[==========> ] 1.90G 13.4MB/s eta 1m 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 59%[==========> ] 1.90G 13.6MB/s eta 1m 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 59%[==========> ] 1.91G 13.9MB/s eta 1m 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 59%[==========> ] 1.91G 14.0MB/s eta 1m 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 59%[==========> ] 1.91G 14.2MB/s eta 1m 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 59%[==========> ] 1.92G 14.3MB/s eta 1m 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 59%[==========> ] 1.92G 14.4MB/s eta 1m 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 60%[===========> ] 1.92G 14.5MB/s eta 1m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 60%[===========> ] 1.93G 14.6MB/s eta 1m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 60%[===========> ] 1.93G 14.6MB/s eta 1m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 60%[===========> ] 1.94G 14.7MB/s eta 1m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 60%[===========> ] 1.94G 14.8MB/s eta 1m 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 60%[===========> ] 1.94G 14.8MB/s eta 1m 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 60%[===========> ] 1.95G 14.8MB/s eta 1m 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 60%[===========> ] 1.95G 14.8MB/s eta 1m 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 60%[===========> ] 1.95G 15.0MB/s eta 1m 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 61%[===========> ] 1.96G 15.0MB/s eta 1m 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 61%[===========> ] 1.96G 15.0MB/s eta 1m 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 61%[===========> ] 1.97G 15.0MB/s eta 1m 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 61%[===========> ] 1.97G 15.2MB/s eta 1m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 61%[===========> ] 1.97G 15.2MB/s eta 1m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 61%[===========> ] 1.98G 15.2MB/s eta 1m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 61%[===========> ] 1.98G 15.2MB/s eta 1m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 61%[===========> ] 1.98G 15.2MB/s eta 1m 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 62%[===========> ] 1.99G 15.2MB/s eta 1m 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 62%[===========> ] 1.99G 15.2MB/s eta 1m 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 62%[===========> ] 2.00G 15.2MB/s eta 1m 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 62%[===========> ] 2.00G 15.2MB/s eta 1m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 62%[===========> ] 2.00G 15.2MB/s eta 1m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 62%[===========> ] 2.01G 15.2MB/s eta 1m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 62%[===========> ] 2.01G 15.2MB/s eta 1m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 62%[===========> ] 2.01G 15.2MB/s eta 1m 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 62%[===========> ] 2.02G 15.2MB/s eta 1m 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 63%[===========> ] 2.02G 15.1MB/s eta 1m 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 63%[===========> ] 2.02G 15.1MB/s eta 1m 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 63%[===========> ] 2.03G 15.1MB/s eta 1m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 63%[===========> ] 2.03G 15.1MB/s eta 1m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 63%[===========> ] 2.04G 15.1MB/s eta 1m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 63%[===========> ] 2.04G 15.1MB/s eta 1m 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 63%[===========> ] 2.04G 15.1MB/s eta 1m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 63%[===========> ] 2.05G 15.1MB/s eta 1m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 63%[===========> ] 2.05G 15.2MB/s eta 1m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 64%[===========> ] 2.05G 15.1MB/s eta 1m 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 64%[===========> ] 2.06G 14.9MB/s eta 1m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 64%[===========> ] 2.06G 14.8MB/s eta 1m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 64%[===========> ] 2.06G 14.7MB/s eta 1m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 64%[===========> ] 2.07G 14.5MB/s eta 1m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 64%[===========> ] 2.07G 14.3MB/s eta 1m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 64%[===========> ] 2.07G 14.2MB/s eta 1m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 64%[===========> ] 2.07G 14.1MB/s eta 1m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 64%[===========> ] 2.08G 14.0MB/s eta 1m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 64%[===========> ] 2.08G 13.9MB/s eta 1m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 65%[============> ] 2.08G 13.9MB/s eta 1m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 65%[============> ] 2.09G 13.8MB/s eta 98s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 65%[============> ] 2.09G 13.8MB/s eta 98s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 65%[============> ] 2.09G 13.8MB/s eta 98s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 65%[============> ] 2.10G 13.7MB/s eta 98s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 65%[============> ] 2.10G 13.7MB/s eta 98s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 65%[============> ] 2.11G 13.7MB/s eta 97s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 65%[============> ] 2.11G 13.7MB/s eta 97s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 65%[============> ] 2.11G 13.6MB/s eta 97s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 66%[============> ] 2.12G 13.5MB/s eta 97s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 66%[============> ] 2.12G 13.6MB/s eta 95s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 66%[============> ] 2.12G 13.8MB/s eta 95s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 66%[============> ] 2.13G 13.9MB/s eta 95s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 66%[============> ] 2.13G 14.0MB/s eta 95s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 66%[============> ] 2.13G 13.9MB/s eta 94s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 66%[============> ] 2.14G 14.3MB/s eta 94s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 66%[============> ] 2.14G 14.3MB/s eta 94s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 66%[============> ] 2.14G 14.3MB/s eta 94s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 67%[============> ] 2.15G 14.4MB/s eta 93s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 67%[============> ] 2.15G 14.3MB/s eta 93s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 67%[============> ] 2.15G 14.4MB/s eta 93s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 67%[============> ] 2.16G 14.4MB/s eta 93s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 67%[============> ] 2.16G 14.5MB/s eta 91s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 67%[============> ] 2.17G 14.5MB/s eta 91s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 67%[============> ] 2.17G 14.5MB/s eta 91s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 67%[============> ] 2.17G 14.5MB/s eta 91s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 67%[============> ] 2.18G 14.5MB/s eta 90s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 67%[============> ] 2.18G 13.8MB/s eta 90s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 68%[============> ] 2.18G 13.9MB/s eta 90s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 68%[============> ] 2.18G 13.7MB/s eta 90s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 68%[============> ] 2.18G 13.3MB/s eta 90s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 68%[============> ] 2.19G 13.0MB/s eta 89s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 68%[============> ] 2.19G 12.7MB/s eta 89s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 68%[============> ] 2.19G 12.3MB/s eta 89s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 68%[============> ] 2.19G 12.3MB/s eta 89s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 68%[============> ] 2.19G 11.9MB/s eta 89s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 68%[============> ] 2.20G 11.6MB/s eta 88s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 68%[============> ] 2.20G 11.3MB/s eta 88s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 68%[============> ] 2.20G 11.0MB/s eta 88s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 68%[============> ] 2.20G 10.9MB/s eta 88s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 68%[============> ] 2.20G 10.3MB/s eta 88s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 68%[============> ] 2.21G 10.2MB/s eta 88s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 68%[============> ] 2.21G 9.73MB/s eta 88s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 68%[============> ] 2.21G 9.31MB/s eta 88s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 69%[============> ] 2.21G 8.89MB/s eta 88s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 69%[============> ] 2.21G 8.46MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 69%[============> ] 2.21G 8.17MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 69%[============> ] 2.22G 8.42MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 69%[============> ] 2.22G 7.97MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 69%[============> ] 2.22G 7.76MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 69%[============> ] 2.22G 7.83MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 69%[============> ] 2.22G 7.68MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 69%[============> ] 2.23G 7.62MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 69%[============> ] 2.23G 7.56MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 69%[============> ] 2.23G 7.48MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 69%[============> ] 2.23G 7.36MB/s eta 86s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 69%[============> ] 2.23G 7.35MB/s eta 86s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 69%[============> ] 2.23G 7.20MB/s eta 86s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 69%[============> ] 2.24G 7.07MB/s eta 86s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 69%[============> ] 2.24G 7.14MB/s eta 86s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 69%[============> ] 2.24G 7.20MB/s eta 86s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 69%[============> ] 2.24G 7.29MB/s eta 86s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 70%[=============> ] 2.24G 7.32MB/s eta 86s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 70%[=============> ] 2.25G 7.41MB/s eta 86s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 70%[=============> ] 2.25G 7.37MB/s eta 85s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 70%[=============> ] 2.25G 7.39MB/s eta 85s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 70%[=============> ] 2.25G 7.60MB/s eta 85s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 70%[=============> ] 2.25G 7.72MB/s eta 85s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 70%[=============> ] 2.25G 7.66MB/s eta 85s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 70%[=============> ] 2.25G 7.14MB/s eta 85s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 70%[=============> ] 2.26G 7.29MB/s eta 85s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 70%[=============> ] 2.26G 7.07MB/s eta 85s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 70%[=============> ] 2.26G 7.20MB/s eta 85s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 70%[=============> ] 2.26G 7.04MB/s eta 85s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 70%[=============> ] 2.26G 6.81MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 70%[=============> ] 2.26G 6.87MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 70%[=============> ] 2.26G 6.54MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 70%[=============> ] 2.27G 6.42MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 70%[=============> ] 2.27G 6.37MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 70%[=============> ] 2.27G 6.18MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 70%[=============> ] 2.27G 6.22MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 70%[=============> ] 2.27G 6.05MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 70%[=============> ] 2.27G 6.18MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 70%[=============> ] 2.27G 5.91MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 70%[=============> ] 2.27G 6.07MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 71%[=============> ] 2.28G 6.25MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 71%[=============> ] 2.28G 5.77MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 71%[=============> ] 2.28G 6.01MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 71%[=============> ] 2.28G 6.14MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 71%[=============> ] 2.28G 6.12MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 71%[=============> ] 2.28G 6.34MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 71%[=============> ] 2.28G 6.14MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 71%[=============> ] 2.29G 6.13MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 71%[=============> ] 2.29G 6.07MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 71%[=============> ] 2.29G 6.29MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 71%[=============> ] 2.29G 6.48MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 71%[=============> ] 2.29G 6.42MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 71%[=============> ] 2.29G 6.65MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 71%[=============> ] 2.29G 6.42MB/s eta 83s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 71%[=============> ] 2.29G 6.17MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 71%[=============> ] 2.30G 6.51MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 71%[=============> ] 2.30G 6.45MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 71%[=============> ] 2.30G 6.42MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 71%[=============> ] 2.30G 6.59MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 71%[=============> ] 2.30G 6.40MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 71%[=============> ] 2.30G 6.50MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 71%[=============> ] 2.30G 6.44MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 71%[=============> ] 2.30G 6.67MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 71%[=============> ] 2.31G 6.58MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 72%[=============> ] 2.31G 6.52MB/s eta 81s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 72%[=============> ] 2.31G 6.69MB/s eta 81s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 72%[=============> ] 2.31G 6.26MB/s eta 81s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 72%[=============> ] 2.31G 6.53MB/s eta 81s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 72%[=============> ] 2.31G 6.27MB/s eta 81s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 72%[=============> ] 2.31G 6.64MB/s eta 81s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 72%[=============> ] 2.32G 6.61MB/s eta 81s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 72%[=============> ] 2.32G 6.54MB/s eta 81s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 72%[=============> ] 2.32G 6.81MB/s eta 81s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 72%[=============> ] 2.32G 6.54MB/s eta 81s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 72%[=============> ] 2.32G 6.28MB/s eta 80s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 72%[=============> ] 2.32G 6.63MB/s eta 80s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 72%[=============> ] 2.32G 6.43MB/s eta 80s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 72%[=============> ] 2.33G 6.78MB/s eta 80s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 72%[=============> ] 2.33G 6.66MB/s eta 80s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 72%[=============> ] 2.33G 6.43MB/s eta 80s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 72%[=============> ] 2.33G 6.41MB/s eta 80s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 72%[=============> ] 2.33G 6.38MB/s eta 80s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 72%[=============> ] 2.33G 6.74MB/s eta 80s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 72%[=============> ] 2.33G 6.65MB/s eta 80s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 72%[=============> ] 2.33G 6.88MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 72%[=============> ] 2.34G 6.59MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 72%[=============> ] 2.34G 6.35MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 72%[=============> ] 2.34G 6.72MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 73%[=============> ] 2.34G 6.55MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 73%[=============> ] 2.34G 6.91MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 73%[=============> ] 2.34G 6.81MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 73%[=============> ] 2.34G 6.59MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 73%[=============> ] 2.34G 6.59MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 73%[=============> ] 2.35G 6.59MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 73%[=============> ] 2.35G 6.96MB/s eta 78s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 73%[=============> ] 2.35G 6.91MB/s eta 78s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 73%[=============> ] 2.35G 7.17MB/s eta 78s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 73%[=============> ] 2.35G 6.89MB/s eta 78s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 73%[=============> ] 2.35G 6.68MB/s eta 78s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 73%[=============> ] 2.36G 7.09MB/s eta 78s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 73%[=============> ] 2.36G 6.95MB/s eta 78s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 73%[=============> ] 2.36G 7.35MB/s eta 78s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 73%[=============> ] 2.36G 7.29MB/s eta 78s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 73%[=============> ] 2.36G 7.07MB/s eta 78s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 73%[=============> ] 2.36G 7.11MB/s eta 77s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 73%[=============> ] 2.36G 7.15MB/s eta 77s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 73%[=============> ] 2.37G 7.58MB/s eta 77s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 73%[=============> ] 2.37G 7.58MB/s eta 77s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 73%[=============> ] 2.37G 7.90MB/s eta 77s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 74%[=============> ] 2.37G 7.64MB/s eta 77s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 74%[=============> ] 2.37G 7.44MB/s eta 77s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 74%[=============> ] 2.38G 7.90MB/s eta 77s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 74%[=============> ] 2.38G 7.82MB/s eta 77s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 74%[=============> ] 2.38G 8.31MB/s eta 77s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 74%[=============> ] 2.38G 8.30MB/s eta 76s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 74%[=============> ] 2.38G 8.08MB/s eta 76s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 74%[=============> ] 2.38G 8.17MB/s eta 76s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 74%[=============> ] 2.39G 8.18MB/s eta 76s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 74%[=============> ] 2.39G 8.70MB/s eta 76s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 74%[=============> ] 2.39G 8.66MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 74%[=============> ] 2.39G 9.22MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 74%[=============> ] 2.39G 9.24MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 74%[=============> ] 2.40G 9.02MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 74%[=============> ] 2.40G 9.17MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 74%[=============> ] 2.40G 9.28MB/s eta 74s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 74%[=============> ] 2.40G 9.88MB/s eta 74s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 75%[==============> ] 2.41G 9.97MB/s eta 74s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 75%[==============> ] 2.41G 10.3MB/s eta 74s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 75%[==============> ] 2.41G 10.1MB/s eta 74s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 75%[==============> ] 2.41G 9.89MB/s eta 73s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 75%[==============> ] 2.41G 10.4MB/s eta 73s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 75%[==============> ] 2.42G 10.4MB/s eta 73s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 75%[==============> ] 2.42G 10.4MB/s eta 73s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 75%[==============> ] 2.42G 11.0MB/s eta 72s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 75%[==============> ] 2.43G 11.1MB/s eta 72s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 75%[==============> ] 2.43G 11.1MB/s eta 72s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 75%[==============> ] 2.43G 11.7MB/s eta 72s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 76%[==============> ] 2.44G 11.8MB/s eta 72s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 76%[==============> ] 2.44G 11.9MB/s eta 70s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 76%[==============> ] 2.44G 12.5MB/s eta 70s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 76%[==============> ] 2.45G 12.5MB/s eta 70s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 76%[==============> ] 2.45G 12.6MB/s eta 70s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 76%[==============> ] 2.46G 13.1MB/s eta 69s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 76%[==============> ] 2.46G 13.1MB/s eta 69s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 76%[==============> ] 2.46G 12.7MB/s eta 69s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 76%[==============> ] 2.46G 13.1MB/s eta 69s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 76%[==============> ] 2.47G 12.9MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 77%[==============> ] 2.47G 12.9MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 77%[==============> ] 2.47G 13.1MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 77%[==============> ] 2.48G 13.2MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 77%[==============> ] 2.48G 13.2MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 77%[==============> ] 2.48G 13.2MB/s eta 66s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 77%[==============> ] 2.48G 13.2MB/s eta 66s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 77%[==============> ] 2.49G 13.1MB/s eta 66s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 77%[==============> ] 2.49G 13.1MB/s eta 66s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 77%[==============> ] 2.49G 13.1MB/s eta 66s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 77%[==============> ] 2.50G 13.0MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 78%[==============> ] 2.50G 13.0MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 78%[==============> ] 2.50G 12.9MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 78%[==============> ] 2.51G 12.8MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 78%[==============> ] 2.51G 12.8MB/s eta 64s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 78%[==============> ] 2.51G 12.7MB/s eta 64s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 78%[==============> ] 2.52G 12.6MB/s eta 64s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 78%[==============> ] 2.52G 12.6MB/s eta 64s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 78%[==============> ] 2.52G 13.0MB/s eta 64s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 78%[==============> ] 2.53G 13.0MB/s eta 62s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 78%[==============> ] 2.53G 13.2MB/s eta 62s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 79%[==============> ] 2.53G 12.9MB/s eta 62s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 79%[==============> ] 2.54G 13.0MB/s eta 62s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 79%[==============> ] 2.54G 12.9MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 79%[==============> ] 2.54G 12.9MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 79%[==============> ] 2.54G 12.8MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 79%[==============> ] 2.55G 12.7MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 79%[==============> ] 2.55G 12.8MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 79%[==============> ] 2.55G 12.7MB/s eta 60s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 79%[==============> ] 2.55G 12.6MB/s eta 60s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 79%[==============> ] 2.56G 12.5MB/s eta 60s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 79%[==============> ] 2.56G 12.3MB/s eta 60s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 79%[==============> ] 2.56G 12.2MB/s eta 60s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 80%[===============> ] 2.57G 12.2MB/s eta 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 80%[===============> ] 2.57G 12.1MB/s eta 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 80%[===============> ] 2.57G 12.0MB/s eta 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 80%[===============> ] 2.57G 11.9MB/s eta 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 80%[===============> ] 2.58G 11.8MB/s eta 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 80%[===============> ] 2.58G 11.6MB/s eta 57s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 80%[===============> ] 2.58G 11.6MB/s eta 57s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 80%[===============> ] 2.59G 11.4MB/s eta 57s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 80%[===============> ] 2.59G 11.8MB/s eta 57s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 80%[===============> ] 2.59G 11.7MB/s eta 57s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 80%[===============> ] 2.59G 11.8MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 81%[===============> ] 2.60G 11.9MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 81%[===============> ] 2.60G 11.9MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 81%[===============> ] 2.60G 12.1MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 81%[===============> ] 2.61G 12.1MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 81%[===============> ] 2.61G 12.1MB/s eta 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 81%[===============> ] 2.61G 12.3MB/s eta 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 81%[===============> ] 2.62G 12.3MB/s eta 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 81%[===============> ] 2.62G 12.4MB/s eta 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 81%[===============> ] 2.62G 12.4MB/s eta 54s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 81%[===============> ] 2.63G 12.5MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 81%[===============> ] 2.63G 12.1MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 82%[===============> ] 2.63G 12.3MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 82%[===============> ] 2.63G 12.2MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 82%[===============> ] 2.63G 12.0MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 82%[===============> ] 2.64G 11.9MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 82%[===============> ] 2.64G 11.8MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 82%[===============> ] 2.64G 11.6MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 82%[===============> ] 2.64G 11.5MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 82%[===============> ] 2.65G 11.3MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 82%[===============> ] 2.65G 11.2MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 82%[===============> ] 2.65G 11.1MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 82%[===============> ] 2.65G 11.0MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 82%[===============> ] 2.66G 10.8MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 82%[===============> ] 2.66G 10.8MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 83%[===============> ] 2.66G 10.7MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 83%[===============> ] 2.66G 10.5MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 83%[===============> ] 2.67G 10.4MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 83%[===============> ] 2.67G 10.3MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 83%[===============> ] 2.67G 10.2MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 83%[===============> ] 2.67G 10.1MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 83%[===============> ] 2.68G 10.4MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 83%[===============> ] 2.68G 10.2MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 83%[===============> ] 2.68G 10.2MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 83%[===============> ] 2.68G 10.3MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 83%[===============> ] 2.69G 10.4MB/s eta 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 83%[===============> ] 2.69G 10.5MB/s eta 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 84%[===============> ] 2.69G 10.5MB/s eta 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 84%[===============> ] 2.69G 10.5MB/s eta 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 84%[===============> ] 2.70G 10.6MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 84%[===============> ] 2.70G 10.7MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 84%[===============> ] 2.70G 10.7MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 84%[===============> ] 2.71G 10.8MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 84%[===============> ] 2.71G 10.6MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 84%[===============> ] 2.71G 10.6MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 84%[===============> ] 2.71G 10.7MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 84%[===============> ] 2.72G 10.8MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 84%[===============> ] 2.72G 10.9MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 84%[===============> ] 2.72G 10.8MB/s eta 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 84%[===============> ] 2.72G 10.8MB/s eta 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 85%[================> ] 2.73G 11.0MB/s eta 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 85%[================> ] 2.73G 10.9MB/s eta 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 85%[================> ] 2.73G 10.9MB/s eta 44s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 85%[================> ] 2.73G 11.0MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 85%[================> ] 2.74G 11.0MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 85%[================> ] 2.74G 11.0MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 85%[================> ] 2.74G 11.0MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 85%[================> ] 2.75G 11.1MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 85%[================> ] 2.75G 11.0MB/s eta 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 85%[================> ] 2.75G 11.0MB/s eta 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 85%[================> ] 2.75G 11.0MB/s eta 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 85%[================> ] 2.75G 11.0MB/s eta 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 85%[================> ] 2.76G 9.85MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 86%[================> ] 2.76G 10.5MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 86%[================> ] 2.76G 10.3MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 86%[================> ] 2.76G 9.79MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 86%[================> ] 2.76G 10.1MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 86%[================> ] 2.77G 9.67MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 86%[================> ] 2.77G 9.26MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 86%[================> ] 2.77G 9.35MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 86%[================> ] 2.77G 8.98MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 86%[================> ] 2.78G 9.07MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 86%[================> ] 2.78G 8.72MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 86%[================> ] 2.78G 8.83MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 86%[================> ] 2.78G 8.51MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 86%[================> ] 2.78G 8.62MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 86%[================> ] 2.79G 9.40MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 87%[================> ] 2.79G 9.05MB/s eta 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 87%[================> ] 2.79G 9.28MB/s eta 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 87%[================> ] 2.79G 9.36MB/s eta 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 87%[================> ] 2.79G 9.04MB/s eta 38s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 87%[================> ] 2.80G 9.22MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 87%[================> ] 2.80G 8.93MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 87%[================> ] 2.80G 9.23MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 87%[================> ] 2.80G 8.85MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 87%[================> ] 2.81G 9.22MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 87%[================> ] 2.81G 8.97MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 87%[================> ] 2.81G 9.02MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 87%[================> ] 2.81G 8.68MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 87%[================> ] 2.81G 8.71MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 87%[================> ] 2.81G 8.47MB/s eta 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 87%[================> ] 2.82G 8.47MB/s eta 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 87%[================> ] 2.82G 8.32MB/s eta 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 88%[================> ] 2.82G 7.94MB/s eta 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 88%[================> ] 2.82G 8.00MB/s eta 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 88%[================> ] 2.82G 8.34MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 88%[================> ] 2.83G 7.93MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 88%[================> ] 2.83G 7.81MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 88%[================> ] 2.83G 8.08MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 88%[================> ] 2.83G 8.03MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 88%[================> ] 2.83G 8.50MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 88%[================> ] 2.84G 8.53MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 88%[================> ] 2.84G 7.91MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 88%[================> ] 2.84G 8.31MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 88%[================> ] 2.84G 8.30MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 88%[================> ] 2.84G 8.55MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 88%[================> ] 2.84G 8.45MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 88%[================> ] 2.85G 8.48MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 88%[================> ] 2.85G 8.06MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 89%[================> ] 2.85G 8.37MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 89%[================> ] 2.85G 8.36MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 89%[================> ] 2.86G 8.09MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 89%[================> ] 2.86G 8.08MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 89%[================> ] 2.86G 7.85MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 89%[================> ] 2.86G 7.55MB/s eta 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 89%[================> ] 2.86G 7.56MB/s eta 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 89%[================> ] 2.86G 7.31MB/s eta 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 89%[================> ] 2.87G 7.55MB/s eta 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 89%[================> ] 2.87G 7.08MB/s eta 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 89%[================> ] 2.87G 7.30MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 89%[================> ] 2.87G 6.80MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 89%[================> ] 2.87G 7.12MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 89%[================> ] 2.87G 7.19MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 89%[================> ] 2.88G 6.48MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 89%[================> ] 2.88G 6.82MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 89%[================> ] 2.88G 6.32MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 89%[================> ] 2.88G 6.30MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 89%[================> ] 2.88G 6.48MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 89%[================> ] 2.88G 6.36MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 89%[================> ] 2.88G 6.45MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 90%[=================> ] 2.88G 6.33MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 90%[=================> ] 2.89G 6.03MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 90%[=================> ] 2.89G 6.21MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 90%[=================> ] 2.89G 5.80MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 90%[=================> ] 2.89G 6.07MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 90%[=================> ] 2.89G 5.86MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 90%[=================> ] 2.89G 5.81MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 90%[=================> ] 2.89G 5.71MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 90%[=================> ] 2.90G 5.31MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 90%[=================> ] 2.90G 5.55MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 90%[=================> ] 2.90G 5.77MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 90%[=================> ] 2.90G 5.98MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 90%[=================> ] 2.90G 5.67MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 90%[=================> ] 2.90G 5.64MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 90%[=================> ] 2.90G 5.78MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 90%[=================> ] 2.90G 5.48MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 90%[=================> ] 2.91G 5.79MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 90%[=================> ] 2.91G 5.80MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 90%[=================> ] 2.91G 5.75MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 90%[=================> ] 2.91G 6.07MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 90%[=================> ] 2.91G 5.97MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 90%[=================> ] 2.91G 5.79MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 90%[=================> ] 2.91G 5.70MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 90%[=================> ] 2.91G 5.97MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 90%[=================> ] 2.92G 5.90MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 91%[=================> ] 2.92G 5.94MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 91%[=================> ] 2.92G 6.02MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 91%[=================> ] 2.92G 6.11MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 91%[=================> ] 2.92G 6.09MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 91%[=================> ] 2.92G 6.04MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 91%[=================> ] 2.92G 6.26MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 91%[=================> ] 2.92G 6.02MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 91%[=================> ] 2.93G 5.93MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 91%[=================> ] 2.93G 6.03MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 91%[=================> ] 2.93G 6.03MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 91%[=================> ] 2.93G 5.92MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 91%[=================> ] 2.93G 6.09MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 91%[=================> ] 2.93G 6.11MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 91%[=================> ] 2.93G 6.08MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 91%[=================> ] 2.94G 6.04MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 91%[=================> ] 2.94G 6.19MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 91%[=================> ] 2.94G 6.12MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 91%[=================> ] 2.94G 6.09MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 91%[=================> ] 2.94G 6.03MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 91%[=================> ] 2.94G 6.13MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 91%[=================> ] 2.95G 6.10MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 91%[=================> ] 2.95G 6.07MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 91%[=================> ] 2.95G 6.09MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 92%[=================> ] 2.95G 6.22MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 92%[=================> ] 2.95G 6.16MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 92%[=================> ] 2.95G 5.99MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 92%[=================> ] 2.95G 6.19MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 92%[=================> ] 2.96G 6.20MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 92%[=================> ] 2.96G 6.18MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 92%[=================> ] 2.96G 6.34MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 92%[=================> ] 2.96G 6.38MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 92%[=================> ] 2.96G 6.18MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 92%[=================> ] 2.96G 6.28MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 92%[=================> ] 2.96G 6.23MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 92%[=================> ] 2.96G 6.14MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 92%[=================> ] 2.97G 6.18MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 92%[=================> ] 2.97G 6.39MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 92%[=================> ] 2.97G 6.07MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 92%[=================> ] 2.97G 6.24MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 92%[=================> ] 2.97G 6.04MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 92%[=================> ] 2.97G 5.83MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 92%[=================> ] 2.97G 6.11MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 92%[=================> ] 2.98G 5.86MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 92%[=================> ] 2.98G 5.91MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 92%[=================> ] 2.98G 6.01MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 92%[=================> ] 2.98G 5.90MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 93%[=================> ] 2.98G 5.86MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 93%[=================> ] 2.98G 5.73MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 93%[=================> ] 2.98G 5.61MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 93%[=================> ] 2.98G 5.76MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 93%[=================> ] 2.99G 5.61MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 93%[=================> ] 2.99G 5.51MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 93%[=================> ] 2.99G 5.55MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 93%[=================> ] 2.99G 5.53MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 93%[=================> ] 2.99G 5.30MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 93%[=================> ] 2.99G 5.46MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 93%[=================> ] 2.99G 5.38MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 93%[=================> ] 2.99G 5.23MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 93%[=================> ] 3.00G 5.46MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 93%[=================> ] 3.00G 5.29MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 93%[=================> ] 3.00G 5.13MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 93%[=================> ] 3.00G 5.35MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 93%[=================> ] 3.00G 5.30MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 93%[=================> ] 3.00G 5.07MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 93%[=================> ] 3.00G 4.95MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 93%[=================> ] 3.00G 4.80MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 93%[=================> ] 3.00G 4.87MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 93%[=================> ] 3.00G 5.15MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 93%[=================> ] 3.01G 4.70MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 93%[=================> ] 3.01G 4.97MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 93%[=================> ] 3.01G 5.01MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 93%[=================> ] 3.01G 5.02MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 93%[=================> ] 3.01G 4.55MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 93%[=================> ] 3.01G 4.91MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 94%[=================> ] 3.01G 4.90MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 94%[=================> ] 3.01G 4.78MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 94%[=================> ] 3.01G 4.81MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 94%[=================> ] 3.02G 4.68MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 94%[=================> ] 3.02G 4.41MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 94%[=================> ] 3.02G 4.41MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 94%[=================> ] 3.02G 4.35MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 94%[=================> ] 3.02G 4.14MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 94%[=================> ] 3.02G 4.21MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 94%[=================> ] 3.02G 3.86MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 94%[=================> ] 3.02G 4.00MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 94%[=================> ] 3.02G 3.78MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 94%[=================> ] 3.02G 3.63MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 94%[=================> ] 3.02G 3.57MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 94%[=================> ] 3.02G 3.85MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 94%[=================> ] 3.02G 3.43MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 94%[=================> ] 3.03G 3.29MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 94%[=================> ] 3.03G 3.37MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 94%[=================> ] 3.03G 3.34MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 94%[=================> ] 3.03G 3.21MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 94%[=================> ] 3.03G 3.30MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 94%[=================> ] 3.03G 3.23MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 94%[=================> ] 3.03G 3.25MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 94%[=================> ] 3.03G 3.25MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 94%[=================> ] 3.03G 3.34MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 94%[=================> ] 3.03G 3.20MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 94%[=================> ] 3.03G 3.36MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 94%[=================> ] 3.03G 3.19MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 94%[=================> ] 3.04G 3.22MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 94%[=================> ] 3.04G 3.14MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 94%[=================> ] 3.04G 3.07MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 94%[=================> ] 3.04G 3.11MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 94%[=================> ] 3.04G 3.03MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 94%[=================> ] 3.04G 2.98MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 94%[=================> ] 3.04G 3.05MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 94%[=================> ] 3.04G 2.93MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 94%[=================> ] 3.04G 3.00MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 94%[=================> ] 3.04G 2.85MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 94%[=================> ] 3.04G 2.81MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 94%[=================> ] 3.04G 2.81MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 94%[=================> ] 3.04G 2.90MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 94%[=================> ] 3.04G 2.74MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 94%[=================> ] 3.04G 2.72MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 95%[==================> ] 3.04G 2.62MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 95%[==================> ] 3.05G 2.67MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 95%[==================> ] 3.05G 2.74MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 95%[==================> ] 3.05G 2.68MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 95%[==================> ] 3.05G 2.60MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 95%[==================> ] 3.05G 2.55MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 95%[==================> ] 3.05G 2.53MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 95%[==================> ] 3.05G 2.47MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 95%[==================> ] 3.05G 2.51MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 95%[==================> ] 3.05G 2.38MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 95%[==================> ] 3.05G 2.47MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 95%[==================> ] 3.05G 2.32MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 95%[==================> ] 3.05G 2.41MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 95%[==================> ] 3.05G 2.25MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 95%[==================> ] 3.05G 2.37MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 95%[==================> ] 3.05G 2.46MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 95%[==================> ] 3.05G 2.33MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 95%[==================> ] 3.05G 2.30MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 95%[==================> ] 3.05G 2.39MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 95%[==================> ] 3.06G 2.38MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 95%[==================> ] 3.06G 2.45MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 95%[==================> ] 3.06G 2.44MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 95%[==================> ] 3.06G 2.38MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 95%[==================> ] 3.06G 2.50MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 95%[==================> ] 3.06G 2.41MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 95%[==================> ] 3.06G 2.52MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 95%[==================> ] 3.06G 2.43MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 95%[==================> ] 3.06G 2.54MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 95%[==================> ] 3.06G 2.50MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 95%[==================> ] 3.06G 2.54MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 95%[==================> ] 3.06G 2.47MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 95%[==================> ] 3.06G 2.53MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 95%[==================> ] 3.06G 2.48MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 95%[==================> ] 3.06G 2.54MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 95%[==================> ] 3.06G 2.47MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 95%[==================> ] 3.07G 2.54MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 95%[==================> ] 3.07G 2.49MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 95%[==================> ] 3.07G 2.32MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 95%[==================> ] 3.07G 2.39MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 95%[==================> ] 3.07G 2.31MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 95%[==================> ] 3.07G 2.31MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 95%[==================> ] 3.07G 2.23MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 95%[==================> ] 3.07G 2.26MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 95%[==================> ] 3.07G 2.23MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 95%[==================> ] 3.07G 2.19MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 95%[==================> ] 3.07G 2.25MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 95%[==================> ] 3.07G 2.16MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 95%[==================> ] 3.07G 2.24MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 95%[==================> ] 3.07G 2.20MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 95%[==================> ] 3.07G 2.23MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 95%[==================> ] 3.07G 2.18MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 95%[==================> ] 3.07G 2.22MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 95%[==================> ] 3.07G 2.38MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 95%[==================> ] 3.07G 2.25MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 95%[==================> ] 3.08G 2.27MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 95%[==================> ] 3.08G 2.27MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 95%[==================> ] 3.08G 2.26MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 95%[==================> ] 3.08G 2.25MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 96%[==================> ] 3.08G 2.34MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 96%[==================> ] 3.08G 2.34MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 96%[==================> ] 3.08G 2.42MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 96%[==================> ] 3.08G 2.39MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 96%[==================> ] 3.08G 2.46MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 96%[==================> ] 3.08G 2.44MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 96%[==================> ] 3.08G 2.40MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 96%[==================> ] 3.08G 2.47MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 96%[==================> ] 3.08G 2.43MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 96%[==================> ] 3.08G 2.49MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 96%[==================> ] 3.08G 2.43MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 96%[==================> ] 3.08G 2.53MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 96%[==================> ] 3.08G 2.50MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 96%[==================> ] 3.08G 2.45MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 96%[==================> ] 3.09G 2.52MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 96%[==================> ] 3.09G 2.51MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 96%[==================> ] 3.09G 2.57MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 96%[==================> ] 3.09G 2.54MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 96%[==================> ] 3.09G 2.56MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 96%[==================> ] 3.09G 2.56MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 96%[==================> ] 3.09G 2.46MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 96%[==================> ] 3.09G 2.51MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 96%[==================> ] 3.09G 2.51MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 96%[==================> ] 3.09G 2.60MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 96%[==================> ] 3.09G 2.58MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 96%[==================> ] 3.09G 2.53MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 96%[==================> ] 3.09G 2.61MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 96%[==================> ] 3.09G 2.58MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 96%[==================> ] 3.09G 2.63MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 96%[==================> ] 3.09G 2.60MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 96%[==================> ] 3.09G 2.66MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 96%[==================> ] 3.10G 2.64MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 96%[==================> ] 3.10G 2.69MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 96%[==================> ] 3.10G 2.69MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 96%[==================> ] 3.10G 2.82MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 96%[==================> ] 3.10G 2.79MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 96%[==================> ] 3.10G 2.65MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 96%[==================> ] 3.10G 2.74MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 96%[==================> ] 3.10G 2.72MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 96%[==================> ] 3.10G 2.88MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 96%[==================> ] 3.10G 2.85MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 96%[==================> ] 3.10G 3.03MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 96%[==================> ] 3.10G 3.04MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 96%[==================> ] 3.10G 3.19MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 96%[==================> ] 3.10G 3.18MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 96%[==================> ] 3.10G 3.04MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 96%[==================> ] 3.11G 3.18MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 96%[==================> ] 3.11G 3.18MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 96%[==================> ] 3.11G 3.34MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 97%[==================> ] 3.11G 3.34MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 97%[==================> ] 3.11G 3.51MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 97%[==================> ] 3.11G 3.56MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 97%[==================> ] 3.11G 3.80MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 97%[==================> ] 3.11G 3.87MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 97%[==================> ] 3.11G 4.06MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 97%[==================> ] 3.12G 4.12MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 97%[==================> ] 3.12G 4.38MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 97%[==================> ] 3.12G 4.42MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 97%[==================> ] 3.12G 4.25MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 97%[==================> ] 3.12G 4.49MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 97%[==================> ] 3.12G 4.53MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4 97%[==================> ] 3.12G 4.87MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D40 97%[==================> ] 3.12G 4.93MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D409 97%[==================> ] 3.12G 5.30MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096 97%[==================> ] 3.13G 5.45MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096- 97%[==================> ] 3.13G 5.45MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D4096-E 97%[==================> ] 3.13G 5.54MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 97%[==================> ] 3.13G 5.66MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D4096-E0_ 97%[==================> ] 3.13G 6.05MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D4096-E0_1 97%[==================> ] 3.13G 6.23MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D4096-E0_1- 97%[==================> ] 3.14G 6.65MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D4096-E0_1-m 97%[==================> ] 3.14G 6.68MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D4096-E0_1-me 97%[==================> ] 3.14G 6.49MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D4096-E0_1-mem 97%[==================> ] 3.14G 6.59MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 98%[==================> ] 3.14G 6.93MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 98%[==================> ] 3.14G 6.89MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 98%[==================> ] 3.14G 7.17MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 98%[==================> ] 3.15G 7.10MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 98%[==================> ] 3.15G 7.44MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 98%[==================> ] 3.15G 7.31MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 98%[==================> ] 3.15G 7.01MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 98%[==================> ] 3.15G 7.26MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 98%[==================> ] 3.15G 7.17MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 98%[==================> ] 3.15G 7.52MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 98%[==================> ] 3.16G 7.51MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 98%[==================> ] 3.16G 7.57MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 98%[==================> ] 3.16G 7.23MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 98%[==================> ] 3.16G 7.13MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 98%[==================> ] 3.16G 7.46MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 98%[==================> ] 3.16G 7.76MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 98%[==================> ] 3.17G 7.45MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 98%[==================> ] 3.17G 7.40MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 98%[==================> ] 3.17G 7.31MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 98%[==================> ] 3.17G 7.47MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 98%[==================> ] 3.17G 7.65MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 99%[==================> ] 3.17G 7.85MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 99%[==================> ] 3.18G 7.94MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 99%[==================> ] 3.18G 8.07MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 99%[==================> ] 3.18G 7.78MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 99%[==================> ] 3.18G 7.99MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 99%[==================> ] 3.18G 8.15MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 99%[==================> ] 3.18G 8.28MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 99%[==================> ] 3.19G 8.49MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 99%[==================> ] 3.19G 8.35MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 99%[==================> ] 3.19G 8.20MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 99%[==================> ] 3.19G 8.30MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 99%[==================> ] 3.19G 8.41MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 99%[==================> ] 3.19G 8.63MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 99%[==================> ] 3.20G 8.67MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 99%[==================> ] 3.20G 8.77MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 99%[==================> ] 3.20G 8.41MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 99%[==================> ] 3.20G 8.55MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 99%[==================> ] 3.20G 8.71MB/s eta 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D4096-E0 100%[===================>] 3.21G 8.84MB/s in 5m 42s \r\n", - "\r\n", - "2023-08-30 19:34:02 (9.61 MB/s) - ‘v5-hs2x-L6-D4096-E0_1-mem-ctx-8k.pth’ saved [3441599109/3441599109]\r\n", - "\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "--2023-08-30 19:34:02-- https://huggingface.co/rwkv-x-dev/rwkv-x-playground/resolve/main/experiment/rwkv-x-exp/v5-headsize2x/v5-hs2x-L6-D2048-E0_1-mem-ctx-8k.pth\r\n", - "Resolving huggingface.co (huggingface.co)... 13.33.33.110, 13.33.33.55, 13.33.33.20, ...\r\n", - "Connecting to huggingface.co (huggingface.co)|13.33.33.110|:443... connected.\r\n", - "HTTP request sent, awaiting response... " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "302 Found\r\n", - "Location: https://cdn-lfs.huggingface.co/repos/2e/f7/2ef78555202aa92abdbdf476ce3d0fd5a8b15f7245edf0b80d4d30572355f30d/c8e3cb04e7c511cb2a2756ba15243c0ef7c725d520fcbe4489f86ea6cb59ccbd?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-hs2x-L6-D2048-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-hs2x-L6-D2048-E0_1-mem-ctx-8k.pth%22%3B&Expires=1693683242&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5MzY4MzI0Mn19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy8yZS9mNy8yZWY3ODU1NTIwMmFhOTJhYmRiZGY0NzZjZTNkMGZkNWE4YjE1ZjcyNDVlZGYwYjgwZDRkMzA1NzIzNTVmMzBkL2M4ZTNjYjA0ZTdjNTExY2IyYTI3NTZiYTE1MjQzYzBlZjdjNzI1ZDUyMGZjYmU0NDg5Zjg2ZWE2Y2I1OWNjYmQ%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=iA0APYlTKUAY5kFT811fH5inhMj%7ElO2aFbSdHQLt8AfQyDZtHSdTleJIWdusTPMf6Qv--1okli2zEDXHTaECuH9DXtJPeuMV-vnPF62qZAG1GYwcwZ79D81ghbNHPz4OxXI-bx6qKr2cTL0dyv29gDEQQdHe4mZuuyA1V4Hl1dLCz%7EeGa%7Em3--kHhQqIzLfsabFlOQi-uxqvdbb18cAyVvdP38CbfI-PpggAoIZPy6VqPqKt2vjfpMM4jyC-VGkx8impq9VI3IE%7EY5tY1jm9uwt2NGS8vG7HV4SeqtPh-Mcekrb0bODE--JhQG%7EUzGANAthYGDSClU%7ER3x2FCo5mdg__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", - "--2023-08-30 19:34:02-- https://cdn-lfs.huggingface.co/repos/2e/f7/2ef78555202aa92abdbdf476ce3d0fd5a8b15f7245edf0b80d4d30572355f30d/c8e3cb04e7c511cb2a2756ba15243c0ef7c725d520fcbe4489f86ea6cb59ccbd?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-hs2x-L6-D2048-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-hs2x-L6-D2048-E0_1-mem-ctx-8k.pth%22%3B&Expires=1693683242&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5MzY4MzI0Mn19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy8yZS9mNy8yZWY3ODU1NTIwMmFhOTJhYmRiZGY0NzZjZTNkMGZkNWE4YjE1ZjcyNDVlZGYwYjgwZDRkMzA1NzIzNTVmMzBkL2M4ZTNjYjA0ZTdjNTExY2IyYTI3NTZiYTE1MjQzYzBlZjdjNzI1ZDUyMGZjYmU0NDg5Zjg2ZWE2Y2I1OWNjYmQ%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=iA0APYlTKUAY5kFT811fH5inhMj%7ElO2aFbSdHQLt8AfQyDZtHSdTleJIWdusTPMf6Qv--1okli2zEDXHTaECuH9DXtJPeuMV-vnPF62qZAG1GYwcwZ79D81ghbNHPz4OxXI-bx6qKr2cTL0dyv29gDEQQdHe4mZuuyA1V4Hl1dLCz%7EeGa%7Em3--kHhQqIzLfsabFlOQi-uxqvdbb18cAyVvdP38CbfI-PpggAoIZPy6VqPqKt2vjfpMM4jyC-VGkx8impq9VI3IE%7EY5tY1jm9uwt2NGS8vG7HV4SeqtPh-Mcekrb0bODE--JhQG%7EUzGANAthYGDSClU%7ER3x2FCo5mdg__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", - "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "18.155.68.98, 18.155.68.94, 18.155.68.73, ...\r\n", - "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|18.155.68.98|:443... connected.\r\n", - "HTTP request sent, awaiting response... " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "200 OK\r\n", - "Length: 1066508165 (1017M) [binary/octet-stream]\r\n", - "Saving to: ‘v5-hs2x-L6-D2048-E0_1-mem-ctx-8k.pth’\r\n", - "\r\n", - "\r", - " v5-hs2x-L 0%[ ] 0 --.-KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 0%[ ] 24.23K 103KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 0%[ ] 58.23K 124KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 0%[ ] 147.86K 209KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2 0%[ ] 262.11K 278KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D20 0%[ ] 376.37K 320KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D204 0%[ ] 508.21K 360KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048 0%[ ] 640.04K 388KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048- 0%[ ] 763.09K 405KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048-E 0%[ ] 912.50K 431KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D2048-E0 0%[ ] 1.04M 455KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D2048-E0_ 0%[ ] 1.20M 474KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D2048-E0_1 0%[ ] 1.36M 492KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D2048-E0_1- 0%[ ] 1.52M 510KB/s eta 34m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D2048-E0_1-m 0%[ ] 1.71M 530KB/s eta 34m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D2048-E0_1-me 0%[ ] 1.89M 548KB/s eta 34m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D2048-E0_1-mem 0%[ ] 2.09M 568KB/s eta 34m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D2048-E0_1-mem- 0%[ ] 2.30M 589KB/s eta 34m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D2048-E0_1-mem-c 0%[ ] 2.52M 609KB/s eta 28m 27s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D2048-E0_1-mem-ct 0%[ ] 2.75M 630KB/s eta 28m 27s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D2048-E0_1-mem-ctx 0%[ ] 2.98M 649KB/s eta 28m 27s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D2048-E0_1-mem-ctx- 0%[ ] 3.25M 701KB/s eta 28m 27s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2048-E0_1-mem-ctx-8 0%[ ] 3.51M 752KB/s eta 28m 27s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "048-E0_1-mem-ctx-8k 0%[ ] 3.78M 791KB/s eta 24m 11s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "48-E0_1-mem-ctx-8k. 0%[ ] 4.08M 832KB/s eta 24m 11s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8-E0_1-mem-ctx-8k.p 0%[ ] 4.39M 874KB/s eta 24m 11s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 0%[ ] 4.71M 916KB/s eta 24m 11s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 0%[ ] 5.04M 949KB/s eta 24m 11s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 0%[ ] 5.41M 1014KB/s eta 20m 33s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 0%[ ] 5.77M 1.04MB/s eta 20m 33s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 0%[ ] 6.17M 1.09MB/s eta 20m 33s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 0%[ ] 6.58M 1.15MB/s eta 20m 33s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 0%[ ] 7.02M 1.20MB/s eta 20m 33s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 0%[ ] 7.47M 1.26MB/s eta 17m 31s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 0%[ ] 7.95M 1.33MB/s eta 17m 31s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 0%[ ] 8.45M 1.42MB/s eta 17m 31s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 0%[ ] 8.96M 1.49MB/s eta 17m 31s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 0%[ ] 9.52M 1.57MB/s eta 17m 31s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 0%[ ] 10.10M 1.68MB/s eta 14m 52s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 1%[ ] 10.71M 1.76MB/s eta 14m 52s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 1%[ ] 11.34M 1.85MB/s eta 14m 52s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 1%[ ] 12.01M 1.98MB/s eta 14m 52s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 1%[ ] 12.73M 2.07MB/s eta 13m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 1%[ ] 14.17M 2.36MB/s eta 13m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 1%[ ] 14.98M 2.48MB/s eta 13m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 1%[ ] 15.84M 2.60MB/s eta 13m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 1%[ ] 16.73M 2.73MB/s eta 13m 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 1%[ ] 17.67M 2.82MB/s eta 10m 32s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 1%[ ] 18.65M 3.00MB/s eta 10m 32s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 1%[ ] 19.70M 3.12MB/s eta 10m 32s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 2%[ ] 20.77M 3.31MB/s eta 10m 32s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 2%[ ] 21.92M 3.43MB/s eta 10m 32s" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 2%[ ] 23.12M 3.57MB/s eta 8m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 2%[ ] 24.38M 3.82MB/s eta 8m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 2%[ ] 25.71M 3.98MB/s eta 8m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 2%[ ] 27.09M 4.13MB/s eta 8m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 2%[ ] 28.56M 4.30MB/s eta 8m 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 2%[ ] 30.09M 4.56MB/s eta 7m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 3%[ ] 31.70M 4.80MB/s eta 7m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2 3%[ ] 33.37M 4.97MB/s eta 7m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D20 3%[ ] 34.67M 5.23MB/s eta 7m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D204 3%[ ] 35.32M 5.26MB/s eta 7m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048 3%[ ] 37.18M 5.53MB/s eta 6m 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048- 3%[ ] 39.15M 5.80MB/s eta 6m 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048-E 4%[ ] 41.21M 6.01MB/s eta 6m 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D2048-E0 4%[ ] 43.37M 6.21MB/s eta 6m 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D2048-E0_ 4%[ ] 45.65M 6.43MB/s eta 6m 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D2048-E0_1 4%[ ] 48.04M 6.89MB/s eta 5m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D2048-E0_1- 4%[ ] 50.54M 7.39MB/s eta 5m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D2048-E0_1-m 5%[> ] 53.15M 7.69MB/s eta 5m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D2048-E0_1-me 5%[> ] 55.90M 7.98MB/s eta 5m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D2048-E0_1-mem 5%[> ] 58.79M 8.56MB/s eta 5m 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D2048-E0_1-mem- 6%[> ] 61.82M 8.99MB/s eta 4m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D2048-E0_1-mem-c 6%[> ] 65.02M 9.63MB/s eta 4m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D2048-E0_1-mem-ct 6%[> ] 68.35M 10.1MB/s eta 4m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D2048-E0_1-mem-ctx 7%[> ] 71.77M 10.5MB/s eta 4m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D2048-E0_1-mem-ctx- 7%[> ] 75.18M 11.2MB/s eta 4m 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2048-E0_1-mem-ctx-8 7%[> ] 78.93M 11.7MB/s eta 3m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "048-E0_1-mem-ctx-8k 8%[> ] 82.79M 12.3MB/s eta 3m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "48-E0_1-mem-ctx-8k. 8%[> ] 86.52M 12.7MB/s eta 3m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8-E0_1-mem-ctx-8k.p 8%[> ] 90.29M 13.2MB/s eta 3m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 9%[> ] 94.06M 13.4MB/s eta 3m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 9%[> ] 97.67M 13.1MB/s eta 3m 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 9%[> ] 101.04M 13.3MB/s eta 3m 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 10%[=> ] 103.93M 13.5MB/s eta 3m 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 10%[=> ] 106.90M 13.4MB/s eta 3m 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 10%[=> ] 109.95M 13.5MB/s eta 3m 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 11%[=> ] 112.98M 13.2MB/s eta 2m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 11%[=> ] 116.15M 13.1MB/s eta 2m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 11%[=> ] 119.38M 13.4MB/s eta 2m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 11%[=> ] 120.38M 12.7MB/s eta 2m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 12%[=> ] 123.07M 12.5MB/s eta 2m 47s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 12%[=> ] 125.38M 12.7MB/s eta 2m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 12%[=> ] 127.76M 12.3MB/s eta 2m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 12%[=> ] 130.17M 11.8MB/s eta 2m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 13%[=> ] 132.60M 12.1MB/s eta 2m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 13%[=> ] 135.07M 11.9MB/s eta 2m 36s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 13%[=> ] 137.57M 11.6MB/s eta 2m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 13%[=> ] 140.10M 11.4MB/s eta 2m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 14%[=> ] 142.65M 11.1MB/s eta 2m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 14%[=> ] 145.21M 10.8MB/s eta 2m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 14%[=> ] 147.81M 10.8MB/s eta 2m 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 14%[=> ] 150.43M 11.1MB/s eta 2m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 15%[==> ] 153.07M 10.9MB/s eta 2m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 15%[==> ] 155.73M 10.9MB/s eta 2m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 15%[==> ] 158.40M 10.8MB/s eta 2m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 15%[==> ] 161.07M 10.7MB/s eta 2m 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 16%[==> ] 163.77M 10.8MB/s eta 2m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 16%[==> ] 166.48M 10.7MB/s eta 2m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 16%[==> ] 169.17M 10.6MB/s eta 2m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 16%[==> ] 171.90M 11.0MB/s eta 2m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 17%[==> ] 174.63M 11.0MB/s eta 2m 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 17%[==> ] 177.40M 11.0MB/s eta 2m 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 17%[==> ] 180.17M 11.1MB/s eta 2m 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2 17%[==> ] 182.93M 11.2MB/s eta 2m 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D20 18%[==> ] 185.71M 11.3MB/s eta 2m 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D204 18%[==> ] 188.51M 11.3MB/s eta 2m 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048 18%[==> ] 191.31M 11.4MB/s eta 2m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048- 19%[==> ] 194.10M 11.5MB/s eta 2m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048-E 19%[==> ] 196.90M 11.5MB/s eta 2m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D2048-E0 19%[==> ] 199.70M 11.6MB/s eta 2m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D2048-E0_ 19%[==> ] 202.49M 11.6MB/s eta 2m 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D2048-E0_1 20%[===> ] 205.31M 11.6MB/s eta 1m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D2048-E0_1- 20%[===> ] 208.12M 11.7MB/s eta 1m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D2048-E0_1-m 20%[===> ] 210.93M 11.7MB/s eta 1m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D2048-E0_1-me 21%[===> ] 213.74M 11.7MB/s eta 1m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D2048-E0_1-mem 21%[===> ] 216.57M 11.8MB/s eta 1m 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D2048-E0_1-mem- 21%[===> ] 219.38M 11.8MB/s eta 1m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D2048-E0_1-mem-c 21%[===> ] 222.20M 11.8MB/s eta 1m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D2048-E0_1-mem-ct 22%[===> ] 225.01M 11.8MB/s eta 1m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D2048-E0_1-mem-ctx 22%[===> ] 227.82M 11.9MB/s eta 1m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D2048-E0_1-mem-ctx- 22%[===> ] 230.63M 11.9MB/s eta 1m 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2048-E0_1-mem-ctx-8 22%[===> ] 233.43M 11.9MB/s eta 1m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "048-E0_1-mem-ctx-8k 23%[===> ] 236.23M 11.9MB/s eta 1m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "48-E0_1-mem-ctx-8k. 23%[===> ] 239.04M 11.9MB/s eta 1m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8-E0_1-mem-ctx-8k.p 23%[===> ] 241.85M 11.9MB/s eta 1m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 24%[===> ] 244.67M 11.9MB/s eta 1m 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 24%[===> ] 247.48M 11.9MB/s eta 1m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 24%[===> ] 249.65M 11.2MB/s eta 1m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 24%[===> ] 253.29M 11.2MB/s eta 1m 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 25%[====> ] 255.24M 11.1MB/s eta 1m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 25%[====> ] 257.31M 10.9MB/s eta 1m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 25%[====> ] 259.43M 10.8MB/s eta 1m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 25%[====> ] 261.59M 10.6MB/s eta 1m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 25%[====> ] 263.79M 10.5MB/s eta 1m 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 26%[====> ] 266.04M 10.4MB/s eta 98s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 26%[====> ] 268.32M 10.3MB/s eta 98s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 26%[====> ] 270.63M 10.2MB/s eta 98s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 26%[====> ] 272.99M 10.1MB/s eta 98s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 27%[====> ] 275.38M 9.98MB/s eta 98s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 27%[====> ] 277.79M 9.89MB/s eta 96s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 27%[====> ] 280.24M 9.82MB/s eta 96s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 27%[====> ] 282.71M 9.75MB/s eta 96s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 28%[====> ] 285.23M 9.69MB/s eta 96s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 28%[====> ] 287.74M 9.49MB/s eta 96s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 28%[====> ] 290.31M 9.70MB/s eta 93s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 28%[====> ] 292.88M 9.64MB/s eta 93s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 29%[====> ] 295.48M 9.60MB/s eta 93s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 29%[====> ] 298.10M 10.2MB/s eta 93s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 29%[====> ] 300.74M 10.1MB/s eta 93s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 29%[====> ] 303.40M 10.2MB/s eta 90s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 30%[=====> ] 306.06M 10.4MB/s eta 90s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 30%[=====> ] 308.73M 10.5MB/s eta 90s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 30%[=====> ] 311.43M 10.6MB/s eta 90s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 30%[=====> ] 314.13M 10.7MB/s eta 90s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 31%[=====> ] 316.85M 10.8MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 31%[=====> ] 319.57M 10.9MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 31%[=====> ] 322.32M 11.0MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 31%[=====> ] 325.07M 11.1MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2 32%[=====> ] 327.84M 11.1MB/s eta 87s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D20 32%[=====> ] 330.60M 11.2MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D204 32%[=====> ] 333.38M 11.3MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048 33%[=====> ] 336.17M 11.4MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048- 33%[=====> ] 338.95M 11.4MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048-E 33%[=====> ] 341.73M 11.5MB/s eta 84s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D2048-E0 33%[=====> ] 344.52M 11.5MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D2048-E0_ 34%[=====> ] 347.34M 11.6MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D2048-E0_1 34%[=====> ] 350.15M 11.6MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D2048-E0_1- 34%[=====> ] 352.95M 11.7MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D2048-E0_1-m 34%[=====> ] 355.76M 11.7MB/s eta 82s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D2048-E0_1-me 35%[======> ] 358.57M 11.7MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D2048-E0_1-mem 35%[======> ] 361.40M 11.8MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D2048-E0_1-mem- 35%[======> ] 364.21M 11.8MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D2048-E0_1-mem-c 36%[======> ] 367.02M 11.8MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D2048-E0_1-mem-ct 36%[======> ] 369.71M 11.8MB/s eta 79s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D2048-E0_1-mem-ctx 36%[======> ] 372.54M 11.8MB/s eta 76s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D2048-E0_1-mem-ctx- 36%[======> ] 375.37M 11.8MB/s eta 76s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2048-E0_1-mem-ctx-8 37%[======> ] 378.18M 11.8MB/s eta 76s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "048-E0_1-mem-ctx-8k 37%[======> ] 381.01M 11.6MB/s eta 76s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "48-E0_1-mem-ctx-8k. 37%[======> ] 383.82M 11.5MB/s eta 76s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8-E0_1-mem-ctx-8k.p 38%[======> ] 386.63M 11.8MB/s eta 74s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 38%[======> ] 389.13M 11.8MB/s eta 74s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 38%[======> ] 391.95M 11.8MB/s eta 74s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 38%[======> ] 394.77M 11.8MB/s eta 74s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 39%[======> ] 397.59M 11.6MB/s eta 74s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 39%[======> ] 400.20M 11.4MB/s eta 72s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 39%[======> ] 402.98M 11.7MB/s eta 72s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 39%[======> ] 405.79M 11.8MB/s eta 72s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 40%[=======> ] 408.62M 11.8MB/s eta 72s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 40%[=======> ] 411.45M 11.8MB/s eta 72s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 40%[=======> ] 414.26M 11.6MB/s eta 69s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 41%[=======> ] 417.10M 11.5MB/s eta 69s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 41%[=======> ] 419.93M 11.7MB/s eta 69s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 41%[=======> ] 422.59M 11.8MB/s eta 69s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 41%[=======> ] 425.43M 11.8MB/s eta 69s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 42%[=======> ] 428.29M 11.8MB/s eta 67s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 42%[=======> ] 431.13M 11.9MB/s eta 67s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 42%[=======> ] 433.99M 11.9MB/s eta 67s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 42%[=======> ] 436.87M 11.9MB/s eta 67s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 43%[=======> ] 439.76M 11.9MB/s eta 67s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 43%[=======> ] 442.45M 11.8MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 43%[=======> ] 445.34M 11.9MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 44%[=======> ] 448.24M 11.9MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 44%[=======> ] 451.18M 12.0MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 44%[=======> ] 454.12M 12.0MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 44%[=======> ] 457.07M 12.1MB/s eta 63s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 45%[========> ] 460.04M 12.1MB/s eta 63s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 45%[========> ] 463.01M 12.1MB/s eta 63s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 45%[========> ] 466.01M 12.2MB/s eta 63s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 46%[========> ] 469.04M 12.2MB/s eta 63s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 46%[========> ] 472.09M 12.3MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 46%[========> ] 475.15M 12.3MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 47%[========> ] 478.23M 12.4MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 47%[========> ] 481.34M 12.4MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2 47%[========> ] 484.48M 12.5MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D20 47%[========> ] 487.65M 12.6MB/s eta 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D204 48%[========> ] 490.87M 12.6MB/s eta 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048 48%[========> ] 494.10M 12.7MB/s eta 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048- 48%[========> ] 497.37M 12.8MB/s eta 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048-E 49%[========> ] 500.67M 12.9MB/s eta 58s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D2048-E0 49%[========> ] 503.99M 13.1MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D2048-E0_ 49%[========> ] 507.35M 13.2MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D2048-E0_1 50%[=========> ] 510.73M 13.3MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D2048-E0_1- 50%[=========> ] 514.17M 13.4MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D2048-E0_1-m 50%[=========> ] 517.67M 13.5MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D2048-E0_1-me 51%[=========> ] 521.10M 13.6MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D2048-E0_1-mem 51%[=========> ] 524.24M 13.3MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D2048-E0_1-mem- 51%[=========> ] 527.98M 13.3MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D2048-E0_1-mem-c 52%[=========> ] 530.52M 13.2MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D2048-E0_1-mem-ct 52%[=========> ] 533.18M 13.2MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D2048-E0_1-mem-ctx 52%[=========> ] 535.90M 13.1MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D2048-E0_1-mem-ctx- 52%[=========> ] 538.67M 13.0MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2048-E0_1-mem-ctx-8 53%[=========> ] 541.48M 13.0MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "048-E0_1-mem-ctx-8k 53%[=========> ] 544.34M 12.9MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "48-E0_1-mem-ctx-8k. 53%[=========> ] 547.23M 12.9MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8-E0_1-mem-ctx-8k.p 54%[=========> ] 550.18M 12.7MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 54%[=========> ] 553.18M 12.7MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 54%[=========> ] 556.21M 12.6MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 54%[=========> ] 559.31M 12.5MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 55%[==========> ] 562.45M 12.4MB/s eta 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 55%[==========> ] 565.59M 12.4MB/s eta 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 55%[==========> ] 568.79M 12.1MB/s eta 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 56%[==========> ] 572.01M 12.6MB/s eta 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 56%[==========> ] 575.27M 13.1MB/s eta 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 56%[==========> ] 578.57M 13.1MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 57%[==========> ] 581.82M 13.3MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 57%[==========> ] 585.06M 12.4MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 57%[==========> ] 588.82M 12.6MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 58%[==========> ] 591.18M 12.8MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 58%[==========> ] 593.59M 12.4MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 58%[==========> ] 596.04M 12.1MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 58%[==========> ] 598.52M 12.4MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 59%[==========> ] 601.04M 11.8MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 59%[==========> ] 603.59M 11.8MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 59%[==========> ] 606.15M 11.5MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 59%[==========> ] 608.74M 11.3MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 60%[===========> ] 611.37M 11.6MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 60%[===========> ] 613.99M 11.0MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 60%[===========> ] 616.65M 10.8MB/s eta 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 60%[===========> ] 619.34M 10.8MB/s eta 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 61%[===========> ] 622.04M 11.2MB/s eta 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 61%[===========> ] 624.76M 10.7MB/s eta 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 61%[===========> ] 627.48M 11.0MB/s eta 42s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 61%[===========> ] 630.21M 10.9MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 62%[===========> ] 632.96M 11.2MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 62%[===========> ] 635.73M 11.1MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 62%[===========> ] 638.51M 11.4MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 63%[===========> ] 641.29M 11.2MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 63%[===========> ] 644.09M 11.1MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2 63%[===========> ] 646.87M 11.4MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D20 63%[===========> ] 649.68M 11.4MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D204 64%[===========> ] 652.49M 11.6MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048 64%[===========> ] 655.32M 11.5MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048- 64%[===========> ] 658.17M 11.7MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048-E 64%[===========> ] 660.99M 11.6MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D2048-E0 65%[============> ] 663.73M 11.2MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D2048-E0_ 65%[============> ] 666.59M 11.8MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D2048-E0_1 65%[============> ] 669.15M 11.5MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D2048-E0_1- 66%[============> ] 671.99M 11.3MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D2048-E0_1-m 66%[============> ] 674.85M 11.8MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D2048-E0_1-me 66%[============> ] 677.63M 11.6MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D2048-E0_1-mem 66%[============> ] 680.49M 11.4MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D2048-E0_1-mem- 67%[============> ] 683.35M 11.9MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D2048-E0_1-mem-c 67%[============> ] 686.21M 11.7MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D2048-E0_1-mem-ct 67%[============> ] 688.85M 11.4MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D2048-E0_1-mem-ctx 68%[============> ] 691.73M 11.8MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D2048-E0_1-mem-ctx- 68%[============> ] 694.49M 11.7MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2048-E0_1-mem-ctx-8 68%[============> ] 697.31M 11.5MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "048-E0_1-mem-ctx-8k 68%[============> ] 700.17M 11.9MB/s eta 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "48-E0_1-mem-ctx-8k. 69%[============> ] 703.02M 11.7MB/s eta 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8-E0_1-mem-ctx-8k.p 69%[============> ] 705.73M 11.5MB/s eta 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 69%[============> ] 708.59M 11.9MB/s eta 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 69%[============> ] 711.31M 11.7MB/s eta 32s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 70%[=============> ] 714.17M 11.6MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 70%[=============> ] 716.99M 11.5MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 70%[=============> ] 719.87M 11.9MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 71%[=============> ] 722.40M 11.8MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 71%[=============> ] 725.27M 11.9MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 71%[=============> ] 728.13M 11.9MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 71%[=============> ] 731.01M 11.9MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 72%[=============> ] 733.88M 11.9MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 72%[=============> ] 736.76M 11.9MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 72%[=============> ] 739.65M 11.9MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 73%[=============> ] 742.52M 12.0MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 73%[=============> ] 745.42M 12.0MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 73%[=============> ] 748.31M 12.0MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 73%[=============> ] 751.20M 12.0MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 74%[=============> ] 754.10M 12.0MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 74%[=============> ] 757.02M 12.1MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 74%[=============> ] 759.95M 12.1MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 74%[=============> ] 760.71M 11.2MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 75%[==============> ] 764.02M 11.3MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 75%[==============> ] 766.07M 11.2MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 75%[==============> ] 768.23M 11.0MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 75%[==============> ] 770.43M 10.9MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 75%[==============> ] 772.67M 10.8MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 76%[==============> ] 774.96M 10.6MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 76%[==============> ] 777.31M 10.5MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 76%[==============> ] 779.68M 10.4MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 76%[==============> ] 782.09M 10.0MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 77%[==============> ] 784.54M 9.70MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 77%[==============> ] 787.01M 10.1MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 77%[==============> ] 787.23M 8.70MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 77%[==============> ] 791.07M 9.33MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2 77%[==============> ] 792.85M 9.08MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D20 78%[==============> ] 794.70M 8.86MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D204 78%[==============> ] 796.56M 8.49MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048 78%[==============> ] 798.45M 8.41MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048- 78%[==============> ] 800.37M 8.98MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048-E 78%[==============> ] 802.31M 8.65MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D2048-E0 79%[==============> ] 804.26M 8.63MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D2048-E0_ 79%[==============> ] 806.24M 8.59MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D2048-E0_1 79%[==============> ] 808.23M 8.54MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D2048-E0_1- 79%[==============> ] 810.24M 8.49MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D2048-E0_1-m 79%[==============> ] 812.27M 8.43MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D2048-E0_1-me 80%[===============> ] 814.32M 8.29MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D2048-E0_1-mem 80%[===============> ] 816.38M 8.17MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D2048-E0_1-mem- 80%[===============> ] 818.46M 8.44MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D2048-E0_1-mem-c 80%[===============> ] 820.54M 8.25MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D2048-E0_1-mem-ct 80%[===============> ] 822.62M 8.11MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D2048-E0_1-mem-ctx 81%[===============> ] 824.73M 8.24MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D2048-E0_1-mem-ctx- 81%[===============> ] 826.84M 8.13MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2048-E0_1-mem-ctx-8 81%[===============> ] 828.96M 8.79MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "048-E0_1-mem-ctx-8k 81%[===============> ] 831.09M 9.10MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "48-E0_1-mem-ctx-8k. 81%[===============> ] 833.21M 8.75MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8-E0_1-mem-ctx-8k.p 82%[===============> ] 835.35M 8.82MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 82%[===============> ] 837.51M 8.89MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 82%[===============> ] 839.67M 8.95MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 82%[===============> ] 841.82M 8.99MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 82%[===============> ] 843.63M 9.00MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 83%[===============> ] 845.30M 9.02MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 83%[===============> ] 846.32M 8.82MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 83%[===============> ] 848.48M 8.88MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 83%[===============> ] 850.65M 8.91MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 83%[===============> ] 852.81M 8.96MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 84%[===============> ] 854.98M 8.96MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 84%[===============> ] 857.15M 8.99MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 84%[===============> ] 859.32M 9.01MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 84%[===============> ] 861.49M 9.02MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 84%[===============> ] 863.65M 9.03MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 85%[================> ] 865.82M 9.04MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 85%[================> ] 868.01M 9.05MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 85%[================> ] 870.18M 8.86MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 85%[================> ] 872.35M 9.07MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 85%[================> ] 874.52M 9.07MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 86%[================> ] 875.42M 8.28MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 86%[================> ] 879.04M 8.48MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 86%[================> ] 880.57M 8.65MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 86%[================> ] 882.15M 8.38MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 86%[================> ] 883.77M 8.07MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 87%[================> ] 885.45M 8.27MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 87%[================> ] 887.13M 8.05MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 87%[================> ] 888.87M 7.79MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 87%[================> ] 890.63M 8.01MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 87%[================> ] 892.42M 7.60MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 87%[================> ] 894.24M 7.85MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 88%[================> ] 896.09M 7.67MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 88%[================> ] 897.98M 7.47MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 88%[================> ] 899.88M 7.63MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2 88%[================> ] 901.81M 7.48MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D20 88%[================> ] 903.76M 7.29MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D204 89%[================> ] 905.73M 7.38MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048 89%[================> ] 907.71M 8.04MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048- 89%[================> ] 909.71M 7.70MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048-E 89%[================> ] 911.74M 7.83MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D2048-E0 89%[================> ] 913.77M 7.95MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D2048-E0_ 90%[=================> ] 915.82M 8.05MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D2048-E0_1 90%[=================> ] 917.88M 8.15MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D2048-E0_1- 90%[=================> ] 919.96M 8.29MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D2048-E0_1-m 90%[=================> ] 922.06M 8.23MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D2048-E0_1-me 90%[=================> ] 924.17M 8.42MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D2048-E0_1-mem 91%[=================> ] 926.26M 8.53MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D2048-E0_1-mem- 91%[=================> ] 928.38M 8.60MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D2048-E0_1-mem-c 91%[=================> ] 930.51M 8.51MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D2048-E0_1-mem-ct 91%[=================> ] 932.65M 8.55MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D2048-E0_1-mem-ctx 91%[=================> ] 934.77M 8.83MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D2048-E0_1-mem-ctx- 92%[=================> ] 936.93M 8.68MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2048-E0_1-mem-ctx-8 92%[=================> ] 939.07M 8.73MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "048-E0_1-mem-ctx-8k 92%[=================> ] 940.73M 8.25MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "48-E0_1-mem-ctx-8k. 92%[=================> ] 943.90M 8.45MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8-E0_1-mem-ctx-8k.p 92%[=================> ] 943.96M 7.96MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 93%[=================> ] 946.84M 8.06MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 93%[=================> ] 947.79M 8.02MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 93%[=================> ] 948.60M 7.76MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 93%[=================> ] 949.73M 7.47MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 93%[=================> ] 950.87M 7.09MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 93%[=================> ] 951.46M 6.35MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 93%[=================> ] 953.99M 6.65MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 93%[=================> ] 954.84M 6.23MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 93%[=================> ] 955.70M 5.86MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 94%[=================> ] 956.56M 5.73MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 94%[=================> ] 957.45M 5.34MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 94%[=================> ] 958.34M 4.95MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 94%[=================> ] 959.26M 4.84MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 94%[=================> ] 960.18M 4.94MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 94%[=================> ] 961.10M 4.69MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 94%[=================> ] 962.04M 4.20MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 94%[=================> ] 962.99M 4.11MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 94%[=================> ] 963.95M 4.07MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 94%[=================> ] 964.90M 4.02MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 94%[=================> ] 965.87M 3.97MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 95%[==================> ] 966.85M 4.38MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 95%[==================> ] 967.82M 3.93MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 95%[==================> ] 968.81M 4.01MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 95%[==================> ] 969.79M 4.07MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-h 95%[==================> ] 970.77M 4.08MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs 95%[==================> ] 971.34M 4.05MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2 95%[==================> ] 972.31M 4.12MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x 95%[==================> ] 973.31M 4.09MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x- 95%[==================> ] 974.31M 4.09MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L 95%[==================> ] 975.29M 4.18MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6 95%[==================> ] 976.29M 4.15MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6- 96%[==================> ] 977.29M 4.15MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D 96%[==================> ] 978.29M 4.20MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2 96%[==================> ] 979.29M 4.18MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D20 96%[==================> ] 980.29M 4.21MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D204 96%[==================> ] 981.29M 4.19MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048 96%[==================> ] 982.29M 4.22MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048- 96%[==================> ] 983.29M 4.19MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-hs2x-L6-D2048-E 96%[==================> ] 984.29M 4.22MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D2048-E0 96%[==================> ] 985.29M 4.19MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-hs2x-L6-D2048-E0_ 96%[==================> ] 986.29M 4.20MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-hs2x-L6-D2048-E0_1 97%[==================> ] 987.29M 4.17MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "hs2x-L6-D2048-E0_1- 97%[==================> ] 988.29M 4.24MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "s2x-L6-D2048-E0_1-m 97%[==================> ] 989.29M 4.22MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2x-L6-D2048-E0_1-me 97%[==================> ] 990.29M 4.27MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-L6-D2048-E0_1-mem 97%[==================> ] 991.29M 4.25MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D2048-E0_1-mem- 97%[==================> ] 992.29M 4.26MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D2048-E0_1-mem-c 97%[==================> ] 993.18M 4.24MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D2048-E0_1-mem-ct 97%[==================> ] 994.09M 4.26MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D2048-E0_1-mem-ctx 97%[==================> ] 994.82M 4.21MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D2048-E0_1-mem-ctx- 97%[==================> ] 995.82M 4.28MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2048-E0_1-mem-ctx-8 98%[==================> ] 996.82M 4.27MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "048-E0_1-mem-ctx-8k 98%[==================> ] 997.84M 4.31MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "48-E0_1-mem-ctx-8k. 98%[==================> ] 998.87M 4.28MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8-E0_1-mem-ctx-8k.p 98%[==================> ] 999.87M 4.38MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 98%[==================> ] 1000M 4.27MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 98%[==================> ] 1002M 4.28MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 98%[==================> ] 1003M 4.35MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 98%[==================> ] 1004M 4.34MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 98%[==================> ] 1005M 4.31MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 98%[==================> ] 1006M 4.40MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 98%[==================> ] 1007M 4.41MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 99%[==================> ] 1008M 4.50MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 99%[==================> ] 1009M 4.49MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 99%[==================> ] 1010M 4.57MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 99%[==================> ] 1011M 4.51MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 99%[==================> ] 1012M 4.55MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 99%[==================> ] 1013M 4.60MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 99%[==================> ] 1014M 4.65MB/s eta 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 99%[==================> ] 1016M 4.72MB/s eta 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 99%[==================> ] 1017M 4.77MB/s eta 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-hs2x-L6-D2048-E0 100%[===================>] 1017M 4.82MB/s in 1m 55s \r\n", - "\r\n", - "2023-08-30 19:35:58 (8.87 MB/s) - ‘v5-hs2x-L6-D2048-E0_1-mem-ctx-8k.pth’ saved [1066508165/1066508165]\r\n", - "\r\n" - ] - } - ], - "source": [ - "# Lets download the custom models\n", - "!mkdir -p ../../../model/\n", - "!cd ../../../model/ && wget -nc \"https://huggingface.co/rwkv-x-dev/rwkv-x-playground/resolve/main/experiment/rwkv-x-exp/v5-headsize2x/v5-hs2x-L6-D4096-E0_1-mem-ctx-8k.pth\"\n", - "!cd ../../../model/ && wget -nc \"https://huggingface.co/rwkv-x-dev/rwkv-x-playground/resolve/main/experiment/rwkv-x-exp/v5-headsize2x/v5-hs2x-L6-D2048-E0_1-mem-ctx-8k.pth\"" - ] - }, - { - "cell_type": "code", - "execution_count": 2, - "id": "cc89cf61", - "metadata": { - "execution": { - "iopub.execute_input": "2023-08-30T19:35:58.769753Z", - "iopub.status.busy": "2023-08-30T19:35:58.769502Z", - "iopub.status.idle": "2023-08-30T19:35:58.989821Z", - "shell.execute_reply": "2023-08-30T19:35:58.989023Z" - }, - "papermill": { - "duration": 0.291092, - "end_time": "2023-08-30T19:35:58.991543", - "exception": false, - "start_time": "2023-08-30T19:35:58.700451", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "total 4.2G\r\n", - "-rw-r--r-- 1 root root 1018M Aug 26 02:06 v5-hs2x-L6-D2048-E0_1-mem-ctx-8k.pth\r\n", - "-rw-r--r-- 1 root root 3.3G Aug 25 07:41 v5-hs2x-L6-D4096-E0_1-mem-ctx-8k.pth\r\n" - ] - } - ], - "source": [ - "!ls -lh ../../../model/" - ] - }, - { - "cell_type": "code", - "execution_count": 3, - "id": "6c94a955", - "metadata": { - "execution": { - "iopub.execute_input": "2023-08-30T19:35:59.135760Z", - "iopub.status.busy": "2023-08-30T19:35:59.135509Z", - "iopub.status.idle": "2023-08-30T19:36:01.236453Z", - "shell.execute_reply": "2023-08-30T19:36:01.235575Z" - }, - "papermill": { - "duration": 2.172495, - "end_time": "2023-08-30T19:36:01.238248", - "exception": false, - "start_time": "2023-08-30T19:35:59.065753", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Requirement already satisfied: aiocsv in /usr/local/lib/python3.10/dist-packages (1.2.4)\r\n", - "Requirement already satisfied: aiofiles in /usr/local/lib/python3.10/dist-packages (23.2.1)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\u001b[33mWARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\u001b[0m\u001b[33m\r\n", - "\u001b[0m" - ] - } - ], - "source": [ - "!python3 -m pip install aiocsv aiofiles" - ] - }, - { - "cell_type": "markdown", - "id": "5c5420f9", - "metadata": { - "papermill": { - "duration": 0.068885, - "end_time": "2023-08-30T19:36:01.380403", - "exception": false, - "start_time": "2023-08-30T19:36:01.311518", - "status": "completed" - }, - "tags": [] - }, - "source": [ - "# headsize 2x (128) - L6-D4096" - ] - }, - { - "cell_type": "code", - "execution_count": 4, - "id": "70470497", - "metadata": { - "execution": { - "iopub.execute_input": "2023-08-30T19:36:01.520119Z", - "iopub.status.busy": "2023-08-30T19:36:01.519857Z", - "iopub.status.idle": "2023-08-30T19:36:39.973622Z", - "shell.execute_reply": "2023-08-30T19:36:39.972826Z" - }, - "papermill": { - "duration": 38.526028, - "end_time": "2023-08-30T19:36:39.975827", - "exception": false, - "start_time": "2023-08-30T19:36:01.449799", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-08-30 19:36:04,368] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation start ###\r\n", - "###\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5 tokens : 100.0% similarity, with 5 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10 tokens : 100.0% similarity, with 10 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15 tokens : 100.0% similarity, with 15 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 20 tokens : 100.0% similarity, with 20 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 25 tokens : 100.0% similarity, with 25 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 30 tokens : 100.0% similarity, with 30 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 35 tokens : 100.0% similarity, with 35 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 40 tokens : 100.0% similarity, with 40 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 45 tokens : 100.0% similarity, with 45 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 50 tokens : 100.0% similarity, with 50 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 55 tokens : 100.0% similarity, with 55 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 60 tokens : 98.33333333333333% similarity, with 59 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 65 tokens : 98.46153846153847% similarity, with 64 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 70 tokens : 98.57142857142858% similarity, with 69 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 75 tokens : 98.66666666666667% similarity, with 74 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 80 tokens : 96.25% similarity, with 77 matched token, and 3 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 85 tokens : 96.47058823529412% similarity, with 82 matched token, and 3 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 90 tokens : 96.66666666666667% similarity, with 87 matched token, and 3 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 95 tokens : 97.89473684210527% similarity, with 93 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 100 tokens : 99.0% similarity, with 99 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 105 tokens : 99.04761904761905% similarity, with 104 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 110 tokens : 98.18181818181819% similarity, with 108 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 115 tokens : 98.26086956521739% similarity, with 113 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 120 tokens : 98.33333333333333% similarity, with 118 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 125 tokens : 99.2% similarity, with 124 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 130 tokens : 99.23076923076923% similarity, with 129 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 135 tokens : 98.51851851851852% similarity, with 133 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 140 tokens : 98.57142857142858% similarity, with 138 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 145 tokens : 98.62068965517241% similarity, with 143 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 150 tokens : 98.66666666666667% similarity, with 148 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 160 tokens : 98.125% similarity, with 157 matched token, and 3 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 170 tokens : 97.6470588235294% similarity, with 166 matched token, and 4 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 180 tokens : 97.77777777777777% similarity, with 176 matched token, and 4 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 190 tokens : 98.42105263157895% similarity, with 187 matched token, and 3 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 200 tokens : 98.5% similarity, with 197 matched token, and 3 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 210 tokens : 99.04761904761905% similarity, with 208 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 220 tokens : 98.63636363636363% similarity, with 217 matched token, and 3 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 230 tokens : 99.1304347826087% similarity, with 228 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 240 tokens : 99.58333333333333% similarity, with 239 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 250 tokens : 99.6% similarity, with 249 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 260 tokens : 99.23076923076923% similarity, with 258 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 270 tokens : 98.14814814814815% similarity, with 265 matched token, and 5 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 280 tokens : 98.21428571428571% similarity, with 275 matched token, and 5 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 290 tokens : 97.93103448275862% similarity, with 284 matched token, and 6 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 300 tokens : 98.0% similarity, with 294 matched token, and 6 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 325 tokens : 98.15384615384616% similarity, with 319 matched token, and 6 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 350 tokens : 97.42857142857143% similarity, with 341 matched token, and 9 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 375 tokens : 96.0% similarity, with 360 matched token, and 15 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 400 tokens : 96.25% similarity, with 385 matched token, and 15 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 425 tokens : 95.52941176470588% similarity, with 406 matched token, and 19 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 450 tokens : 95.77777777777777% similarity, with 431 matched token, and 19 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 475 tokens : 95.36842105263158% similarity, with 453 matched token, and 22 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 500 tokens : 95.19999999999999% similarity, with 476 matched token, and 24 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 525 tokens : 94.47619047619048% similarity, with 496 matched token, and 29 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 550 tokens : 94.72727272727272% similarity, with 521 matched token, and 29 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 575 tokens : 94.78260869565217% similarity, with 545 matched token, and 30 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 600 tokens : 94.83333333333334% similarity, with 569 matched token, and 31 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 625 tokens : 94.88% similarity, with 593 matched token, and 32 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 650 tokens : 94.0% similarity, with 611 matched token, and 39 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 675 tokens : 94.37037037037037% similarity, with 637 matched token, and 38 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 700 tokens : 93.28571428571428% similarity, with 653 matched token, and 47 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 750 tokens : 93.2% similarity, with 699 matched token, and 51 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 800 tokens : 91.25% similarity, with 730 matched token, and 70 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 850 tokens : 90.23529411764706% similarity, with 767 matched token, and 83 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 900 tokens : 89.88888888888889% similarity, with 809 matched token, and 91 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 950 tokens : 89.57894736842105% similarity, with 851 matched token, and 99 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1000 tokens : 88.5% similarity, with 885 matched token, and 115 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Finished baseline model to eval output predictive matching (aka 0 memory?), for 1000 tokens\r\n", - "###\r\n", - "### Model validation end ###\r\n", - "###\r\n" - ] - } - ], - "source": [ - "!python3 ./memory_script/eval_v5headsize2x_memory_guided.py \"../../../model/v5-hs2x-L6-D4096-E0_1-mem-ctx-8k.pth\" \"./logs/v5-hs2x-L6-D4096-E0_1-1k.csv\"" - ] - }, - { - "cell_type": "code", - "execution_count": 5, - "id": "dec49f20", - "metadata": { - "execution": { - "iopub.execute_input": "2023-08-30T19:36:40.129023Z", - "iopub.status.busy": "2023-08-30T19:36:40.128447Z", - "iopub.status.idle": "2023-08-30T19:38:52.573399Z", - "shell.execute_reply": "2023-08-30T19:38:52.572594Z" - }, - "papermill": { - "duration": 132.520965, - "end_time": "2023-08-30T19:38:52.575430", - "exception": false, - "start_time": "2023-08-30T19:36:40.054465", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-08-30 19:36:42,984] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation start ###\r\n", - "###\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1100 tokens : 86.18181818181819% similarity, with 948 matched token, and 152 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1150 tokens : 85.04347826086956% similarity, with 978 matched token, and 172 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1200 tokens : 84.66666666666667% similarity, with 1016 matched token, and 184 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1250 tokens : 84.24000000000001% similarity, with 1053 matched token, and 197 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1300 tokens : 83.07692307692308% similarity, with 1080 matched token, and 220 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1350 tokens : 82.22222222222221% similarity, with 1110 matched token, and 240 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1400 tokens : 81.21428571428572% similarity, with 1137 matched token, and 263 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1450 tokens : 80.55172413793103% similarity, with 1168 matched token, and 282 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1500 tokens : 79.86666666666666% similarity, with 1198 matched token, and 302 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1550 tokens : 79.16129032258064% similarity, with 1227 matched token, and 323 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1600 tokens : 77.3125% similarity, with 1237 matched token, and 363 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1650 tokens : 75.63636363636364% similarity, with 1248 matched token, and 402 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1700 tokens : 74.3529411764706% similarity, with 1264 matched token, and 436 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1750 tokens : 72.39999999999999% similarity, with 1267 matched token, and 483 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1800 tokens : 70.22222222222221% similarity, with 1264 matched token, and 536 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1850 tokens : 69.62162162162161% similarity, with 1288 matched token, and 562 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1900 tokens : 68.78947368421052% similarity, with 1307 matched token, and 593 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1950 tokens : 67.02564102564102% similarity, with 1307 matched token, and 643 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2000 tokens : 66.3% similarity, with 1326 matched token, and 674 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2050 tokens : 64.04878048780488% similarity, with 1313 matched token, and 737 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2100 tokens : 63.714285714285715% similarity, with 1338 matched token, and 762 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2150 tokens : 62.83720930232558% similarity, with 1351 matched token, and 799 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2200 tokens : 61.68181818181818% similarity, with 1357 matched token, and 843 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2250 tokens : 60.84444444444445% similarity, with 1369 matched token, and 881 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2300 tokens : 58.39130434782609% similarity, with 1343 matched token, and 957 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2350 tokens : 57.53191489361702% similarity, with 1352 matched token, and 998 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2400 tokens : 56.41666666666667% similarity, with 1354 matched token, and 1046 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2450 tokens : 55.224489795918366% similarity, with 1353 matched token, and 1097 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2500 tokens : 54.44% similarity, with 1361 matched token, and 1139 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2550 tokens : 53.254901960784316% similarity, with 1358 matched token, and 1192 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2600 tokens : 51.76923076923077% similarity, with 1346 matched token, and 1254 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2650 tokens : 50.83018867924528% similarity, with 1347 matched token, and 1303 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2700 tokens : 49.81481481481482% similarity, with 1345 matched token, and 1355 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2750 tokens : 49.236363636363635% similarity, with 1354 matched token, and 1396 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2800 tokens : 48.32142857142857% similarity, with 1353 matched token, and 1447 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2850 tokens : 47.368421052631575% similarity, with 1350 matched token, and 1500 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2900 tokens : 46.310344827586206% similarity, with 1343 matched token, and 1557 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2950 tokens : 45.49152542372881% similarity, with 1342 matched token, and 1608 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3000 tokens : 44.56666666666666% similarity, with 1337 matched token, and 1663 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3050 tokens : 43.73770491803279% similarity, with 1334 matched token, and 1716 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3100 tokens : 42.516129032258064% similarity, with 1318 matched token, and 1782 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3150 tokens : 41.87301587301587% similarity, with 1319 matched token, and 1831 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3200 tokens : 41.1875% similarity, with 1318 matched token, and 1882 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3250 tokens : 40.43076923076923% similarity, with 1314 matched token, and 1936 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3300 tokens : 39.45454545454545% similarity, with 1302 matched token, and 1998 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3350 tokens : 38.80597014925373% similarity, with 1300 matched token, and 2050 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3400 tokens : 37.6764705882353% similarity, with 1281 matched token, and 2119 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3450 tokens : 36.63768115942029% similarity, with 1264 matched token, and 2186 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3500 tokens : 35.97142857142857% similarity, with 1259 matched token, and 2241 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3550 tokens : 35.23943661971831% similarity, with 1251 matched token, and 2299 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3600 tokens : 34.72222222222222% similarity, with 1250 matched token, and 2350 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3650 tokens : 33.91780821917808% similarity, with 1238 matched token, and 2412 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3700 tokens : 33.4054054054054% similarity, with 1236 matched token, and 2464 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3750 tokens : 32.373333333333335% similarity, with 1214 matched token, and 2536 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3800 tokens : 31.55263157894737% similarity, with 1199 matched token, and 2601 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3850 tokens : 30.857142857142854% similarity, with 1188 matched token, and 2662 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3900 tokens : 29.897435897435898% similarity, with 1166 matched token, and 2734 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3950 tokens : 28.987341772151897% similarity, with 1145 matched token, and 2805 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4000 tokens : 28.075% similarity, with 1123 matched token, and 2877 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation end ###\r\n", - "###\r\n" - ] - } - ], - "source": [ - "!python3 ./memory_script/eval_v5headsize2x_memory_guided.py \"../../../model/v5-hs2x-L6-D4096-E0_1-mem-ctx-8k.pth\" \"./logs/v5-hs2x-L6-D4096-E0_1-4k.csv\" 1100 4000" - ] - }, - { - "cell_type": "code", - "execution_count": 6, - "id": "a01e1fc2", - "metadata": { - "execution": { - "iopub.execute_input": "2023-08-30T19:38:52.731378Z", - "iopub.status.busy": "2023-08-30T19:38:52.731130Z", - "iopub.status.idle": "2023-08-30T20:18:52.636435Z", - "shell.execute_reply": "2023-08-30T20:18:52.635654Z" - }, - "papermill": { - "duration": 2399.982993, - "end_time": "2023-08-30T20:18:52.638397", - "exception": false, - "start_time": "2023-08-30T19:38:52.655404", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-08-30 19:38:55,624] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation start ###\r\n", - "###\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4100 tokens : 26.243902439024392% similarity, with 1076 matched token, and 3024 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4200 tokens : 24.952380952380953% similarity, with 1048 matched token, and 3152 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4300 tokens : 23.162790697674417% similarity, with 996 matched token, and 3304 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4400 tokens : 21.386363636363637% similarity, with 941 matched token, and 3459 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4500 tokens : 19.22222222222222% similarity, with 865 matched token, and 3635 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4600 tokens : 17.0% similarity, with 782 matched token, and 3818 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4700 tokens : 15.297872340425531% similarity, with 719 matched token, and 3981 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4800 tokens : 13.666666666666666% similarity, with 656 matched token, and 4144 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4900 tokens : 12.285714285714286% similarity, with 602 matched token, and 4298 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5000 tokens : 10.92% similarity, with 546 matched token, and 4454 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5100 tokens : 9.450980392156863% similarity, with 482 matched token, and 4618 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5200 tokens : 7.961538461538462% similarity, with 414 matched token, and 4786 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5300 tokens : 7.283018867924529% similarity, with 386 matched token, and 4914 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5400 tokens : 6.12962962962963% similarity, with 331 matched token, and 5069 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5500 tokens : 5.49090909090909% similarity, with 302 matched token, and 5198 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5600 tokens : 5.017857142857142% similarity, with 281 matched token, and 5319 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5700 tokens : 4.385964912280701% similarity, with 250 matched token, and 5450 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5800 tokens : 4.068965517241379% similarity, with 236 matched token, and 5564 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5900 tokens : 3.8474576271186436% similarity, with 227 matched token, and 5673 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6000 tokens : 3.733333333333334% similarity, with 224 matched token, and 5776 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6100 tokens : 3.5081967213114753% similarity, with 214 matched token, and 5886 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6200 tokens : 3.338709677419355% similarity, with 207 matched token, and 5993 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6300 tokens : 3.2222222222222223% similarity, with 203 matched token, and 6097 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6400 tokens : 3.2031249999999996% similarity, with 205 matched token, and 6195 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6500 tokens : 3.1846153846153844% similarity, with 207 matched token, and 6293 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6600 tokens : 3.1363636363636362% similarity, with 207 matched token, and 6393 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6700 tokens : 3.119402985074627% similarity, with 209 matched token, and 6491 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6800 tokens : 3.088235294117647% similarity, with 210 matched token, and 6590 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6900 tokens : 3.173913043478261% similarity, with 219 matched token, and 6681 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7000 tokens : 3.1285714285714286% similarity, with 219 matched token, and 6781 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7100 tokens : 3.140845070422535% similarity, with 223 matched token, and 6877 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7200 tokens : 3.111111111111111% similarity, with 224 matched token, and 6976 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7300 tokens : 3.1643835616438354% similarity, with 231 matched token, and 7069 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7400 tokens : 3.1621621621621623% similarity, with 234 matched token, and 7166 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7500 tokens : 3.1466666666666665% similarity, with 236 matched token, and 7264 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7600 tokens : 3.1578947368421053% similarity, with 240 matched token, and 7360 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7700 tokens : 3.1558441558441555% similarity, with 243 matched token, and 7457 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7800 tokens : 3.1538461538461537% similarity, with 246 matched token, and 7554 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7900 tokens : 3.151898734177215% similarity, with 249 matched token, and 7651 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8000 tokens : 3.1375% similarity, with 251 matched token, and 7749 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8100 tokens : 3.185185185185185% similarity, with 258 matched token, and 7842 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8200 tokens : 3.1707317073170733% similarity, with 260 matched token, and 7940 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8300 tokens : 3.156626506024096% similarity, with 262 matched token, and 8038 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8400 tokens : 3.130952380952381% similarity, with 263 matched token, and 8137 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8500 tokens : 3.2% similarity, with 272 matched token, and 8228 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8600 tokens : 3.1976744186046515% similarity, with 275 matched token, and 8325 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8700 tokens : 3.206896551724138% similarity, with 279 matched token, and 8421 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8800 tokens : 3.193181818181818% similarity, with 281 matched token, and 8519 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8900 tokens : 3.191011235955056% similarity, with 284 matched token, and 8616 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9000 tokens : 3.188888888888889% similarity, with 287 matched token, and 8713 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9100 tokens : 3.208791208791209% similarity, with 292 matched token, and 8808 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9200 tokens : 3.2282608695652173% similarity, with 297 matched token, and 8903 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9300 tokens : 3.21505376344086% similarity, with 299 matched token, and 9001 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9400 tokens : 3.1914893617021276% similarity, with 300 matched token, and 9100 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9500 tokens : 3.2105263157894735% similarity, with 305 matched token, and 9195 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9600 tokens : 3.21875% similarity, with 309 matched token, and 9291 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9700 tokens : 3.216494845360825% similarity, with 312 matched token, and 9388 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9800 tokens : 3.2040816326530615% similarity, with 314 matched token, and 9486 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9900 tokens : 3.2222222222222223% similarity, with 319 matched token, and 9581 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10000 tokens : 3.25% similarity, with 325 matched token, and 9675 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10100 tokens : 3.2574257425742577% similarity, with 329 matched token, and 9771 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10200 tokens : 3.2549019607843137% similarity, with 332 matched token, and 9868 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10300 tokens : 3.2427184466019416% similarity, with 334 matched token, and 9966 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10400 tokens : 3.240384615384615% similarity, with 337 matched token, and 10063 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10500 tokens : 3.257142857142857% similarity, with 342 matched token, and 10158 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10600 tokens : 3.2547169811320753% similarity, with 345 matched token, and 10255 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10700 tokens : 3.2710280373831773% similarity, with 350 matched token, and 10350 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10800 tokens : 3.2870370370370368% similarity, with 355 matched token, and 10445 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10900 tokens : 3.2660550458715596% similarity, with 356 matched token, and 10544 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11000 tokens : 3.2818181818181817% similarity, with 361 matched token, and 10639 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11100 tokens : 3.288288288288288% similarity, with 365 matched token, and 10735 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11200 tokens : 3.276785714285714% similarity, with 367 matched token, and 10833 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11300 tokens : 3.2920353982300887% similarity, with 372 matched token, and 10928 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11400 tokens : 3.324561403508772% similarity, with 379 matched token, and 11021 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11500 tokens : 3.3391304347826085% similarity, with 384 matched token, and 11116 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11600 tokens : 3.3448275862068964% similarity, with 388 matched token, and 11212 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11700 tokens : 3.3247863247863245% similarity, with 389 matched token, and 11311 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11800 tokens : 3.347457627118644% similarity, with 395 matched token, and 11405 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11900 tokens : 3.3361344537815127% similarity, with 397 matched token, and 11503 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12000 tokens : 3.3416666666666663% similarity, with 401 matched token, and 11599 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12100 tokens : 3.3636363636363638% similarity, with 407 matched token, and 11693 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12200 tokens : 3.344262295081967% similarity, with 408 matched token, and 11792 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12300 tokens : 3.3577235772357725% similarity, with 413 matched token, and 11887 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12400 tokens : 3.362903225806452% similarity, with 417 matched token, and 11983 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12500 tokens : 3.3680000000000003% similarity, with 421 matched token, and 12079 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12600 tokens : 3.3650793650793656% similarity, with 424 matched token, and 12176 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12700 tokens : 3.362204724409449% similarity, with 427 matched token, and 12273 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12800 tokens : 3.359375% similarity, with 430 matched token, and 12370 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12900 tokens : 3.3643410852713176% similarity, with 434 matched token, and 12466 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13000 tokens : 3.3692307692307697% similarity, with 438 matched token, and 12562 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13100 tokens : 3.381679389312977% similarity, with 443 matched token, and 12657 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13200 tokens : 3.3939393939393945% similarity, with 448 matched token, and 12752 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13300 tokens : 3.37593984962406% similarity, with 449 matched token, and 12851 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13400 tokens : 3.395522388059701% similarity, with 455 matched token, and 12945 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13500 tokens : 3.3851851851851853% similarity, with 457 matched token, and 13043 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13600 tokens : 3.4044117647058822% similarity, with 463 matched token, and 13137 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13700 tokens : 3.386861313868613% similarity, with 464 matched token, and 13236 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13800 tokens : 3.3913043478260874% similarity, with 468 matched token, and 13332 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13900 tokens : 3.3884892086330933% similarity, with 471 matched token, and 13429 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14000 tokens : 3.4357142857142855% similarity, with 481 matched token, and 13519 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14100 tokens : 3.4255319148936167% similarity, with 483 matched token, and 13617 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14200 tokens : 3.408450704225352% similarity, with 484 matched token, and 13716 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14300 tokens : 3.4055944055944054% similarity, with 487 matched token, and 13813 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14400 tokens : 3.4166666666666665% similarity, with 492 matched token, and 13908 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14500 tokens : 3.420689655172414% similarity, with 496 matched token, and 14004 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14600 tokens : 3.404109589041096% similarity, with 497 matched token, and 14103 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14700 tokens : 3.4421768707482996% similarity, with 506 matched token, and 14194 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14800 tokens : 3.4391891891891895% similarity, with 509 matched token, and 14291 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14900 tokens : 3.422818791946309% similarity, with 510 matched token, and 14390 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15000 tokens : 3.42% similarity, with 513 matched token, and 14487 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15100 tokens : 3.4172185430463573% similarity, with 516 matched token, and 14584 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15200 tokens : 3.4078947368421058% similarity, with 518 matched token, and 14682 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15300 tokens : 3.4117647058823533% similarity, with 522 matched token, and 14778 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15400 tokens : 3.4090909090909087% similarity, with 525 matched token, and 14875 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15500 tokens : 3.4000000000000004% similarity, with 527 matched token, and 14973 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15600 tokens : 3.4038461538461537% similarity, with 531 matched token, and 15069 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15700 tokens : 3.4012738853503186% similarity, with 534 matched token, and 15166 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15800 tokens : 3.3924050632911396% similarity, with 536 matched token, and 15264 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15900 tokens : 3.3962264150943398% similarity, with 540 matched token, and 15360 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 16000 tokens : 3.3875% similarity, with 542 matched token, and 15458 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation end ###\r\n", - "###\r\n" - ] - } - ], - "source": [ - "!python3 ./memory_script/eval_v5headsize2x_memory_guided.py \"../../../model/v5-hs2x-L6-D4096-E0_1-mem-ctx-8k.pth\" \"./logs/v5-hs2x-L6-D4096-E0_1-16k.csv\" 4100 16000" - ] - }, - { - "cell_type": "markdown", - "id": "3a1e70b7", - "metadata": { - "papermill": { - "duration": 0.079999, - "end_time": "2023-08-30T20:18:52.802267", - "exception": false, - "start_time": "2023-08-30T20:18:52.722268", - "status": "completed" - }, - "tags": [] - }, - "source": [ - "# headsize 2x (128) - L6-D2048" - ] - }, - { - "cell_type": "code", - "execution_count": 7, - "id": "fe346751", - "metadata": { - "execution": { - "iopub.execute_input": "2023-08-30T20:18:52.961416Z", - "iopub.status.busy": "2023-08-30T20:18:52.961150Z", - "iopub.status.idle": "2023-08-30T20:19:22.620977Z", - "shell.execute_reply": "2023-08-30T20:19:22.620229Z" - }, - "papermill": { - "duration": 29.741672, - "end_time": "2023-08-30T20:19:22.622972", - "exception": false, - "start_time": "2023-08-30T20:18:52.881300", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-08-30 20:18:55,846] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation start ###\r\n", - "###\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5 tokens : 100.0% similarity, with 5 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10 tokens : 100.0% similarity, with 10 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15 tokens : 100.0% similarity, with 15 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 20 tokens : 100.0% similarity, with 20 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 25 tokens : 100.0% similarity, with 25 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 30 tokens : 100.0% similarity, with 30 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 35 tokens : 100.0% similarity, with 35 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 40 tokens : 100.0% similarity, with 40 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 45 tokens : 100.0% similarity, with 45 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 50 tokens : 100.0% similarity, with 50 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 55 tokens : 100.0% similarity, with 55 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 60 tokens : 100.0% similarity, with 60 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 65 tokens : 100.0% similarity, with 65 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 70 tokens : 100.0% similarity, with 70 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 75 tokens : 98.66666666666667% similarity, with 74 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 80 tokens : 98.75% similarity, with 79 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 85 tokens : 98.82352941176471% similarity, with 84 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 90 tokens : 98.88888888888889% similarity, with 89 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 95 tokens : 98.94736842105263% similarity, with 94 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 100 tokens : 99.0% similarity, with 99 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 105 tokens : 99.04761904761905% similarity, with 104 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 110 tokens : 99.0909090909091% similarity, with 109 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 115 tokens : 99.1304347826087% similarity, with 114 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 120 tokens : 99.16666666666667% similarity, with 119 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 125 tokens : 99.2% similarity, with 124 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 130 tokens : 99.23076923076923% similarity, with 129 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 135 tokens : 99.25925925925925% similarity, with 134 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 140 tokens : 99.28571428571429% similarity, with 139 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 145 tokens : 99.3103448275862% similarity, with 144 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 150 tokens : 99.33333333333333% similarity, with 149 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 160 tokens : 99.375% similarity, with 159 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 170 tokens : 99.41176470588235% similarity, with 169 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 180 tokens : 99.44444444444444% similarity, with 179 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 190 tokens : 99.47368421052632% similarity, with 189 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 200 tokens : 99.5% similarity, with 199 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 210 tokens : 99.52380952380952% similarity, with 209 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 220 tokens : 99.54545454545455% similarity, with 219 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 230 tokens : 99.1304347826087% similarity, with 228 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 240 tokens : 99.58333333333333% similarity, with 239 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 250 tokens : 99.6% similarity, with 249 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 260 tokens : 99.61538461538461% similarity, with 259 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 270 tokens : 99.25925925925925% similarity, with 268 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 280 tokens : 98.92857142857143% similarity, with 277 matched token, and 3 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 290 tokens : 98.27586206896551% similarity, with 285 matched token, and 5 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 300 tokens : 98.33333333333333% similarity, with 295 matched token, and 5 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 325 tokens : 98.46153846153847% similarity, with 320 matched token, and 5 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 350 tokens : 98.0% similarity, with 343 matched token, and 7 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 375 tokens : 97.06666666666666% similarity, with 364 matched token, and 11 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 400 tokens : 97.25% similarity, with 389 matched token, and 11 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 425 tokens : 96.70588235294117% similarity, with 411 matched token, and 14 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 450 tokens : 95.33333333333334% similarity, with 429 matched token, and 21 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 475 tokens : 95.15789473684211% similarity, with 452 matched token, and 23 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 500 tokens : 95.39999999999999% similarity, with 477 matched token, and 23 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 525 tokens : 94.47619047619048% similarity, with 496 matched token, and 29 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 550 tokens : 94.9090909090909% similarity, with 522 matched token, and 28 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 575 tokens : 93.73913043478261% similarity, with 539 matched token, and 36 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 600 tokens : 93.16666666666666% similarity, with 559 matched token, and 41 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 625 tokens : 93.44% similarity, with 584 matched token, and 41 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 650 tokens : 92.46153846153847% similarity, with 601 matched token, and 49 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 675 tokens : 92.14814814814815% similarity, with 622 matched token, and 53 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 700 tokens : 92.14285714285714% similarity, with 645 matched token, and 55 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 750 tokens : 91.73333333333333% similarity, with 688 matched token, and 62 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 800 tokens : 91.125% similarity, with 729 matched token, and 71 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 850 tokens : 90.58823529411765% similarity, with 770 matched token, and 80 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 900 tokens : 88.66666666666667% similarity, with 798 matched token, and 102 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 950 tokens : 87.78947368421053% similarity, with 834 matched token, and 116 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1000 tokens : 87.5% similarity, with 875 matched token, and 125 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Finished baseline model to eval output predictive matching (aka 0 memory?), for 1000 tokens\r\n", - "###\r\n", - "### Model validation end ###\r\n", - "###\r\n" - ] - } - ], - "source": [ - "!python3 ./memory_script/eval_v5headsize2x_memory_guided.py \"../../../model/v5-hs2x-L6-D2048-E0_1-mem-ctx-8k.pth\" \"./logs/v5-hs2x-L6-D2048-E0_1-1k.csv\"" - ] - }, - { - "cell_type": "code", - "execution_count": 8, - "id": "44b0505e", - "metadata": { - "execution": { - "iopub.execute_input": "2023-08-30T20:19:22.797548Z", - "iopub.status.busy": "2023-08-30T20:19:22.797290Z", - "iopub.status.idle": "2023-08-30T20:21:09.096478Z", - "shell.execute_reply": "2023-08-30T20:21:09.095692Z" - }, - "papermill": { - "duration": 106.385333, - "end_time": "2023-08-30T20:21:09.098520", - "exception": false, - "start_time": "2023-08-30T20:19:22.713187", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-08-30 20:19:25,664] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation start ###\r\n", - "###\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1100 tokens : 85.81818181818181% similarity, with 944 matched token, and 156 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1150 tokens : 84.69565217391303% similarity, with 974 matched token, and 176 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1200 tokens : 82.75% similarity, with 993 matched token, and 207 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1250 tokens : 82.16% similarity, with 1027 matched token, and 223 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1300 tokens : 80.92307692307692% similarity, with 1052 matched token, and 248 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1350 tokens : 79.4074074074074% similarity, with 1072 matched token, and 278 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1400 tokens : 78.21428571428571% similarity, with 1095 matched token, and 305 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1450 tokens : 77.10344827586208% similarity, with 1118 matched token, and 332 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1500 tokens : 76.33333333333333% similarity, with 1145 matched token, and 355 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1550 tokens : 75.74193548387098% similarity, with 1174 matched token, and 376 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1600 tokens : 74.25% similarity, with 1188 matched token, and 412 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1650 tokens : 72.96969696969697% similarity, with 1204 matched token, and 446 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1700 tokens : 71.23529411764706% similarity, with 1211 matched token, and 489 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1750 tokens : 68.85714285714286% similarity, with 1205 matched token, and 545 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1800 tokens : 68.44444444444444% similarity, with 1232 matched token, and 568 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1850 tokens : 66.97297297297298% similarity, with 1239 matched token, and 611 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1900 tokens : 66.26315789473685% similarity, with 1259 matched token, and 641 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1950 tokens : 65.07692307692308% similarity, with 1269 matched token, and 681 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2000 tokens : 64.4% similarity, with 1288 matched token, and 712 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2050 tokens : 62.48780487804878% similarity, with 1281 matched token, and 769 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2100 tokens : 61.38095238095238% similarity, with 1289 matched token, and 811 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2150 tokens : 59.67441860465116% similarity, with 1283 matched token, and 867 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2200 tokens : 58.77272727272727% similarity, with 1293 matched token, and 907 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2250 tokens : 58.08888888888889% similarity, with 1307 matched token, and 943 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2300 tokens : 56.826086956521735% similarity, with 1307 matched token, and 993 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2350 tokens : 54.55319148936171% similarity, with 1282 matched token, and 1068 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2400 tokens : 54.0% similarity, with 1296 matched token, and 1104 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2450 tokens : 52.48979591836734% similarity, with 1286 matched token, and 1164 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2500 tokens : 51.160000000000004% similarity, with 1279 matched token, and 1221 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2550 tokens : 49.72549019607843% similarity, with 1268 matched token, and 1282 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2600 tokens : 49.11538461538461% similarity, with 1277 matched token, and 1323 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2650 tokens : 47.84905660377359% similarity, with 1268 matched token, and 1382 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2700 tokens : 46.925925925925924% similarity, with 1267 matched token, and 1433 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2750 tokens : 46.43636363636364% similarity, with 1277 matched token, and 1473 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2800 tokens : 45.464285714285715% similarity, with 1273 matched token, and 1527 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2850 tokens : 44.526315789473685% similarity, with 1269 matched token, and 1581 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2900 tokens : 44.03448275862069% similarity, with 1277 matched token, and 1623 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2950 tokens : 43.28813559322034% similarity, with 1277 matched token, and 1673 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3000 tokens : 42.36666666666667% similarity, with 1271 matched token, and 1729 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3050 tokens : 41.63934426229508% similarity, with 1270 matched token, and 1780 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3100 tokens : 41.096774193548384% similarity, with 1274 matched token, and 1826 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3150 tokens : 40.19047619047619% similarity, with 1266 matched token, and 1884 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3200 tokens : 39.53125% similarity, with 1265 matched token, and 1935 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3250 tokens : 38.95384615384616% similarity, with 1266 matched token, and 1984 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3300 tokens : 38.27272727272727% similarity, with 1263 matched token, and 2037 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3350 tokens : 37.55223880597015% similarity, with 1258 matched token, and 2092 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3400 tokens : 37.23529411764706% similarity, with 1266 matched token, and 2134 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3450 tokens : 36.231884057971016% similarity, with 1250 matched token, and 2200 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3500 tokens : 35.82857142857143% similarity, with 1254 matched token, and 2246 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3550 tokens : 34.845070422535215% similarity, with 1237 matched token, and 2313 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3600 tokens : 34.61111111111111% similarity, with 1246 matched token, and 2354 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3650 tokens : 33.89041095890411% similarity, with 1237 matched token, and 2413 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3700 tokens : 33.16216216216216% similarity, with 1227 matched token, and 2473 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3750 tokens : 32.77333333333333% similarity, with 1229 matched token, and 2521 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3800 tokens : 32.23684210526316% similarity, with 1225 matched token, and 2575 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3850 tokens : 31.558441558441558% similarity, with 1215 matched token, and 2635 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3900 tokens : 31.179487179487182% similarity, with 1216 matched token, and 2684 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3950 tokens : 30.531645569620252% similarity, with 1206 matched token, and 2744 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4000 tokens : 29.849999999999998% similarity, with 1194 matched token, and 2806 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation end ###\r\n", - "###\r\n" - ] - } - ], - "source": [ - "!python3 ./memory_script/eval_v5headsize2x_memory_guided.py \"../../../model/v5-hs2x-L6-D2048-E0_1-mem-ctx-8k.pth\" \"./logs/v5-hs2x-L6-D2048-E0_1-4k.csv\" 1100 4000" - ] - }, - { - "cell_type": "code", - "execution_count": 9, - "id": "386bd282", - "metadata": { - "execution": { - "iopub.execute_input": "2023-08-30T20:21:09.271034Z", - "iopub.status.busy": "2023-08-30T20:21:09.270783Z", - "iopub.status.idle": "2023-08-30T20:59:04.698141Z", - "shell.execute_reply": "2023-08-30T20:59:04.697352Z" - }, - "papermill": { - "duration": 2275.513837, - "end_time": "2023-08-30T20:59:04.700077", - "exception": false, - "start_time": "2023-08-30T20:21:09.186240", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-08-30 20:21:12,169] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation start ###\r\n", - "###\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4100 tokens : 28.46341463414634% similarity, with 1167 matched token, and 2933 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4200 tokens : 27.166666666666668% similarity, with 1141 matched token, and 3059 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4300 tokens : 25.813953488372093% similarity, with 1110 matched token, and 3190 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4400 tokens : 24.06818181818182% similarity, with 1059 matched token, and 3341 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4500 tokens : 22.466666666666665% similarity, with 1011 matched token, and 3489 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4600 tokens : 20.52173913043478% similarity, with 944 matched token, and 3656 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4700 tokens : 19.404255319148938% similarity, with 912 matched token, and 3788 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4800 tokens : 17.75% similarity, with 852 matched token, and 3948 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4900 tokens : 16.28571428571429% similarity, with 798 matched token, and 4102 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5000 tokens : 15.2% similarity, with 760 matched token, and 4240 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5100 tokens : 13.76470588235294% similarity, with 702 matched token, and 4398 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5200 tokens : 12.134615384615383% similarity, with 631 matched token, and 4569 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5300 tokens : 10.50943396226415% similarity, with 557 matched token, and 4743 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5400 tokens : 9.24074074074074% similarity, with 499 matched token, and 4901 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5500 tokens : 8.436363636363636% similarity, with 464 matched token, and 5036 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5600 tokens : 7.642857142857143% similarity, with 428 matched token, and 5172 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5700 tokens : 6.859649122807017% similarity, with 391 matched token, and 5309 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5800 tokens : 6.241379310344827% similarity, with 362 matched token, and 5438 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5900 tokens : 5.508474576271186% similarity, with 325 matched token, and 5575 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6000 tokens : 5.033333333333333% similarity, with 302 matched token, and 5698 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6100 tokens : 4.557377049180328% similarity, with 278 matched token, and 5822 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6200 tokens : 4.274193548387097% similarity, with 265 matched token, and 5935 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6300 tokens : 3.984126984126984% similarity, with 251 matched token, and 6049 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6400 tokens : 3.9218749999999996% similarity, with 251 matched token, and 6149 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6500 tokens : 3.8307692307692305% similarity, with 249 matched token, and 6251 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6600 tokens : 3.621212121212121% similarity, with 239 matched token, and 6361 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6700 tokens : 3.6865671641791047% similarity, with 247 matched token, and 6453 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6800 tokens : 3.514705882352941% similarity, with 239 matched token, and 6561 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6900 tokens : 3.5652173913043477% similarity, with 246 matched token, and 6654 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7000 tokens : 3.471428571428571% similarity, with 243 matched token, and 6757 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7100 tokens : 3.408450704225352% similarity, with 242 matched token, and 6858 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7200 tokens : 3.375% similarity, with 243 matched token, and 6957 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7300 tokens : 3.383561643835616% similarity, with 247 matched token, and 7053 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7400 tokens : 3.3648648648648654% similarity, with 249 matched token, and 7151 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7500 tokens : 3.32% similarity, with 249 matched token, and 7251 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7600 tokens : 3.3684210526315788% similarity, with 256 matched token, and 7344 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7700 tokens : 3.3636363636363638% similarity, with 259 matched token, and 7441 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7800 tokens : 3.346153846153846% similarity, with 261 matched token, and 7539 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7900 tokens : 3.329113924050633% similarity, with 263 matched token, and 7637 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8000 tokens : 3.3125% similarity, with 265 matched token, and 7735 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8100 tokens : 3.4074074074074074% similarity, with 276 matched token, and 7824 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8200 tokens : 3.3658536585365857% similarity, with 276 matched token, and 7924 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8300 tokens : 3.337349397590361% similarity, with 277 matched token, and 8023 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8400 tokens : 3.3214285714285716% similarity, with 279 matched token, and 8121 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8500 tokens : 3.3882352941176466% similarity, with 288 matched token, and 8212 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8600 tokens : 3.383720930232558% similarity, with 291 matched token, and 8309 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8700 tokens : 3.3908045977011496% similarity, with 295 matched token, and 8405 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8800 tokens : 3.375% similarity, with 297 matched token, and 8503 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8900 tokens : 3.359550561797753% similarity, with 299 matched token, and 8601 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9000 tokens : 3.3666666666666663% similarity, with 303 matched token, and 8697 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9100 tokens : 3.3626373626373627% similarity, with 306 matched token, and 8794 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9200 tokens : 3.369565217391304% similarity, with 310 matched token, and 8890 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9300 tokens : 3.344086021505376% similarity, with 311 matched token, and 8989 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9400 tokens : 3.3297872340425534% similarity, with 313 matched token, and 9087 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9500 tokens : 3.3684210526315788% similarity, with 320 matched token, and 9180 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9600 tokens : 3.3541666666666665% similarity, with 322 matched token, and 9278 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9700 tokens : 3.350515463917526% similarity, with 325 matched token, and 9375 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9800 tokens : 3.3265306122448983% similarity, with 326 matched token, and 9474 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9900 tokens : 3.3636363636363638% similarity, with 333 matched token, and 9567 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10000 tokens : 3.4000000000000004% similarity, with 340 matched token, and 9660 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10100 tokens : 3.425742574257426% similarity, with 346 matched token, and 9754 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10200 tokens : 3.4117647058823533% similarity, with 348 matched token, and 9852 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10300 tokens : 3.388349514563107% similarity, with 349 matched token, and 9951 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10400 tokens : 3.3942307692307696% similarity, with 353 matched token, and 10047 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10500 tokens : 3.419047619047619% similarity, with 359 matched token, and 10141 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10600 tokens : 3.3962264150943398% similarity, with 360 matched token, and 10240 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10700 tokens : 3.4392523364485985% similarity, with 368 matched token, and 10332 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10800 tokens : 3.4351851851851847% similarity, with 371 matched token, and 10429 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10900 tokens : 3.431192660550459% similarity, with 374 matched token, and 10526 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11000 tokens : 3.4454545454545453% similarity, with 379 matched token, and 10621 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11100 tokens : 3.432432432432433% similarity, with 381 matched token, and 10719 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11200 tokens : 3.428571428571429% similarity, with 384 matched token, and 10816 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11300 tokens : 3.433628318584071% similarity, with 388 matched token, and 10912 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11400 tokens : 3.482456140350877% similarity, with 397 matched token, and 11003 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11500 tokens : 3.5130434782608697% similarity, with 404 matched token, and 11096 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11600 tokens : 3.508620689655172% similarity, with 407 matched token, and 11193 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11700 tokens : 3.4957264957264957% similarity, with 409 matched token, and 11291 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11800 tokens : 3.5254237288135593% similarity, with 416 matched token, and 11384 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11900 tokens : 3.5126050420168067% similarity, with 418 matched token, and 11482 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12000 tokens : 3.5249999999999995% similarity, with 423 matched token, and 11577 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12100 tokens : 3.5371900826446283% similarity, with 428 matched token, and 11672 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12200 tokens : 3.5327868852459017% similarity, with 431 matched token, and 11769 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12300 tokens : 3.528455284552846% similarity, with 434 matched token, and 11866 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12400 tokens : 3.5241935483870965% similarity, with 437 matched token, and 11963 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12500 tokens : 3.504% similarity, with 438 matched token, and 12062 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12600 tokens : 3.507936507936508% similarity, with 442 matched token, and 12158 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12700 tokens : 3.5196850393700787% similarity, with 447 matched token, and 12253 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12800 tokens : 3.515625% similarity, with 450 matched token, and 12350 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12900 tokens : 3.5193798449612403% similarity, with 454 matched token, and 12446 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13000 tokens : 3.523076923076923% similarity, with 458 matched token, and 12542 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13100 tokens : 3.5038167938931295% similarity, with 459 matched token, and 12641 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13200 tokens : 3.5151515151515147% similarity, with 464 matched token, and 12736 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13300 tokens : 3.496240601503759% similarity, with 465 matched token, and 12835 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13400 tokens : 3.544776119402985% similarity, with 475 matched token, and 12925 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13500 tokens : 3.5111111111111115% similarity, with 474 matched token, and 13026 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13600 tokens : 3.5367647058823533% similarity, with 481 matched token, and 13119 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13700 tokens : 3.5328467153284673% similarity, with 484 matched token, and 13216 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13800 tokens : 3.5072463768115942% similarity, with 484 matched token, and 13316 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13900 tokens : 3.553956834532374% similarity, with 494 matched token, and 13406 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14000 tokens : 3.564285714285714% similarity, with 499 matched token, and 13501 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14100 tokens : 3.5673758865248226% similarity, with 503 matched token, and 13597 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14200 tokens : 3.549295774647887% similarity, with 504 matched token, and 13696 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14300 tokens : 3.5454545454545454% similarity, with 507 matched token, and 13793 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14400 tokens : 3.5624999999999996% similarity, with 513 matched token, and 13887 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14500 tokens : 3.5586206896551724% similarity, with 516 matched token, and 13984 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14600 tokens : 3.5479452054794516% similarity, with 518 matched token, and 14082 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14700 tokens : 3.5918367346938775% similarity, with 528 matched token, and 14172 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14800 tokens : 3.567567567567568% similarity, with 528 matched token, and 14272 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14900 tokens : 3.577181208053691% similarity, with 533 matched token, and 14367 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15000 tokens : 3.56% similarity, with 534 matched token, and 14466 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15100 tokens : 3.562913907284768% similarity, with 538 matched token, and 14562 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15200 tokens : 3.55921052631579% similarity, with 541 matched token, and 14659 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15300 tokens : 3.5620915032679736% similarity, with 545 matched token, and 14755 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15400 tokens : 3.5584415584415585% similarity, with 548 matched token, and 14852 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15500 tokens : 3.561290322580645% similarity, with 552 matched token, and 14948 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15600 tokens : 3.5705128205128203% similarity, with 557 matched token, and 15043 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15700 tokens : 3.579617834394905% similarity, with 562 matched token, and 15138 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15800 tokens : 3.5632911392405062% similarity, with 563 matched token, and 15237 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15900 tokens : 3.5534591194968552% similarity, with 565 matched token, and 15335 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 16000 tokens : 3.5374999999999996% similarity, with 566 matched token, and 15434 token mismatch\r\n", - "###\r\n", - "### Model validation end ###\r\n", - "###\r\n" - ] - } - ], - "source": [ - "!python3 ./memory_script/eval_v5headsize2x_memory_guided.py \"../../../model/v5-hs2x-L6-D2048-E0_1-mem-ctx-8k.pth\" \"./logs/v5-hs2x-L6-D2048-E0_1-16k.csv\" 4100 16000" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "rwkv-infctx", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.10.12" - }, - "papermill": { - "default_parameters": {}, - "duration": 5447.312882, - "end_time": "2023-08-30T20:59:04.918766", - "environment_variables": {}, - "exception": null, - "input_path": "/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/Benchmark-V5headsize2x.ipynb", - "output_path": "/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/Benchmark-V5headsize2x.ipynb", - "parameters": {}, - "start_time": "2023-08-30T19:28:17.605884", - "version": "2.4.0" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} \ No newline at end of file