{ "cells": [ { "cell_type": "markdown", "id": "cf73c4cf", "metadata": { "papermill": { "duration": 0.004145, "end_time": "2023-09-05T19:58:25.321223", "exception": false, "start_time": "2023-09-05T19:58:25.317078", "status": "completed" }, "tags": [] }, "source": [ "## Custom Experimental Memory Benchmarking\n", "\n", "This notebook observes the memory performance of the baseline Raven models, using a more verbose CSV logging mode." ] }, { "cell_type": "code", "execution_count": 1, "id": "aaec4faf", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T19:58:25.330738Z", "iopub.status.busy": "2023-09-05T19:58:25.330236Z", "iopub.status.idle": "2023-09-05T20:04:41.032031Z", "shell.execute_reply": "2023-09-05T20:04:41.030878Z" }, "papermill": { "duration": 375.709392, "end_time": "2023-09-05T20:04:41.034546", "exception": false, "start_time": "2023-09-05T19:58:25.325154", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "--2023-09-05 19:58:25-- https://huggingface.co/picocreator/memory-size-experiment-for-rwkv/resolve/main/RWKV-v5-baseline/BaseV5-C-Tune5.pth\r\n", "Resolving huggingface.co (huggingface.co)... 18.154.227.7, 18.154.227.67, 18.154.227.69, ...\r\n", "Connecting to huggingface.co (huggingface.co)|18.154.227.7|:443... connected.\r\n", "HTTP request sent, awaiting response... 
302 Found\r\n", "Location: https://cdn-lfs.huggingface.co/repos/cb/ef/cbef09abb2634a3375b28868bffa285226dfeabedec89b28c2fb302221164d66/c1f89b4d653a240f6f165d25988b51f6db36bf8a2388707e3e3242af751575eb?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27BaseV5-C-Tune5.pth%3B+filename%3D%22BaseV5-C-Tune5.pth%22%3B&Expires=1694203105&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzEwNX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy9jYi9lZi9jYmVmMDlhYmIyNjM0YTMzNzViMjg4NjhiZmZhMjg1MjI2ZGZlYWJlZGVjODliMjhjMmZiMzAyMjIxMTY0ZDY2L2MxZjg5YjRkNjUzYTI0MGY2ZjE2NWQyNTk4OGI1MWY2ZGIzNmJmOGEyMzg4NzA3ZTNlMzI0MmFmNzUxNTc1ZWI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=ykou8uLrNIvdiZlMOBKSa-TxcLOCLvMDjj9o4SZ5Vj1ovca53yzWCgEu7VINUQKO2GvnX4ivd153xcBlbnlzlCtGT96pIKOf6AT1KwcIthqxPj4SnMm7LaZOfOQPQ2HcRQjLRp9S-ThMRXwrniPe4iB4USdcqbP%7E3YnQRQ7YCnrqrEzF2A7SX8ubT-oNXDevc3Cj21BKYo6qlYuTK%7EMCChwgmcq7EX%7EeP%7E9I3A02TvxkM302k1m-Ex%7ERjA7k0Px9xUp0otVtDIir65Y0mMafarGbJIgtI3T-mQQRYyxn6pymYMLV5td%7EXExISwcje1-Gwsc4cLPgh8rrj7Kr9J2WZg__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", "--2023-09-05 19:58:25-- 
https://cdn-lfs.huggingface.co/repos/cb/ef/cbef09abb2634a3375b28868bffa285226dfeabedec89b28c2fb302221164d66/c1f89b4d653a240f6f165d25988b51f6db36bf8a2388707e3e3242af751575eb?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27BaseV5-C-Tune5.pth%3B+filename%3D%22BaseV5-C-Tune5.pth%22%3B&Expires=1694203105&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzEwNX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy9jYi9lZi9jYmVmMDlhYmIyNjM0YTMzNzViMjg4NjhiZmZhMjg1MjI2ZGZlYWJlZGVjODliMjhjMmZiMzAyMjIxMTY0ZDY2L2MxZjg5YjRkNjUzYTI0MGY2ZjE2NWQyNTk4OGI1MWY2ZGIzNmJmOGEyMzg4NzA3ZTNlMzI0MmFmNzUxNTc1ZWI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=ykou8uLrNIvdiZlMOBKSa-TxcLOCLvMDjj9o4SZ5Vj1ovca53yzWCgEu7VINUQKO2GvnX4ivd153xcBlbnlzlCtGT96pIKOf6AT1KwcIthqxPj4SnMm7LaZOfOQPQ2HcRQjLRp9S-ThMRXwrniPe4iB4USdcqbP%7E3YnQRQ7YCnrqrEzF2A7SX8ubT-oNXDevc3Cj21BKYo6qlYuTK%7EMCChwgmcq7EX%7EeP%7E9I3A02TvxkM302k1m-Ex%7ERjA7k0Px9xUp0otVtDIir65Y0mMafarGbJIgtI3T-mQQRYyxn6pymYMLV5td%7EXExISwcje1-Gwsc4cLPgh8rrj7Kr9J2WZg__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.49, 108.138.64.111, 108.138.64.36, ...\r\n", "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.49|:443... connected.\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "HTTP request sent, awaiting response... 
" ] }, { "name": "stdout", "output_type": "stream", "text": [ "200 OK\r\n", "Length: 6060483063 (5.6G) [binary/octet-stream]\r\n", "Saving to: ‘BaseV5-C-Tune5.pth’\r\n", "\r\n", "\r", "BaseV5-C-Tune5.pth 0%[ ] 0 --.-KB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 0%[ ] 15.26M 61.3MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 0%[ ] 30.52M 67.6MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 0%[ ] 45.78M 61.0MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 1%[ ] 60.52M 61.9MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 1%[ ] 61.03M 50.8MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 1%[ ] 76.41M 51.9MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 1%[ ] 91.55M 54.7MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 1%[ ] 106.29M 56.5MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 1%[ ] 106.81M 51.3MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 2%[ ] 122.07M 53.3MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 2%[ ] 137.33M 51.5MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 2%[ ] 152.59M 50.9MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 2%[ ] 162.26M 50.7MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 2%[ ] 167.85M 48.0MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 3%[ ] 182.59M 48.0MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", 
"BaseV5-C-Tune5.pth 3%[ ] 189.42M 47.3MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 3%[ ] 198.36M 46.6MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 3%[ ] 206.18M 45.3MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 3%[ ] 213.74M 43.4MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 3%[ ] 228.87M 43.3MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 4%[ ] 244.13M 43.2MB/s eta 1m 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 4%[ ] 252.57M 42.5MB/s eta 1m 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 4%[ ] 259.40M 42.0MB/s eta 1m 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 4%[ ] 282.07M 44.6MB/s eta 1m 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 5%[> ] 289.92M 43.5MB/s eta 1m 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 5%[> ] 305.18M 43.5MB/s eta 1m 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 5%[> ] 320.43M 42.4MB/s eta 1m 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 5%[> ] 340.13M 45.8MB/s eta 1m 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 6%[> ] 350.39M 46.0MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 6%[> ] 358.96M 46.4MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 6%[> ] 381.47M 50.1MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 6%[> ] 396.73M 
50.6MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 7%[> ] 411.47M 53.5MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 7%[> ] 416.17M 52.6MB/s eta 1m 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 7%[> ] 427.25M 52.3MB/s eta 1m 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 7%[> ] 442.51M 51.7MB/s eta 1m 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 7%[> ] 455.18M 53.4MB/s eta 1m 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 7%[> ] 457.76M 51.2MB/s eta 1m 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 8%[> ] 472.50M 54.1MB/s eta 1m 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 8%[> ] 476.21M 50.8MB/s eta 1m 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 8%[> ] 488.28M 50.2MB/s eta 1m 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 8%[> ] 502.28M 50.0MB/s eta 1m 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 9%[> ] 532.23M 54.6MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 9%[> ] 540.75M 52.4MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 9%[> ] 549.31M 54.1MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 9%[> ] 564.58M 50.6MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 10%[=> ] 579.31M 51.0MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 10%[=> ] 593.27M 49.9MB/s eta 1m 44s " ] }, 
{ "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 10%[=> ] 610.35M 50.6MB/s eta 1m 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 10%[=> ] 625.61M 53.3MB/s eta 1m 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 10%[=> ] 635.17M 53.9MB/s eta 1m 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 11%[=> ] 640.87M 50.4MB/s eta 1m 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 11%[=> ] 656.13M 51.3MB/s eta 1m 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 11%[=> ] 670.87M 50.0MB/s eta 1m 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 11%[=> ] 684.82M 53.1MB/s eta 1m 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 11%[=> ] 686.64M 49.2MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 12%[=> ] 701.39M 51.6MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 12%[=> ] 717.16M 48.9MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 12%[=> ] 732.42M 47.2MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 12%[=> ] 747.69M 46.6MB/s eta 1m 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 13%[=> ] 762.94M 47.2MB/s eta 1m 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 13%[=> ] 767.13M 44.7MB/s eta 1m 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 13%[=> ] 778.20M 45.5MB/s eta 1m 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 13%[=> ] 791.63M 46.0MB/s eta 1m 43s " ] }, 
{ "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 13%[=> ] 793.46M 42.8MB/s eta 1m 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 13%[=> ] 808.71M 41.9MB/s eta 1m 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 14%[=> ] 823.97M 42.7MB/s eta 1m 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 14%[=> ] 839.23M 43.7MB/s eta 1m 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 14%[=> ] 853.98M 44.2MB/s eta 1m 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 15%[==> ] 869.24M 45.9MB/s eta 1m 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 15%[==> ] 882.01M 45.5MB/s eta 1m 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 15%[==> ] 885.01M 46.0MB/s eta 1m 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 15%[==> ] 899.75M 46.5MB/s eta 1m 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 15%[==> ] 915.01M 44.4MB/s eta 1m 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 16%[==> ] 930.27M 46.6MB/s eta 1m 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 16%[==> ] 939.22M 45.3MB/s eta 1m 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 16%[==> ] 946.04M 44.1MB/s eta 1m 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 16%[==> ] 961.30M 44.8MB/s eta 1m 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 16%[==> ] 976.55M 46.2MB/s eta 1m 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 17%[==> ] 991.82M 46.6MB/s eta 1m 
41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 17%[==> ] 1007M 46.9MB/s eta 1m 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 17%[==> ] 1007M 46.0MB/s eta 1m 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 17%[==> ] 1022M 46.5MB/s eta 1m 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 17%[==> ] 1.01G 46.2MB/s eta 1m 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 18%[==> ] 1.03G 45.1MB/s eta 1m 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 18%[==> ] 1.04G 47.6MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 18%[==> ] 1.04G 45.0MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 18%[==> ] 1.06G 45.5MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 18%[==> ] 1.06G 43.5MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 19%[==> ] 1.07G 43.7MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 19%[==> ] 1.09G 43.7MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 19%[==> ] 1.09G 42.9MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 19%[==> ] 1.10G 41.8MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 19%[==> ] 1.12G 43.0MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 19%[==> ] 1.12G 39.4MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 20%[===> ] 1.13G 41.5MB/s eta 99s " ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "\r", "BaseV5-C-Tune5.pth 20%[===> ] 1.15G 40.3MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 20%[===> ] 1.16G 39.5MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 20%[===> ] 1.17G 38.3MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 20%[===> ] 1.18G 40.2MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 21%[===> ] 1.19G 40.4MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 21%[===> ] 1.21G 39.5MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 21%[===> ] 1.22G 41.4MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 21%[===> ] 1.24G 41.9MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 22%[===> ] 1.25G 42.6MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 22%[===> ] 1.27G 44.5MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 22%[===> ] 1.28G 43.6MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 22%[===> ] 1.29G 46.3MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 23%[===> ] 1.30G 45.9MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 23%[===> ] 1.30G 44.5MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 23%[===> ] 1.31G 44.9MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 23%[===> ] 1.31G 39.0MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 
23%[===> ] 1.31G 38.1MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 23%[===> ] 1.33G 38.3MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 23%[===> ] 1.34G 38.9MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 24%[===> ] 1.37G 41.1MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 24%[===> ] 1.37G 39.7MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 24%[===> ] 1.39G 39.7MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 24%[===> ] 1.40G 38.1MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 25%[====> ] 1.42G 37.7MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 25%[====> ] 1.43G 36.2MB/s eta 95s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 25%[====> ] 1.44G 38.6MB/s eta 95s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 25%[====> ] 1.45G 35.3MB/s eta 95s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 25%[====> ] 1.46G 37.0MB/s eta 95s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 26%[====> ] 1.47G 39.6MB/s eta 94s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 26%[====> ] 1.48G 40.5MB/s eta 94s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 26%[====> ] 1.49G 41.8MB/s eta 94s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 26%[====> ] 1.50G 44.1MB/s eta 94s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 26%[====> ] 1.51G 45.6MB/s eta 94s " ] 
}, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 26%[====> ] 1.52G 45.4MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 27%[====> ] 1.53G 44.7MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 27%[====> ] 1.54G 41.4MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 27%[====> ] 1.55G 40.4MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 27%[====> ] 1.56G 40.5MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 28%[====> ] 1.59G 44.7MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 28%[====> ] 1.59G 44.2MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 28%[====> ] 1.60G 43.1MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 28%[====> ] 1.61G 43.4MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 28%[====> ] 1.62G 45.2MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 29%[====> ] 1.64G 46.1MB/s eta 90s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 29%[====> ] 1.65G 45.3MB/s eta 90s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 29%[====> ] 1.65G 42.5MB/s eta 90s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 29%[====> ] 1.66G 41.6MB/s eta 90s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 29%[====> ] 1.67G 40.0MB/s eta 90s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 29%[====> ] 1.68G 43.1MB/s eta 90s " ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 30%[=====> ] 1.70G 42.7MB/s eta 90s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 30%[=====> ] 1.71G 45.1MB/s eta 90s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 30%[=====> ] 1.72G 44.8MB/s eta 90s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 30%[=====> ] 1.73G 46.3MB/s eta 89s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 30%[=====> ] 1.74G 47.4MB/s eta 89s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 31%[=====> ] 1.76G 47.1MB/s eta 89s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 31%[=====> ] 1.77G 44.3MB/s eta 89s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 31%[=====> ] 1.79G 46.4MB/s eta 87s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 31%[=====> ] 1.79G 45.9MB/s eta 87s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 31%[=====> ] 1.80G 45.3MB/s eta 87s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 32%[=====> ] 1.82G 44.6MB/s eta 87s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 32%[=====> ] 1.82G 43.9MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 32%[=====> ] 1.83G 43.5MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 32%[=====> ] 1.85G 42.9MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 32%[=====> ] 1.86G 45.9MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 32%[=====> ] 1.86G 46.2MB/s eta 86s " ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "\r", "BaseV5-C-Tune5.pth 33%[=====> ] 1.86G 45.2MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 33%[=====> ] 1.88G 45.5MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 33%[=====> ] 1.89G 45.2MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 33%[=====> ] 1.91G 47.1MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 34%[=====> ] 1.92G 46.0MB/s eta 84s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 34%[=====> ] 1.94G 45.8MB/s eta 84s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 34%[=====> ] 1.95G 45.3MB/s eta 84s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 34%[=====> ] 1.97G 45.7MB/s eta 84s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 35%[======> ] 1.98G 46.2MB/s eta 82s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 35%[======> ] 1.98G 45.6MB/s eta 82s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 35%[======> ] 2.00G 43.6MB/s eta 82s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 35%[======> ] 2.01G 44.9MB/s eta 82s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 35%[======> ] 2.02G 44.0MB/s eta 82s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 36%[======> ] 2.04G 46.1MB/s eta 82s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 36%[======> ] 2.04G 44.6MB/s eta 82s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 36%[======> ] 2.06G 46.8MB/s eta 81s " ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "\r", "BaseV5-C-Tune5.pth 36%[======> ] 2.07G 47.3MB/s eta 81s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 36%[======> ] 2.08G 45.3MB/s eta 81s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 37%[======> ] 2.10G 48.0MB/s eta 81s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 37%[======> ] 2.12G 45.6MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 37%[======> ] 2.12G 42.9MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 37%[======> ] 2.13G 40.2MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 37%[======> ] 2.13G 39.4MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 38%[======> ] 2.15G 40.5MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 38%[======> ] 2.16G 39.9MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 38%[======> ] 2.17G 43.0MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 38%[======> ] 2.18G 40.1MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 38%[======> ] 2.19G 42.6MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 39%[======> ] 2.21G 44.4MB/s eta 78s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 39%[======> ] 2.21G 42.6MB/s eta 78s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 39%[======> ] 2.22G 41.0MB/s eta 78s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 39%[======> ] 2.23G 42.1MB/s eta 78s " ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "\r", "BaseV5-C-Tune5.pth 39%[======> ] 2.23G 39.8MB/s eta 78s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 39%[======> ] 2.25G 41.5MB/s eta 77s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 39%[======> ] 2.25G 40.6MB/s eta 77s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 40%[=======> ] 2.26G 39.0MB/s eta 77s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 40%[=======> ] 2.29G 41.8MB/s eta 77s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 40%[=======> ] 2.31G 48.5MB/s eta 76s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 40%[=======> ] 2.31G 44.5MB/s eta 76s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 40%[=======> ] 2.31G 43.3MB/s eta 76s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 41%[=======> ] 2.32G 40.6MB/s eta 76s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 41%[=======> ] 2.34G 42.9MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 41%[=======> ] 2.35G 41.5MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 41%[=======> ] 2.37G 43.3MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 42%[=======> ] 2.38G 44.3MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 42%[=======> ] 2.39G 44.3MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 42%[=======> ] 2.40G 46.1MB/s eta 74s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 42%[=======> ] 2.41G 45.2MB/s eta 74s " ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 43%[=======> ] 2.43G 46.5MB/s eta 74s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 43%[=======> ] 2.44G 49.4MB/s eta 74s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 43%[=======> ] 2.45G 46.9MB/s eta 73s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 43%[=======> ] 2.46G 45.0MB/s eta 73s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 43%[=======> ] 2.47G 43.5MB/s eta 73s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 44%[=======> ] 2.49G 43.9MB/s eta 72s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 44%[=======> ] 2.50G 47.7MB/s eta 72s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 44%[=======> ] 2.51G 46.2MB/s eta 72s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 44%[=======> ] 2.52G 46.1MB/s eta 72s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 44%[=======> ] 2.53G 45.3MB/s eta 71s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 45%[========> ] 2.55G 45.5MB/s eta 71s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 45%[========> ] 2.56G 46.1MB/s eta 71s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 45%[========> ] 2.56G 44.2MB/s eta 71s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 45%[========> ] 2.58G 44.9MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 46%[========> ] 2.60G 47.1MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 46%[========> ] 2.61G 46.3MB/s eta 70s " ] 
}, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 46%[========> ] 2.62G 47.3MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 46%[========> ] 2.64G 48.2MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 46%[========> ] 2.64G 46.1MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 46%[========> ] 2.65G 47.2MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 47%[========> ] 2.67G 46.0MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 47%[========> ] 2.68G 47.8MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 47%[========> ] 2.70G 50.3MB/s eta 67s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 48%[========> ] 2.71G 50.5MB/s eta 67s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 48%[========> ] 2.73G 50.5MB/s eta 67s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 48%[========> ] 2.74G 53.0MB/s eta 67s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 48%[========> ] 2.76G 50.7MB/s eta 65s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 49%[========> ] 2.77G 49.9MB/s eta 65s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 49%[========> ] 2.77G 51.3MB/s eta 65s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 49%[========> ] 2.78G 51.3MB/s eta 65s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 49%[========> ] 2.79G 48.2MB/s eta 65s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 
49%[========> ] 2.80G 48.2MB/s eta 64s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 49%[========> ] 2.82G 48.0MB/s eta 64s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 50%[=========> ] 2.83G 48.5MB/s eta 64s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 50%[=========> ] 2.85G 48.2MB/s eta 64s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 50%[=========> ] 2.86G 48.4MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 50%[=========> ] 2.86G 44.2MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 50%[=========> ] 2.87G 44.1MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 50%[=========> ] 2.88G 43.8MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 51%[=========> ] 2.89G 42.9MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 51%[=========> ] 2.90G 44.6MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 51%[=========> ] 2.91G 40.1MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 51%[=========> ] 2.92G 43.4MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 52%[=========> ] 2.93G 44.2MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 52%[=========> ] 2.94G 45.0MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 52%[=========> ] 2.95G 39.8MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 52%[=========> ] 2.96G 37.8MB/s eta 61s " ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "\r", "BaseV5-C-Tune5.pth 52%[=========> ] 2.96G 38.6MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 52%[=========> ] 2.98G 37.8MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 52%[=========> ] 2.98G 37.4MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 53%[=========> ] 3.00G 35.8MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 53%[=========> ] 3.00G 34.2MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 53%[=========> ] 3.01G 37.1MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 53%[=========> ] 3.02G 38.2MB/s eta 60s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 53%[=========> ] 3.03G 39.9MB/s eta 60s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 53%[=========> ] 3.04G 37.5MB/s eta 60s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 54%[=========> ] 3.05G 40.4MB/s eta 60s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 54%[=========> ] 3.06G 40.4MB/s eta 60s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 54%[=========> ] 3.07G 41.2MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 54%[=========> ] 3.08G 39.5MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 54%[=========> ] 3.10G 41.3MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 55%[==========> ] 3.11G 41.4MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 55%[==========> ] 3.13G 41.8MB/s 
eta 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 55%[==========> ] 3.14G 44.4MB/s eta 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 55%[==========> ] 3.16G 46.2MB/s eta 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 56%[==========> ] 3.17G 47.9MB/s eta 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 56%[==========> ] 3.19G 48.7MB/s eta 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 56%[==========> ] 3.20G 50.1MB/s eta 55s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 56%[==========> ] 3.21G 52.3MB/s eta 55s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 57%[==========> ] 3.23G 54.4MB/s eta 55s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 57%[==========> ] 3.23G 52.9MB/s eta 55s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 57%[==========> ] 3.25G 52.5MB/s eta 55s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 57%[==========> ] 3.26G 53.8MB/s eta 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 58%[==========> ] 3.28G 54.6MB/s eta 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 58%[==========> ] 3.29G 56.2MB/s eta 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 58%[==========> ] 3.30G 56.0MB/s eta 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 58%[==========> ] 3.31G 55.1MB/s eta 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 58%[==========> ] 3.32G 54.4MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", 
"text": [ "\r", "BaseV5-C-Tune5.pth 59%[==========> ] 3.34G 53.6MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 59%[==========> ] 3.35G 56.0MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 59%[==========> ] 3.37G 56.2MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 59%[==========> ] 3.37G 52.1MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 59%[==========> ] 3.38G 54.2MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 59%[==========> ] 3.38G 50.2MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 60%[===========> ] 3.40G 48.0MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 60%[===========> ] 3.41G 47.9MB/s eta 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 60%[===========> ] 3.43G 47.6MB/s eta 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 60%[===========> ] 3.43G 44.6MB/s eta 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 60%[===========> ] 3.44G 43.0MB/s eta 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 61%[===========> ] 3.46G 43.8MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 61%[===========> ] 3.47G 45.6MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 61%[===========> ] 3.47G 43.9MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 61%[===========> ] 3.49G 43.4MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 61%[===========> ] 
3.49G 39.3MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 62%[===========> ] 3.50G 42.4MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 62%[===========> ] 3.52G 39.4MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 62%[===========> ] 3.53G 41.6MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 62%[===========> ] 3.55G 42.1MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 63%[===========> ] 3.56G 45.4MB/s eta 47s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 63%[===========> ] 3.58G 47.9MB/s eta 47s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 63%[===========> ] 3.58G 43.9MB/s eta 47s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 63%[===========> ] 3.59G 47.3MB/s eta 47s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 63%[===========> ] 3.60G 45.5MB/s eta 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 63%[===========> ] 3.61G 43.0MB/s eta 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 64%[===========> ] 3.62G 44.2MB/s eta 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 64%[===========> ] 3.64G 43.5MB/s eta 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 64%[===========> ] 3.65G 45.0MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 64%[===========> ] 3.67G 44.2MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 65%[============> ] 3.68G 48.1MB/s eta 45s " ] }, { "name": 
"stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 65%[============> ] 3.69G 47.1MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 65%[============> ] 3.71G 46.2MB/s eta 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 65%[============> ] 3.72G 49.3MB/s eta 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 66%[============> ] 3.72G 43.7MB/s eta 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 66%[============> ] 3.74G 42.6MB/s eta 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 66%[============> ] 3.75G 43.8MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 66%[============> ] 3.76G 46.0MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 66%[============> ] 3.77G 45.6MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 67%[============> ] 3.79G 48.9MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 67%[============> ] 3.80G 49.8MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 67%[============> ] 3.81G 50.5MB/s eta 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 67%[============> ] 3.81G 48.8MB/s eta 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 67%[============> ] 3.83G 47.3MB/s eta 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 68%[============> ] 3.85G 49.0MB/s eta 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 68%[============> ] 3.86G 48.2MB/s eta 40s " ] }, { "name": "stdout", "output_type": "stream", 
"text": [ "\r", "BaseV5-C-Tune5.pth 68%[============> ] 3.87G 46.7MB/s eta 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 68%[============> ] 3.89G 47.1MB/s eta 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 69%[============> ] 3.90G 46.8MB/s eta 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 69%[============> ] 3.91G 44.9MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 69%[============> ] 3.93G 49.0MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 69%[============> ] 3.93G 46.4MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 69%[============> ] 3.94G 43.3MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 69%[============> ] 3.95G 43.9MB/s eta 38s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 70%[=============> ] 3.96G 43.9MB/s eta 38s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 70%[=============> ] 3.98G 44.2MB/s eta 38s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 70%[=============> ] 3.99G 43.2MB/s eta 38s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 71%[=============> ] 4.01G 45.9MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 71%[=============> ] 4.02G 46.5MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 71%[=============> ] 4.02G 46.1MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 71%[=============> ] 4.04G 47.3MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", 
"BaseV5-C-Tune5.pth 71%[=============> ] 4.05G 45.5MB/s eta 36s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 72%[=============> ] 4.08G 47.3MB/s eta 36s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 72%[=============> ] 4.08G 48.5MB/s eta 36s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 72%[=============> ] 4.10G 49.9MB/s eta 36s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 72%[=============> ] 4.11G 49.3MB/s eta 36s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 72%[=============> ] 4.12G 47.1MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 73%[=============> ] 4.13G 49.1MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 73%[=============> ] 4.13G 48.9MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 73%[=============> ] 4.13G 46.9MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 73%[=============> ] 4.14G 45.6MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 73%[=============> ] 4.16G 48.3MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 73%[=============> ] 4.16G 47.3MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 73%[=============> ] 4.17G 46.6MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 74%[=============> ] 4.19G 47.4MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 74%[=============> ] 4.20G 47.7MB/s eta 32s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 
74%[=============> ] 4.21G 45.7MB/s eta 32s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 74%[=============> ] 4.22G 46.3MB/s eta 32s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 75%[==============> ] 4.24G 51.0MB/s eta 32s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 75%[==============> ] 4.26G 49.9MB/s eta 32s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 75%[==============> ] 4.27G 48.2MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 75%[==============> ] 4.27G 45.4MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 75%[==============> ] 4.28G 44.7MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 76%[==============> ] 4.29G 45.8MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 76%[==============> ] 4.31G 47.6MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 76%[==============> ] 4.32G 49.4MB/s eta 30s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 76%[==============> ] 4.34G 53.6MB/s eta 30s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 77%[==============> ] 4.35G 52.4MB/s eta 30s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 77%[==============> ] 4.35G 52.2MB/s eta 30s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 77%[==============> ] 4.37G 51.0MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 77%[==============> ] 4.37G 50.1MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 
77%[==============> ] 4.38G 50.4MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 77%[==============> ] 4.39G 49.4MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 78%[==============> ] 4.41G 51.4MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 78%[==============> ] 4.41G 47.5MB/s eta 28s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 78%[==============> ] 4.43G 48.8MB/s eta 28s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 78%[==============> ] 4.44G 46.8MB/s eta 28s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 78%[==============> ] 4.46G 46.6MB/s eta 28s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 79%[==============> ] 4.47G 46.6MB/s eta 26s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 79%[==============> ] 4.48G 47.1MB/s eta 26s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 79%[==============> ] 4.50G 48.6MB/s eta 26s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 79%[==============> ] 4.51G 51.0MB/s eta 26s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 80%[===============> ] 4.53G 48.6MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 80%[===============> ] 4.54G 47.3MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 80%[===============> ] 4.55G 46.7MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 80%[===============> ] 4.56G 48.6MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 
81%[===============> ] 4.57G 50.5MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 81%[===============> ] 4.59G 51.3MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 81%[===============> ] 4.60G 52.3MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 81%[===============> ] 4.61G 52.6MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 81%[===============> ] 4.62G 51.2MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 82%[===============> ] 4.63G 53.8MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 82%[===============> ] 4.65G 53.4MB/s eta 22s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 82%[===============> ] 4.65G 50.5MB/s eta 22s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 82%[===============> ] 4.66G 51.3MB/s eta 22s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 82%[===============> ] 4.68G 50.3MB/s eta 22s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 83%[===============> ] 4.69G 50.6MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 83%[===============> ] 4.69G 48.4MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 83%[===============> ] 4.71G 49.1MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 83%[===============> ] 4.72G 48.8MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 83%[===============> ] 4.74G 48.9MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", 
"BaseV5-C-Tune5.pth 84%[===============> ] 4.75G 47.1MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 84%[===============> ] 4.77G 49.3MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 84%[===============> ] 4.78G 51.0MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 85%[================> ] 4.80G 50.7MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 85%[================> ] 4.81G 51.0MB/s eta 18s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 85%[================> ] 4.82G 49.5MB/s eta 18s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 85%[================> ] 4.83G 45.3MB/s eta 18s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 85%[================> ] 4.84G 46.8MB/s eta 18s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 86%[================> ] 4.86G 47.3MB/s eta 18s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 86%[================> ] 4.87G 49.0MB/s eta 18s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 86%[================> ] 4.89G 46.8MB/s eta 18s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 86%[================> ] 4.90G 47.9MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 87%[================> ] 4.92G 48.2MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 87%[================> ] 4.93G 48.5MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 87%[================> ] 4.95G 48.5MB/s eta 16s " ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "\r", "BaseV5-C-Tune5.pth 87%[================> ] 4.95G 46.3MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 87%[================> ] 4.96G 47.7MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 87%[================> ] 4.96G 45.5MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 88%[================> ] 4.98G 44.7MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 88%[================> ] 4.98G 42.7MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 88%[================> ] 4.99G 39.5MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 88%[================> ] 5.00G 41.0MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 88%[================> ] 5.02G 42.5MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 88%[================> ] 5.02G 41.8MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 89%[================> ] 5.04G 41.1MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 89%[================> ] 5.05G 41.3MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 89%[================> ] 5.05G 36.6MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 89%[================> ] 5.07G 39.2MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 89%[================> ] 5.07G 37.7MB/s eta 13s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 90%[=================> ] 5.08G 36.2MB/s eta 13s " ] }, { 
"name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 90%[=================> ] 5.10G 37.0MB/s eta 13s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 90%[=================> ] 5.11G 39.6MB/s eta 13s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 90%[=================> ] 5.12G 39.4MB/s eta 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 91%[=================> ] 5.14G 41.6MB/s eta 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 91%[=================> ] 5.14G 40.0MB/s eta 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 91%[=================> ] 5.16G 42.4MB/s eta 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 91%[=================> ] 5.17G 43.9MB/s eta 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 91%[=================> ] 5.17G 41.0MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 91%[=================> ] 5.19G 43.9MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 92%[=================> ] 5.20G 44.1MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 92%[=================> ] 5.21G 44.2MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 92%[=================> ] 5.23G 44.7MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 92%[=================> ] 5.24G 44.5MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 93%[=================> ] 5.25G 45.6MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 
93%[=================> ] 5.26G 49.2MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 93%[=================> ] 5.27G 48.5MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 93%[=================> ] 5.29G 49.6MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 93%[=================> ] 5.29G 46.3MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 94%[=================> ] 5.31G 47.3MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 94%[=================> ] 5.32G 47.0MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 94%[=================> ] 5.33G 49.8MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 94%[=================> ] 5.35G 49.5MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 95%[==================> ] 5.36G 48.9MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 95%[==================> ] 5.38G 51.0MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 95%[==================> ] 5.39G 52.7MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 95%[==================> ] 5.41G 53.1MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 95%[==================> ] 5.41G 51.9MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 96%[==================> ] 5.42G 51.9MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 96%[==================> ] 5.44G 53.3MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", 
"text": [ "\r", "BaseV5-C-Tune5.pth 96%[==================> ] 5.45G 53.7MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 96%[==================> ] 5.46G 53.6MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 96%[==================> ] 5.47G 52.1MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 97%[==================> ] 5.49G 53.2MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 97%[==================> ] 5.50G 52.6MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 97%[==================> ] 5.51G 52.9MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 97%[==================> ] 5.51G 52.5MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 97%[==================> ] 5.52G 49.7MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 97%[==================> ] 5.53G 49.4MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 98%[==================> ] 5.54G 48.4MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 98%[==================> ] 5.56G 48.0MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 98%[==================> ] 5.57G 50.4MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 99%[==================> ] 5.59G 48.2MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 99%[==================> ] 5.60G 48.7MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 99%[==================> ] 5.62G 47.2MB/s eta 1s " ] }, { 
"name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 99%[==================> ] 5.63G 50.1MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 99%[==================> ] 5.63G 46.6MB/s eta 0s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "BaseV5-C-Tune5.pth 99%[==================> ] 5.64G 44.2MB/s eta 0s \r", "BaseV5-C-Tune5.pth 100%[===================>] 5.64G 44.3MB/s in 2m 6s \r\n", "\r\n", "2023-09-05 20:00:31 (46.0 MB/s) - ‘BaseV5-C-Tune5.pth’ saved [6060483063/6060483063]\r\n", "\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "--2023-09-05 20:00:31-- https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/EWR-1B5-E0_1-mem-ctx-8k.pth\r\n", "Resolving huggingface.co (huggingface.co)... 18.154.227.67, 18.154.227.7, 18.154.227.69, ...\r\n", "Connecting to huggingface.co (huggingface.co)|18.154.227.67|:443... connected.\r\n", "HTTP request sent, awaiting response... 
" ] }, { "name": "stdout", "output_type": "stream", "text": [ "302 Found\r\n", "Location: https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/e886ffafd5148b502a00b1c10c847ca918cec61c4c956956a2fe9811c210029b?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27EWR-1B5-E0_1-mem-ctx-8k.pth%3B+filename%3D%22EWR-1B5-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203231&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzIzMX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwL2U4ODZmZmFmZDUxNDhiNTAyYTAwYjFjMTBjODQ3Y2E5MThjZWM2MWM0Yzk1Njk1NmEyZmU5ODExYzIxMDAyOWI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=H7dALzpJjHXiRmYXfCi5wdUGBxT-ks5NF0PcdQAODDoHu%7E%7EBwyHOnsQGokQKeqqOmFA-%7E2cFXnl87ifEl3RrCl-xYvtCqJsTu-PCrHupXjKegnvyjToQCJIDtyW5f4RJ9aMmecwsGyTEJG1Nz0q-7Xm4OQfTBH-ItJ34BnzDQgW2XnuVav0keVtbME-KGM-ors8KbEGdI-tHni2lihjuxbBBxaV226vGo9Q7jssSP7WPLseWzK3-16BBLv3At3JjlpxbmDMCBFqNxBnJZbyTsrwmAIRj31kHFM15VSAa0y0CRfQ1Uh09OgdQr2zjlEWgU0mqpgv0M53%7ELLAtQP%7E%7ENw__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", "--2023-09-05 20:00:31-- 
https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/e886ffafd5148b502a00b1c10c847ca918cec61c4c956956a2fe9811c210029b?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27EWR-1B5-E0_1-mem-ctx-8k.pth%3B+filename%3D%22EWR-1B5-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203231&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzIzMX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwL2U4ODZmZmFmZDUxNDhiNTAyYTAwYjFjMTBjODQ3Y2E5MThjZWM2MWM0Yzk1Njk1NmEyZmU5ODExYzIxMDAyOWI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=H7dALzpJjHXiRmYXfCi5wdUGBxT-ks5NF0PcdQAODDoHu%7E%7EBwyHOnsQGokQKeqqOmFA-%7E2cFXnl87ifEl3RrCl-xYvtCqJsTu-PCrHupXjKegnvyjToQCJIDtyW5f4RJ9aMmecwsGyTEJG1Nz0q-7Xm4OQfTBH-ItJ34BnzDQgW2XnuVav0keVtbME-KGM-ors8KbEGdI-tHni2lihjuxbBBxaV226vGo9Q7jssSP7WPLseWzK3-16BBLv3At3JjlpxbmDMCBFqNxBnJZbyTsrwmAIRj31kHFM15VSAa0y0CRfQ1Uh09OgdQr2zjlEWgU0mqpgv0M53%7ELLAtQP%7E%7ENw__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.111, 108.138.64.36, 108.138.64.49, ...\r\n", "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.111|:443... connected.\r\n", "HTTP request sent, awaiting response... 
" ] }, { "name": "stdout", "output_type": "stream", "text": [ "200 OK\r\n", "Length: 6060483163 (5.6G) [binary/octet-stream]\r\n", "Saving to: ‘EWR-1B5-E0_1-mem-ctx-8k.pth’\r\n", "\r\n", "\r", " EWR-1B5-E 0%[ ] 0 --.-KB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0 0%[ ] 14.74M 63.3MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_ 0%[ ] 17.24M 39.8MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1 0%[ ] 30.00M 46.2MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1- 0%[ ] 30.52M 33.1MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-m 0%[ ] 46.48M 41.5MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-me 1%[ ] 60.52M 41.9MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem 1%[ ] 62.21M 37.8MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem- 1%[ ] 76.29M 39.9MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem-c 1%[ ] 91.55M 41.8MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "EWR-1B5-E0_1-mem-ct 1%[ ] 106.81M 41.6MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "WR-1B5-E0_1-mem-ctx 2%[ ] 120.25M 43.2MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "R-1B5-E0_1-mem-ctx- 2%[ ] 127.59M 42.8MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-1B5-E0_1-mem-ctx-8 2%[ ] 137.33M 42.9MB/s eta 2m 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1B5-E0_1-mem-ctx-8k 2%[ ] 152.45M 44.6MB/s eta 2m 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "B5-E0_1-mem-ctx-8k. 
2%[ ] 152.59M 41.9MB/s eta 2m 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-E0_1-mem-ctx-8k.p 2%[ ] 163.51M 42.6MB/s eta 2m 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 3%[ ] 181.57M 45.0MB/s eta 2m 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 3%[ ] 183.10M 42.7MB/s eta 2m 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 3%[ ] 198.36M 40.6MB/s eta 2m 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 3%[ ] 213.62M 43.7MB/s eta 2m 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 3%[ ] 228.36M 43.1MB/s eta 2m 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 4%[ ] 239.57M 46.2MB/s eta 2m 6s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 4%[ ] 244.13M 42.5MB/s eta 2m 6s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 4%[ ] 259.40M 42.9MB/s eta 2m 6s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 4%[ ] 274.52M 45.9MB/s eta 2m 6s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 5%[> ] 289.92M 44.5MB/s eta 2m 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 5%[> ] 305.18M 45.2MB/s eta 2m 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 5%[> ] 320.56M 45.1MB/s eta 2m 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 5%[> ] 335.18M 47.6MB/s eta 2m 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 6%[> ] 350.95M 48.8MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 6%[> ] 366.20M 46.3MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 6%[> ] 381.47M 
49.4MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 6%[> ] 396.73M 48.3MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 7%[> ] 414.61M 49.7MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 7%[> ] 426.73M 51.4MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 7%[> ] 430.51M 49.0MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 7%[> ] 440.68M 48.0MB/s eta 1m 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " E 7%[> ] 455.93M 49.6MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EW 7%[> ] 460.26M 48.1MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR 8%[> ] 468.32M 46.0MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR- 8%[> ] 473.50M 46.0MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1 8%[> ] 488.28M 44.7MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B 8%[> ] 503.54M 40.7MB/s eta 2m 0s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5 8%[> ] 518.80M 44.0MB/s eta 2m 0s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5- 9%[> ] 534.05M 40.9MB/s eta 2m 0s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E 9%[> ] 548.80M 43.9MB/s eta 2m 0s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0 9%[> ] 556.34M 41.7MB/s eta 2m 0s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_ 9%[> ] 564.58M 43.2MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1 9%[> ] 577.31M 41.3MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1- 10%[=> ] 
579.83M 39.0MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-m 10%[=> ] 594.57M 42.3MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-me 10%[=> ] 605.08M 42.6MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem 10%[=> ] 610.35M 41.2MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem- 10%[=> ] 625.61M 42.7MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem-c 11%[=> ] 640.87M 43.7MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "EWR-1B5-E0_1-mem-ct 11%[=> ] 656.13M 45.2MB/s eta 1m 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "WR-1B5-E0_1-mem-ctx 11%[=> ] 671.38M 45.5MB/s eta 1m 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "R-1B5-E0_1-mem-ctx- 11%[=> ] 686.64M 44.7MB/s eta 1m 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-1B5-E0_1-mem-ctx-8 12%[=> ] 701.90M 45.3MB/s eta 1m 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1B5-E0_1-mem-ctx-8k 12%[=> ] 716.64M 44.2MB/s eta 1m 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "B5-E0_1-mem-ctx-8k. 
12%[=> ] 719.78M 44.5MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-E0_1-mem-ctx-8k.p 12%[=> ] 731.91M 44.2MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 12%[=> ] 744.53M 46.8MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 12%[=> ] 747.81M 43.0MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 13%[=> ] 762.42M 45.4MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 13%[=> ] 763.07M 42.7MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 13%[=> ] 778.20M 43.9MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 13%[=> ] 793.31M 46.6MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 13%[=> ] 800.53M 46.0MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 13%[=> ] 808.20M 44.3MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 14%[=> ] 809.59M 41.2MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 14%[=> ] 823.97M 43.5MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 14%[=> ] 838.71M 42.0MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 14%[=> ] 841.85M 41.5MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 14%[=> ] 854.49M 40.3MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 14%[=> ] 857.55M 37.3MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 15%[==> ] 869.75M 40.7MB/s eta 1m 52s " ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "\r", "k.pth 15%[==> ] 879.33M 39.7MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 15%[==> ] 884.49M 40.9MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 15%[==> ] 889.88M 38.8MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 15%[==> ] 897.75M 39.9MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 15%[==> ] 915.53M 38.6MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 16%[==> ] 930.78M 38.1MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " E 16%[==> ] 941.84M 37.3MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EW 16%[==> ] 943.71M 37.1MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR 16%[==> ] 945.90M 34.5MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR- 16%[==> ] 957.54M 37.2MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1 16%[==> ] 961.30M 34.2MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B 16%[==> ] 976.55M 34.6MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5 17%[==> ] 991.82M 37.2MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5- 17%[==> ] 1007M 37.8MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E 17%[==> ] 1007M 36.4MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0 17%[==> ] 1011M 34.6MB/s eta 1m 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_ 17%[==> ] 1022M 36.0MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1 17%[==> ] 1.01G 
36.2MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1- 18%[==> ] 1.03G 37.6MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-m 18%[==> ] 1.03G 36.0MB/s eta 1m 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-me 18%[==> ] 1.04G 36.9MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem 18%[==> ] 1.06G 34.0MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem- 18%[==> ] 1.07G 36.7MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem-c 19%[==> ] 1.07G 34.1MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "EWR-1B5-E0_1-mem-ct 19%[==> ] 1.09G 36.6MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "WR-1B5-E0_1-mem-ctx 19%[==> ] 1.10G 39.1MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "R-1B5-E0_1-mem-ctx- 19%[==> ] 1.11G 39.9MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-1B5-E0_1-mem-ctx-8 19%[==> ] 1.12G 40.3MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1B5-E0_1-mem-ctx-8k 20%[===> ] 1.14G 41.6MB/s eta 1m 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "B5-E0_1-mem-ctx-8k. 
20%[===> ] 1.15G 40.8MB/s eta 1m 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-E0_1-mem-ctx-8k.p 20%[===> ] 1.16G 43.4MB/s eta 1m 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 20%[===> ] 1.16G 40.8MB/s eta 1m 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 20%[===> ] 1.18G 40.5MB/s eta 1m 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 21%[===> ] 1.19G 45.1MB/s eta 1m 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 21%[===> ] 1.20G 44.9MB/s eta 1m 47s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 21%[===> ] 1.21G 43.8MB/s eta 1m 47s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 21%[===> ] 1.21G 42.0MB/s eta 1m 47s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 21%[===> ] 1.22G 42.6MB/s eta 1m 47s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 21%[===> ] 1.24G 41.8MB/s eta 1m 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 22%[===> ] 1.25G 43.7MB/s eta 1m 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 22%[===> ] 1.27G 47.1MB/s eta 1m 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 22%[===> ] 1.27G 43.4MB/s eta 1m 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 22%[===> ] 1.28G 46.2MB/s eta 1m 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 22%[===> ] 1.29G 45.2MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 22%[===> ] 1.30G 43.1MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 23%[===> ] 1.31G 41.9MB/s eta 1m 45s " ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "\r", "k.pth 23%[===> ] 1.31G 39.3MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 23%[===> ] 1.33G 39.3MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 23%[===> ] 1.34G 39.3MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 24%[===> ] 1.36G 40.4MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 24%[===> ] 1.37G 42.9MB/s eta 1m 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 24%[===> ] 1.38G 42.9MB/s eta 1m 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " E 24%[===> ] 1.39G 44.0MB/s eta 1m 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EW 24%[===> ] 1.40G 42.5MB/s eta 1m 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR 25%[====> ] 1.42G 45.6MB/s eta 1m 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR- 25%[====> ] 1.43G 45.6MB/s eta 1m 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1 25%[====> ] 1.44G 43.5MB/s eta 1m 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B 25%[====> ] 1.45G 44.9MB/s eta 1m 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5 25%[====> ] 1.46G 44.4MB/s eta 1m 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5- 25%[====> ] 1.46G 43.8MB/s eta 1m 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E 26%[====> ] 1.47G 43.9MB/s eta 1m 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0 26%[====> ] 1.48G 44.1MB/s eta 1m 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_ 26%[====> ] 1.49G 43.7MB/s eta 1m 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1 26%[====> ] 1.50G 
44.9MB/s eta 1m 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1- 26%[====> ] 1.52G 42.6MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-m 27%[====> ] 1.53G 45.9MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-me 27%[====> ] 1.55G 45.0MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem 27%[====> ] 1.55G 44.0MB/s eta 99s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem- 27%[====> ] 1.56G 43.3MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem-c 27%[====> ] 1.57G 42.3MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "EWR-1B5-E0_1-mem-ct 27%[====> ] 1.58G 42.6MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "WR-1B5-E0_1-mem-ctx 28%[====> ] 1.59G 43.4MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "R-1B5-E0_1-mem-ctx- 28%[====> ] 1.59G 40.2MB/s eta 98s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-1B5-E0_1-mem-ctx-8 28%[====> ] 1.61G 39.3MB/s eta 97s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1B5-E0_1-mem-ctx-8k 28%[====> ] 1.61G 39.9MB/s eta 97s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "B5-E0_1-mem-ctx-8k. 
28%[====> ] 1.63G 38.4MB/s eta 97s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-E0_1-mem-ctx-8k.p 28%[====> ] 1.63G 40.2MB/s eta 97s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 29%[====> ] 1.64G 38.5MB/s eta 97s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 29%[====> ] 1.65G 38.1MB/s eta 97s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 29%[====> ] 1.67G 38.2MB/s eta 97s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 29%[====> ] 1.68G 41.0MB/s eta 97s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 29%[====> ] 1.68G 39.2MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 30%[=====> ] 1.70G 37.8MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 30%[=====> ] 1.72G 43.1MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 30%[=====> ] 1.73G 40.9MB/s eta 96s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 30%[=====> ] 1.74G 43.3MB/s eta 94s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 31%[=====> ] 1.76G 44.5MB/s eta 94s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 31%[=====> ] 1.77G 43.4MB/s eta 94s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 31%[=====> ] 1.79G 43.4MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 31%[=====> ] 1.80G 45.5MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 31%[=====> ] 1.80G 43.8MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 32%[=====> ] 1.82G 44.6MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ 
"\r", "k.pth 32%[=====> ] 1.82G 42.7MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 32%[=====> ] 1.83G 42.1MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 32%[=====> ] 1.84G 44.6MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 32%[=====> ] 1.85G 41.3MB/s eta 93s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 32%[=====> ] 1.86G 40.6MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 33%[=====> ] 1.87G 43.2MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " E 33%[=====> ] 1.88G 39.2MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EW 33%[=====> ] 1.88G 37.0MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR 33%[=====> ] 1.89G 35.3MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR- 33%[=====> ] 1.91G 37.0MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1 33%[=====> ] 1.92G 35.6MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B 34%[=====> ] 1.92G 36.1MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5 34%[=====> ] 1.94G 37.9MB/s eta 91s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5- 34%[=====> ] 1.95G 39.7MB/s eta 89s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E 34%[=====> ] 1.97G 41.9MB/s eta 89s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0 35%[======> ] 1.98G 42.5MB/s eta 89s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_ 35%[======> ] 2.00G 43.7MB/s eta 89s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1 35%[======> ] 2.00G 43.1MB/s eta 88s " ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "\r", " EWR-1B5-E0_1- 35%[======> ] 2.01G 41.4MB/s eta 88s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-m 35%[======> ] 2.03G 44.7MB/s eta 88s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-me 36%[======> ] 2.04G 44.7MB/s eta 88s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem 36%[======> ] 2.05G 46.8MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem- 36%[======> ] 2.06G 48.3MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem-c 36%[======> ] 2.07G 49.5MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "EWR-1B5-E0_1-mem-ct 36%[======> ] 2.08G 49.0MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "WR-1B5-E0_1-mem-ctx 37%[======> ] 2.10G 52.4MB/s eta 86s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "R-1B5-E0_1-mem-ctx- 37%[======> ] 2.10G 48.9MB/s eta 85s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-1B5-E0_1-mem-ctx-8 37%[======> ] 2.12G 46.7MB/s eta 85s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1B5-E0_1-mem-ctx-8k 37%[======> ] 2.13G 46.7MB/s eta 85s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "B5-E0_1-mem-ctx-8k. 
38%[======> ] 2.15G 45.1MB/s eta 84s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-E0_1-mem-ctx-8k.p 38%[======> ] 2.16G 43.6MB/s eta 84s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 38%[======> ] 2.17G 44.2MB/s eta 84s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 38%[======> ] 2.17G 42.6MB/s eta 84s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 38%[======> ] 2.19G 44.6MB/s eta 83s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 39%[======> ] 2.20G 43.8MB/s eta 83s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 39%[======> ] 2.22G 44.4MB/s eta 83s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 39%[======> ] 2.23G 47.0MB/s eta 83s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 39%[======> ] 2.25G 46.2MB/s eta 81s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 39%[======> ] 2.25G 44.5MB/s eta 81s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 40%[=======> ] 2.26G 45.0MB/s eta 81s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 40%[=======> ] 2.28G 44.9MB/s eta 81s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 40%[=======> ] 2.29G 43.2MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 40%[=======> ] 2.31G 47.7MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 40%[=======> ] 2.31G 43.4MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 41%[=======> ] 2.32G 46.1MB/s eta 80s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 41%[=======> ] 2.33G 46.9MB/s eta 80s " ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "\r", "k.pth 41%[=======> ] 2.34G 46.2MB/s eta 79s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 41%[=======> ] 2.35G 46.5MB/s eta 79s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 41%[=======> ] 2.37G 46.2MB/s eta 79s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 42%[=======> ] 2.38G 46.2MB/s eta 79s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 42%[=======> ] 2.38G 43.9MB/s eta 78s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 42%[=======> ] 2.40G 42.8MB/s eta 78s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " E 42%[=======> ] 2.41G 42.4MB/s eta 78s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EW 42%[=======> ] 2.41G 41.4MB/s eta 78s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR 42%[=======> ] 2.41G 40.8MB/s eta 78s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR- 42%[=======> ] 2.42G 38.1MB/s eta 77s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1 43%[=======> ] 2.43G 37.2MB/s eta 77s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B 43%[=======> ] 2.44G 36.3MB/s eta 77s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5 43%[=======> ] 2.45G 37.6MB/s eta 77s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5- 43%[=======> ] 2.46G 36.6MB/s eta 77s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E 43%[=======> ] 2.47G 37.1MB/s eta 76s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0 44%[=======> ] 2.49G 39.2MB/s eta 76s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_ 44%[=======> ] 2.50G 37.7MB/s eta 76s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1 44%[=======> ] 
2.52G 37.0MB/s eta 76s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1- 44%[=======> ] 2.52G 37.7MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-m 44%[=======> ] 2.53G 39.3MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-me 44%[=======> ] 2.54G 38.0MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem 45%[========> ] 2.55G 34.9MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem- 45%[========> ] 2.55G 33.6MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem-c 45%[========> ] 2.56G 34.4MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "EWR-1B5-E0_1-mem-ct 45%[========> ] 2.58G 35.9MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "WR-1B5-E0_1-mem-ctx 45%[========> ] 2.59G 37.2MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "R-1B5-E0_1-mem-ctx- 46%[========> ] 2.61G 39.4MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-1B5-E0_1-mem-ctx-8 46%[========> ] 2.62G 39.3MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1B5-E0_1-mem-ctx-8k 46%[========> ] 2.64G 40.0MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "B5-E0_1-mem-ctx-8k. 
46%[========> ] 2.64G 38.5MB/s eta 73s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-E0_1-mem-ctx-8k.p 46%[========> ] 2.65G 40.5MB/s eta 73s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 47%[========> ] 2.67G 40.0MB/s eta 73s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 47%[========> ] 2.68G 41.5MB/s eta 73s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 47%[========> ] 2.69G 41.1MB/s eta 73s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 47%[========> ] 2.70G 38.8MB/s eta 71s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 47%[========> ] 2.71G 41.2MB/s eta 71s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 48%[========> ] 2.71G 42.5MB/s eta 71s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 48%[========> ] 2.72G 45.5MB/s eta 71s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 48%[========> ] 2.73G 42.6MB/s eta 71s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 48%[========> ] 2.74G 41.7MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 48%[========> ] 2.75G 44.8MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 48%[========> ] 2.76G 44.6MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 49%[========> ] 2.77G 42.7MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 49%[========> ] 2.79G 44.0MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 49%[========> ] 2.81G 45.8MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 49%[========> ] 2.81G 47.1MB/s eta 68s " ] 
}, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 49%[========> ] 2.82G 41.1MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 50%[=========> ] 2.83G 42.8MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 50%[=========> ] 2.85G 43.0MB/s eta 67s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 50%[=========> ] 2.86G 45.6MB/s eta 67s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 50%[=========> ] 2.88G 46.0MB/s eta 67s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 51%[=========> ] 2.89G 47.7MB/s eta 67s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " E 51%[=========> ] 2.90G 47.0MB/s eta 66s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EW 51%[=========> ] 2.91G 47.1MB/s eta 66s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR 51%[=========> ] 2.92G 49.3MB/s eta 66s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR- 51%[=========> ] 2.92G 46.0MB/s eta 66s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1 52%[=========> ] 2.93G 47.6MB/s eta 65s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B 52%[=========> ] 2.95G 47.6MB/s eta 65s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5 52%[=========> ] 2.96G 46.1MB/s eta 65s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5- 52%[=========> ] 2.98G 45.3MB/s eta 64s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E 53%[=========> ] 2.99G 44.4MB/s eta 64s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0 53%[=========> ] 3.00G 42.1MB/s eta 64s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_ 53%[=========> ] 3.01G 43.2MB/s eta 64s " ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "\r", " EWR-1B5-E0_1 53%[=========> ] 3.01G 42.8MB/s eta 64s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1- 53%[=========> ] 3.02G 42.3MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-m 53%[=========> ] 3.04G 42.0MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-me 53%[=========> ] 3.04G 39.4MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem 54%[=========> ] 3.05G 38.4MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem- 54%[=========> ] 3.07G 39.7MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem-c 54%[=========> ] 3.08G 40.7MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "EWR-1B5-E0_1-mem-ct 54%[=========> ] 3.09G 40.4MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "WR-1B5-E0_1-mem-ctx 54%[=========> ] 3.10G 39.0MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "R-1B5-E0_1-mem-ctx- 55%[==========> ] 3.11G 41.6MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-1B5-E0_1-mem-ctx-8 55%[==========> ] 3.13G 39.1MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1B5-E0_1-mem-ctx-8k 55%[==========> ] 3.14G 40.3MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "B5-E0_1-mem-ctx-8k. 
55%[==========> ] 3.16G 41.2MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-E0_1-mem-ctx-8k.p 56%[==========> ] 3.17G 40.5MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 56%[==========> ] 3.17G 40.1MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 56%[==========> ] 3.19G 42.1MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 56%[==========> ] 3.20G 40.8MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 57%[==========> ] 3.22G 42.3MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 57%[==========> ] 3.23G 41.8MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 57%[==========> ] 3.23G 39.6MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 57%[==========> ] 3.25G 38.5MB/s eta 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 57%[==========> ] 3.25G 37.9MB/s eta 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 57%[==========> ] 3.26G 36.7MB/s eta 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 58%[==========> ] 3.28G 40.0MB/s eta 58s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 58%[==========> ] 3.29G 38.9MB/s eta 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 58%[==========> ] 3.31G 40.8MB/s eta 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 58%[==========> ] 3.32G 39.4MB/s eta 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 58%[==========> ] 3.32G 39.4MB/s eta 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 
58%[==========> ] 3.32G 37.4MB/s eta 57s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 59%[==========> ] 3.34G 37.5MB/s eta 56s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 59%[==========> ] 3.35G 36.2MB/s eta 56s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 59%[==========> ] 3.37G 37.6MB/s eta 56s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 59%[==========> ] 3.38G 40.2MB/s eta 56s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 60%[===========> ] 3.40G 39.4MB/s eta 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 60%[===========> ] 3.40G 39.9MB/s eta 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " E 60%[===========> ] 3.41G 41.4MB/s eta 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EW 60%[===========> ] 3.43G 44.3MB/s eta 54s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR 60%[===========> ] 3.44G 43.2MB/s eta 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR- 61%[===========> ] 3.44G 39.0MB/s eta 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1 61%[===========> ] 3.45G 40.3MB/s eta 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B 61%[===========> ] 3.47G 40.4MB/s eta 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5 61%[===========> ] 3.48G 42.0MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5- 61%[===========> ] 3.49G 40.1MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E 62%[===========> ] 3.50G 40.5MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0 62%[===========> ] 3.51G 43.6MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_ 
62%[===========> ] 3.52G 41.1MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1 62%[===========> ] 3.53G 41.0MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1- 62%[===========> ] 3.53G 37.2MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-m 62%[===========> ] 3.55G 40.0MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-me 63%[===========> ] 3.56G 39.6MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem 63%[===========> ] 3.58G 41.2MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem- 63%[===========> ] 3.59G 39.2MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem-c 63%[===========> ] 3.59G 38.2MB/s eta 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "EWR-1B5-E0_1-mem-ct 63%[===========> ] 3.61G 38.4MB/s eta 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "WR-1B5-E0_1-mem-ctx 63%[===========> ] 3.61G 36.7MB/s eta 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "R-1B5-E0_1-mem-ctx- 64%[===========> ] 3.62G 36.4MB/s eta 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-1B5-E0_1-mem-ctx-8 64%[===========> ] 3.63G 39.5MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1B5-E0_1-mem-ctx-8k 64%[===========> ] 3.64G 37.0MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "B5-E0_1-mem-ctx-8k. 
64%[===========> ] 3.65G 35.4MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-E0_1-mem-ctx-8k.p 64%[===========> ] 3.67G 37.0MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 65%[============> ] 3.67G 37.2MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 65%[============> ] 3.68G 36.3MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 65%[============> ] 3.70G 37.2MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 65%[============> ] 3.71G 38.7MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 65%[============> ] 3.72G 41.4MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 66%[============> ] 3.72G 38.7MB/s eta 47s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 66%[============> ] 3.74G 38.7MB/s eta 47s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 66%[============> ] 3.75G 42.7MB/s eta 47s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 66%[============> ] 3.77G 45.0MB/s eta 47s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 67%[============> ] 3.78G 45.9MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 67%[============> ] 3.80G 47.1MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 67%[============> ] 3.80G 44.4MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 67%[============> ] 3.81G 47.1MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 67%[============> ] 3.83G 47.4MB/s eta 44s " ] }, { "name": "stdout", "output_type": "stream", 
"text": [ "\r", "8k.pth 68%[============> ] 3.84G 46.5MB/s eta 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 68%[============> ] 3.86G 48.3MB/s eta 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 68%[============> ] 3.87G 50.8MB/s eta 44s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 68%[============> ] 3.87G 45.6MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 68%[============> ] 3.89G 47.4MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 69%[============> ] 3.90G 46.5MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 69%[============> ] 3.92G 45.8MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " E 69%[============> ] 3.93G 47.5MB/s eta 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EW 69%[============> ] 3.95G 47.3MB/s eta 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR 70%[=============> ] 3.96G 47.2MB/s eta 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR- 70%[=============> ] 3.98G 47.1MB/s eta 42s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1 70%[=============> ] 3.99G 46.7MB/s eta 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B 70%[=============> ] 3.99G 46.8MB/s eta 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5 71%[=============> ] 4.01G 47.6MB/s eta 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5- 71%[=============> ] 4.02G 46.1MB/s eta 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E 71%[=============> ] 4.04G 47.1MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0 71%[=============> ] 4.04G 44.9MB/s eta 39s " ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "\r", " EWR-1B5-E0_ 71%[=============> ] 4.05G 43.9MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1 71%[=============> ] 4.05G 42.3MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1- 72%[=============> ] 4.07G 43.7MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-m 72%[=============> ] 4.08G 45.2MB/s eta 38s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-me 72%[=============> ] 4.10G 43.4MB/s eta 38s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem 72%[=============> ] 4.11G 44.8MB/s eta 38s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem- 73%[=============> ] 4.13G 44.4MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem-c 73%[=============> ] 4.14G 45.7MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "EWR-1B5-E0_1-mem-ct 73%[=============> ] 4.15G 43.7MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "WR-1B5-E0_1-mem-ctx 73%[=============> ] 4.16G 43.0MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "R-1B5-E0_1-mem-ctx- 73%[=============> ] 4.16G 43.0MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-1B5-E0_1-mem-ctx-8 73%[=============> ] 4.17G 38.8MB/s eta 36s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1B5-E0_1-mem-ctx-8k 74%[=============> ] 4.19G 39.7MB/s eta 36s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "B5-E0_1-mem-ctx-8k. 
74%[=============> ] 4.19G 37.9MB/s eta 36s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-E0_1-mem-ctx-8k.p 74%[=============> ] 4.20G 40.7MB/s eta 36s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 74%[=============> ] 4.22G 38.7MB/s eta 35s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 74%[=============> ] 4.23G 39.7MB/s eta 35s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 74%[=============> ] 4.23G 36.9MB/s eta 35s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 75%[==============> ] 4.24G 36.4MB/s eta 35s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 75%[==============> ] 4.25G 33.9MB/s eta 35s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 75%[==============> ] 4.26G 37.3MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 75%[==============> ] 4.26G 33.7MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 75%[==============> ] 4.28G 33.8MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 76%[==============> ] 4.29G 37.0MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 76%[==============> ] 4.31G 38.3MB/s eta 33s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 76%[==============> ] 4.32G 38.8MB/s eta 33s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 76%[==============> ] 4.33G 39.8MB/s eta 33s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 77%[==============> ] 4.35G 39.3MB/s eta 33s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 77%[==============> ] 4.35G 39.1MB/s eta 31s " ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "\r", "8k.pth 77%[==============> ] 4.36G 41.5MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 77%[==============> ] 4.37G 39.0MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 77%[==============> ] 4.38G 39.8MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 77%[==============> ] 4.39G 42.4MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 77%[==============> ] 4.40G 41.6MB/s eta 30s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 78%[==============> ] 4.41G 41.9MB/s eta 30s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 78%[==============> ] 4.42G 42.7MB/s eta 30s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " E 78%[==============> ] 4.42G 39.5MB/s eta 30s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EW 78%[==============> ] 4.44G 41.8MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR 78%[==============> ] 4.46G 43.6MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR- 79%[==============> ] 4.47G 43.6MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1 79%[==============> ] 4.48G 44.1MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B 79%[==============> ] 4.50G 41.2MB/s eta 28s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5 79%[==============> ] 4.50G 41.8MB/s eta 28s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5- 79%[==============> ] 4.51G 42.8MB/s eta 28s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E 80%[===============> ] 4.53G 44.4MB/s eta 28s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0 80%[===============> ] 4.54G 
45.8MB/s eta 27s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_ 80%[===============> ] 4.56G 45.6MB/s eta 27s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1 81%[===============> ] 4.57G 45.7MB/s eta 27s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1- 81%[===============> ] 4.57G 41.8MB/s eta 27s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-m 81%[===============> ] 4.58G 43.0MB/s eta 26s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-me 81%[===============> ] 4.59G 42.0MB/s eta 26s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem 81%[===============> ] 4.60G 44.0MB/s eta 26s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem- 81%[===============> ] 4.62G 44.3MB/s eta 26s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem-c 81%[===============> ] 4.62G 44.2MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "EWR-1B5-E0_1-mem-ct 82%[===============> ] 4.63G 43.3MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "WR-1B5-E0_1-mem-ctx 82%[===============> ] 4.63G 41.0MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "R-1B5-E0_1-mem-ctx- 82%[===============> ] 4.65G 41.0MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-1B5-E0_1-mem-ctx-8 82%[===============> ] 4.66G 40.5MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1B5-E0_1-mem-ctx-8k 82%[===============> ] 4.66G 39.2MB/s eta 24s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "B5-E0_1-mem-ctx-8k. 
82%[===============> ] 4.68G 40.9MB/s eta 24s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-E0_1-mem-ctx-8k.p 83%[===============> ] 4.69G 40.1MB/s eta 24s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 83%[===============> ] 4.70G 38.9MB/s eta 24s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 83%[===============> ] 4.71G 39.6MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 83%[===============> ] 4.71G 37.2MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 83%[===============> ] 4.72G 36.7MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 83%[===============> ] 4.74G 39.8MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 84%[===============> ] 4.75G 42.6MB/s eta 22s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 84%[===============> ] 4.75G 40.3MB/s eta 22s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 84%[===============> ] 4.77G 40.6MB/s eta 22s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 84%[===============> ] 4.78G 40.8MB/s eta 22s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 84%[===============> ] 4.78G 38.1MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 85%[================> ] 4.80G 40.7MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 85%[================> ] 4.81G 41.0MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 85%[================> ] 4.83G 43.0MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 85%[================> ] 4.84G 42.3MB/s eta 19s " 
] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 86%[================> ] 4.86G 43.2MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 86%[================> ] 4.86G 41.5MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 86%[================> ] 4.88G 44.0MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 86%[================> ] 4.89G 43.8MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 86%[================> ] 4.89G 41.2MB/s eta 18s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 86%[================> ] 4.90G 41.5MB/s eta 18s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 86%[================> ] 4.90G 42.0MB/s eta 18s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " E 87%[================> ] 4.92G 41.3MB/s eta 18s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EW 87%[================> ] 4.93G 40.9MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR 87%[================> ] 4.95G 41.4MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR- 87%[================> ] 4.96G 41.3MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1 88%[================> ] 4.97G 40.8MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B 88%[================> ] 4.98G 40.8MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5 88%[================> ] 4.99G 44.3MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5- 88%[================> ] 4.99G 41.2MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E 88%[================> ] 5.01G 41.5MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", 
"text": [ "\r", " EWR-1B5-E0 88%[================> ] 5.02G 41.3MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_ 89%[================> ] 5.04G 42.0MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1 89%[================> ] 5.04G 38.3MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1- 89%[================> ] 5.05G 41.0MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-m 89%[================> ] 5.07G 40.1MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-me 90%[=================> ] 5.08G 39.3MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem 90%[=================> ] 5.09G 42.3MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem- 90%[=================> ] 5.10G 42.4MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem-c 90%[=================> ] 5.11G 42.5MB/s eta 13s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "EWR-1B5-E0_1-mem-ct 90%[=================> ] 5.13G 43.3MB/s eta 13s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "WR-1B5-E0_1-mem-ctx 91%[=================> ] 5.14G 43.5MB/s eta 13s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "R-1B5-E0_1-mem-ctx- 91%[=================> ] 5.15G 44.4MB/s eta 13s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-1B5-E0_1-mem-ctx-8 91%[=================> ] 5.16G 43.3MB/s eta 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1B5-E0_1-mem-ctx-8k 91%[=================> ] 5.17G 44.0MB/s eta 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "B5-E0_1-mem-ctx-8k. 
91%[=================> ] 5.18G 42.9MB/s eta 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-E0_1-mem-ctx-8k.p 91%[=================> ] 5.19G 42.8MB/s eta 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 92%[=================> ] 5.20G 42.4MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 92%[=================> ] 5.21G 43.0MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 92%[=================> ] 5.23G 44.3MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 92%[=================> ] 5.24G 47.5MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 92%[=================> ] 5.25G 44.5MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 93%[=================> ] 5.26G 42.8MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 93%[=================> ] 5.27G 43.3MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 93%[=================> ] 5.28G 43.9MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 93%[=================> ] 5.29G 43.5MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 93%[=================> ] 5.30G 42.6MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 93%[=================> ] 5.30G 39.5MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 94%[=================> ] 5.32G 41.6MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 94%[=================> ] 5.33G 40.0MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 94%[=================> ] 5.35G 
41.7MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 95%[==================> ] 5.36G 43.6MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 95%[==================> ] 5.38G 42.7MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 95%[==================> ] 5.38G 43.0MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 95%[==================> ] 5.39G 43.0MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 95%[==================> ] 5.41G 42.4MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 96%[==================> ] 5.42G 43.4MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 96%[==================> ] 5.44G 43.4MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " E 96%[==================> ] 5.44G 44.0MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EW 96%[==================> ] 5.45G 43.9MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR 96%[==================> ] 5.47G 42.4MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR- 96%[==================> ] 5.47G 39.9MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1 97%[==================> ] 5.48G 43.2MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B 97%[==================> ] 5.50G 43.1MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5 97%[==================> ] 5.50G 42.9MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5- 97%[==================> ] 5.51G 41.6MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E 97%[==================> ] 5.53G 44.0MB/s eta 3s " ] }, { "name": 
"stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0 98%[==================> ] 5.53G 42.1MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_ 98%[==================> ] 5.54G 41.1MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1 98%[==================> ] 5.54G 39.0MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1- 98%[==================> ] 5.56G 39.8MB/s eta 2s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-m 98%[==================> ] 5.57G 38.9MB/s eta 2s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-me 98%[==================> ] 5.58G 38.8MB/s eta 2s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem 99%[==================> ] 5.59G 36.4MB/s eta 2s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem- 99%[==================> ] 5.60G 39.1MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " EWR-1B5-E0_1-mem-c 99%[==================> ] 5.62G 38.1MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "EWR-1B5-E0_1-mem-ct 99%[==================> ] 5.63G 41.0MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "WR-1B5-E0_1-mem-ctx 99%[==================> ] 5.64G 40.3MB/s eta 1s \r", "EWR-1B5-E0_1-mem-ct 100%[===================>] 5.64G 40.6MB/s in 2m 17s \r\n", "\r\n", "2023-09-05 20:02:49 (42.0 MB/s) - ‘EWR-1B5-E0_1-mem-ctx-8k.pth’ saved [6060483163/6060483163]\r\n", "\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "--2023-09-05 20:02:49-- https://huggingface.co/rwkv-x-dev/rwkv-x-playground/resolve/main/experiment/rwkv-x-exp/v5-slim-memory/v5-L6-D1024-E0_1-mem-ctx-8k.pth\r\n", "Resolving huggingface.co (huggingface.co)... 
18.154.227.69, 18.154.227.87, 18.154.227.67, ...\r\n", "Connecting to huggingface.co (huggingface.co)|18.154.227.69|:443... connected.\r\n", "HTTP request sent, awaiting response... 302 Found\r\n", "Location: https://cdn-lfs.huggingface.co/repos/2e/f7/2ef78555202aa92abdbdf476ce3d0fd5a8b15f7245edf0b80d4d30572355f30d/cefa72363bb7dfddb34723de3848f3cc5116c1ff15481f5562317058324b8bf0?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D1024-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D1024-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203370&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzM3MH19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy8yZS9mNy8yZWY3ODU1NTIwMmFhOTJhYmRiZGY0NzZjZTNkMGZkNWE4YjE1ZjcyNDVlZGYwYjgwZDRkMzA1NzIzNTVmMzBkL2NlZmE3MjM2M2JiN2RmZGRiMzQ3MjNkZTM4NDhmM2NjNTExNmMxZmYxNTQ4MWY1NTYyMzE3MDU4MzI0YjhiZjA%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=B66WcOta7appV-JHHd-jMXu8SQjsoaHZFUDZQKrIz-elqYAFJYJb6m1qE2l6RR8yfASI8EA1iiSMO4ht-ToSA%7Eh5w827hJ5jknceswiSmp3dsP8R%7ERv3v79%7EPhXM26Mm0s1RiOhcwWAqJtECD4bFLqx6Ejh978NbajGhvZ08YBZx8aNA2ZPkfx8lK5ozeBRIoQI1NsQivS3r5uFuoe6aEe00iBVYuhSPP6DDtRa1NbEoF6ak4YWTqF6QED3U9Vp899VrgVJZzaEjJcE%7E2Aw6xywAiyfMmRFuG-QbfQ3zD93vVIFKVBaKgXtLNLsXq9OPn2pdMRV-IUKtGvJ2s-zjKA__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", "--2023-09-05 20:02:50-- 
https://cdn-lfs.huggingface.co/repos/2e/f7/2ef78555202aa92abdbdf476ce3d0fd5a8b15f7245edf0b80d4d30572355f30d/cefa72363bb7dfddb34723de3848f3cc5116c1ff15481f5562317058324b8bf0?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D1024-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D1024-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203370&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzM3MH19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy8yZS9mNy8yZWY3ODU1NTIwMmFhOTJhYmRiZGY0NzZjZTNkMGZkNWE4YjE1ZjcyNDVlZGYwYjgwZDRkMzA1NzIzNTVmMzBkL2NlZmE3MjM2M2JiN2RmZGRiMzQ3MjNkZTM4NDhmM2NjNTExNmMxZmYxNTQ4MWY1NTYyMzE3MDU4MzI0YjhiZjA%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=B66WcOta7appV-JHHd-jMXu8SQjsoaHZFUDZQKrIz-elqYAFJYJb6m1qE2l6RR8yfASI8EA1iiSMO4ht-ToSA%7Eh5w827hJ5jknceswiSmp3dsP8R%7ERv3v79%7EPhXM26Mm0s1RiOhcwWAqJtECD4bFLqx6Ejh978NbajGhvZ08YBZx8aNA2ZPkfx8lK5ozeBRIoQI1NsQivS3r5uFuoe6aEe00iBVYuhSPP6DDtRa1NbEoF6ak4YWTqF6QED3U9Vp899VrgVJZzaEjJcE%7E2Aw6xywAiyfMmRFuG-QbfQ3zD93vVIFKVBaKgXtLNLsXq9OPn2pdMRV-IUKtGvJ2s-zjKA__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.49, 108.138.64.36, 108.138.64.111, ...\r\n", "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.49|:443... " ] }, { "name": "stdout", "output_type": "stream", "text": [ "connected.\r\n", "HTTP request sent, awaiting response... 
" ] }, { "name": "stdout", "output_type": "stream", "text": [ "200 OK\r\n", "Length: 369696005 (353M) [binary/octet-stream]\r\n", "Saving to: ‘v5-L6-D1024-E0_1-mem-ctx-8k.pth’\r\n", "\r\n", "\r", " v5-L6-D10 0%[ ] 0 --.-KB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D102 4%[ ] 15.26M 46.1MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D1024 8%[> ] 30.52M 54.1MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D1024- 12%[=> ] 45.78M 56.2MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D1024-E 17%[==> ] 61.03M 57.1MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D1024-E0 21%[===> ] 76.29M 55.7MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D1024-E0_ 25%[====> ] 91.55M 54.7MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D1024-E0_1 30%[=====> ] 106.81M 55.6MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D1024-E0_1- 34%[=====> ] 121.56M 55.5MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D1024-E0_1-m 38%[======> ] 135.50M 53.9MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "v5-L6-D1024-E0_1-me 42%[=======> ] 151.33M 55.8MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-L6-D1024-E0_1-mem 43%[=======> ] 152.59M 50.9MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-L6-D1024-E0_1-mem- 47%[========> ] 167.85M 52.2MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "L6-D1024-E0_1-mem-c 50%[=========> ] 178.41M 52.2MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-D1024-E0_1-mem-ct 56%[==========> ] 197.85M 52.5MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-D1024-E0_1-mem-ctx 60%[===========> ] 211.79M 51.6MB/s eta 
3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "D1024-E0_1-mem-ctx- 64%[===========> ] 228.36M 51.2MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1024-E0_1-mem-ctx-8 66%[============> ] 233.06M 46.8MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "024-E0_1-mem-ctx-8k 69%[============> ] 244.13M 46.8MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "24-E0_1-mem-ctx-8k. 73%[=============> ] 259.40M 47.5MB/s eta 2s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "4-E0_1-mem-ctx-8k.p 77%[==============> ] 274.14M 45.4MB/s eta 2s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 77%[==============> ] 274.66M 44.1MB/s eta 2s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 82%[===============> ] 289.40M 43.7MB/s eta 2s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 86%[================> ] 304.40M 45.0MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 86%[================> ] 305.79M 43.9MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 90%[=================> ] 320.43M 44.2MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 95%[==================> ] 335.69M 43.9MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 99%[==================> ] 350.44M 46.2MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "v5-L6-D1024-E0_1-me 100%[===================>] 352.57M 45.4MB/s in 7.4s \r\n", "\r\n", "2023-09-05 20:02:57 (47.6 MB/s) - ‘v5-L6-D1024-E0_1-mem-ctx-8k.pth’ saved [369696005/369696005]\r\n", "\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "--2023-09-05 20:02:57-- 
https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/v5-L6-D2048-E0_1-mem-ctx-8k.pth\r\n", "Resolving huggingface.co (huggingface.co)... 18.154.227.7, 18.154.227.67, 18.154.227.87, ...\r\n", "Connecting to huggingface.co (huggingface.co)|18.154.227.7|:443... connected.\r\n", "HTTP request sent, awaiting response... 302 Found\r\n", "Location: https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/87b64f45529c2049a8b044b7e7c0338a9ede8ba8259d17d987d8e73f8a34fd75?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D2048-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D2048-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203377&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzM3N319LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwLzg3YjY0ZjQ1NTI5YzIwNDlhOGIwNDRiN2U3YzAzMzhhOWVkZThiYTgyNTlkMTdkOTg3ZDhlNzNmOGEzNGZkNzU%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=VBYbW8z%7E9JBNguL51PviRfIlJ54YdlKEx91Ga02bS1bpaMTycJmWk-xv5BrCaiZzsDoosmbz7lPmOAAXRwEaLLn%7EpoS9cb5XHy3KTfp8ndxX7bqjKg3SYSf9P9po2RrS-50MBgszD2UFbjP7RWDf6GDRX7NHvHRXrKQ9DajMDZXByKypfrrMreWxQcsgaqJGEzco-tJYdyQO1JsjD8tTHFTQQd2R3DeHLlV1k8vAoxSg%7EkHse1nL4%7Ej68Z84lamLLL4rrO6qn2Lmh5KwDlTa76KCe5nID22ULDapKaGQr2grYb7qVEYGfXbHjoOxT63Ma82a6NWGRLMTR24M89v9Hg__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", "--2023-09-05 20:02:57-- 
https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/87b64f45529c2049a8b044b7e7c0338a9ede8ba8259d17d987d8e73f8a34fd75?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D2048-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D2048-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203377&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzM3N319LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwLzg3YjY0ZjQ1NTI5YzIwNDlhOGIwNDRiN2U3YzAzMzhhOWVkZThiYTgyNTlkMTdkOTg3ZDhlNzNmOGEzNGZkNzU%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=VBYbW8z%7E9JBNguL51PviRfIlJ54YdlKEx91Ga02bS1bpaMTycJmWk-xv5BrCaiZzsDoosmbz7lPmOAAXRwEaLLn%7EpoS9cb5XHy3KTfp8ndxX7bqjKg3SYSf9P9po2RrS-50MBgszD2UFbjP7RWDf6GDRX7NHvHRXrKQ9DajMDZXByKypfrrMreWxQcsgaqJGEzco-tJYdyQO1JsjD8tTHFTQQd2R3DeHLlV1k8vAoxSg%7EkHse1nL4%7Ej68Z84lamLLL4rrO6qn2Lmh5KwDlTa76KCe5nID22ULDapKaGQr2grYb7qVEYGfXbHjoOxT63Ma82a6NWGRLMTR24M89v9Hg__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.121, 108.138.64.111, 108.138.64.49, ...\r\n", "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.121|:443... connected.\r\n", "HTTP request sent, awaiting response... 
" ] }, { "name": "stdout", "output_type": "stream", "text": [ "200 OK\r\n", "Length: 1066508293 (1017M) [binary/octet-stream]\r\n", "Saving to: ‘v5-L6-D2048-E0_1-mem-ctx-8k.pth’\r\n", "\r\n", "\r", " v5-L6-D20 0%[ ] 0 --.-KB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D204 1%[ ] 13.43M 64.2MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048 2%[ ] 25.33M 61.9MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048- 3%[ ] 30.52M 44.1MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048-E 4%[ ] 45.78M 44.3MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048-E0 5%[> ] 60.75M 49.3MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048-E0_ 6%[> ] 61.03M 42.1MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048-E0_1 7%[> ] 76.29M 43.8MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048-E0_1- 8%[> ] 89.73M 42.1MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048-E0_1-m 10%[=> ] 101.80M 43.4MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "v5-L6-D2048-E0_1-me 10%[=> ] 107.72M 42.3MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-L6-D2048-E0_1-mem 11%[=> ] 121.56M 43.4MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-L6-D2048-E0_1-mem- 12%[=> ] 122.16M 40.7MB/s eta 22s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "L6-D2048-E0_1-mem-c 13%[=> ] 136.81M 41.9MB/s eta 22s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-D2048-E0_1-mem-ct 14%[=> ] 150.76M 40.9MB/s eta 22s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-D2048-E0_1-mem-ctx 16%[==> ] 165.33M 42.5MB/s eta 22s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", 
"D2048-E0_1-mem-ctx- 16%[==> ] 167.85M 39.9MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "2048-E0_1-mem-ctx-8 18%[==> ] 183.10M 39.5MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "048-E0_1-mem-ctx-8k 19%[==> ] 198.36M 39.8MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "48-E0_1-mem-ctx-8k. 20%[===> ] 213.11M 42.3MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8-E0_1-mem-ctx-8k.p 21%[===> ] 219.93M 40.2MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 23%[===> ] 241.44M 44.2MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 24%[===> ] 244.13M 41.1MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 25%[====> ] 259.40M 43.1MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 27%[====> ] 274.66M 44.2MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 28%[====> ] 289.40M 44.4MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 28%[====> ] 289.92M 41.9MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 29%[====> ] 304.66M 44.7MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 30%[=====> ] 305.30M 41.8MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 31%[=====> ] 320.43M 42.4MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 32%[=====> ] 335.18M 42.2MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 33%[=====> ] 341.75M 43.2MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 34%[=====> ] 350.95M 
40.9MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 36%[======> ] 366.20M 41.3MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 37%[======> ] 380.96M 41.4MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 38%[======> ] 394.91M 41.0MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 40%[=======> ] 410.16M 40.6MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 40%[=======> ] 411.99M 37.7MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 41%[=======> ] 426.73M 40.1MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 42%[=======> ] 429.87M 36.9MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 43%[=======> ] 441.98M 37.4MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 44%[=======> ] 451.07M 39.7MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v 45%[========> ] 457.76M 37.2MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5 46%[========> ] 473.02M 40.3MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5- 48%[========> ] 488.28M 41.4MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L 49%[========> ] 503.03M 41.6MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6 50%[=========> ] 516.97M 43.5MB/s eta 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6- 52%[=========> ] 533.54M 44.0MB/s eta 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D 53%[=========> ] 548.80M 44.6MB/s eta 12s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2 55%[==========> ] 559.55M 43.8MB/s eta 12s " ] }, { "name": 
"stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D20 55%[==========> ] 564.58M 42.1MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D204 57%[==========> ] 579.83M 42.9MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048 57%[==========> ] 585.02M 41.6MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048- 58%[==========> ] 595.09M 42.7MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048-E 60%[===========> ] 610.35M 42.0MB/s eta 10s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048-E0 61%[===========> ] 625.61M 45.2MB/s eta 10s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048-E0_ 63%[===========> ] 640.87M 45.4MB/s eta 10s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048-E0_1 63%[===========> ] 647.18M 46.0MB/s eta 10s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048-E0_1- 64%[===========> ] 655.62M 43.9MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D2048-E0_1-m 64%[===========> ] 656.34M 41.0MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "v5-L6-D2048-E0_1-me 65%[============> ] 669.55M 43.4MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-L6-D2048-E0_1-mem 67%[============> ] 684.58M 44.3MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-L6-D2048-E0_1-mem- 67%[============> ] 686.77M 41.8MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "L6-D2048-E0_1-mem-c 69%[============> ] 701.90M 42.6MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-D2048-E0_1-mem-ct 70%[=============> ] 717.16M 43.7MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", 
"-D2048-E0_1-mem-ctx 72%[=============> ] 732.42M 44.5MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "D2048-E0_1-mem-ctx- 73%[=============> ] 747.69M 42.8MB/s eta 8s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "2048-E0_1-mem-ctx-8 74%[=============> ] 762.42M 44.6MB/s eta 6s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "048-E0_1-mem-ctx-8k 76%[==============> ] 774.55M 44.9MB/s eta 6s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "48-E0_1-mem-ctx-8k. 76%[==============> ] 778.20M 43.6MB/s eta 6s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8-E0_1-mem-ctx-8k.p 78%[==============> ] 793.46M 43.0MB/s eta 6s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 79%[==============> ] 808.71M 45.2MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 80%[===============> ] 823.46M 43.2MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 81%[===============> ] 824.22M 40.6MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 82%[===============> ] 839.23M 41.4MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 84%[===============> ] 854.49M 42.6MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 85%[================> ] 869.75M 45.3MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 87%[================> ] 885.01M 44.5MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 87%[================> ] 892.69M 43.8MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 88%[================> ] 900.27M 42.5MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ 
"\r", "-ctx-8k.pth 90%[=================> ] 915.53M 42.7MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 91%[=================> ] 930.78M 42.2MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 93%[=================> ] 946.04M 43.3MB/s eta 2s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 94%[=================> ] 961.30M 43.7MB/s eta 2s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 96%[==================> ] 976.55M 45.9MB/s eta 2s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 97%[==================> ] 991.31M 44.9MB/s eta 2s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 97%[==================> ] 993.88M 43.3MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 99%[==================> ] 1007M 43.3MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 99%[==================> ] 1016M 42.5MB/s eta 1s \r", "v5-L6-D2048-E0_1-me 100%[===================>] 1017M 42.8MB/s in 24s \r\n", "\r\n", "2023-09-05 20:03:21 (42.8 MB/s) - ‘v5-L6-D2048-E0_1-mem-ctx-8k.pth’ saved [1066508293/1066508293]\r\n", "\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "--2023-09-05 20:03:22-- https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/v5-L6-D4096-E0_1-mem-ctx-8k.pth\r\n", "Resolving huggingface.co (huggingface.co)... 18.154.227.69, 18.154.227.7, 18.154.227.67, ...\r\n", "Connecting to huggingface.co (huggingface.co)|18.154.227.69|:443... connected.\r\n", "HTTP request sent, awaiting response... 
302 Found\r\n", "Location: https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/5f93b1f6f6f7fb2193130a3a51f8ed41a0541b1b5eab100ca9318c8218d481fa?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D4096-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D4096-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203402&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzQwMn19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwLzVmOTNiMWY2ZjZmN2ZiMjE5MzEzMGEzYTUxZjhlZDQxYTA1NDFiMWI1ZWFiMTAwY2E5MzE4YzgyMThkNDgxZmE%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=kCsh5tzkI71pVRmfZsPhC0oiMlNdvC32eUOBVomz04o7staDhD2mIy6e9QqNHRsXMGyb1w1x8zQwRSuXSfWfo1LvvIkiIevIPEm6FGcRQhtkf9erytEqdKZatuYT-PBOlLBy%7EDrXG96JnUuXbDo9CTezywZTuYWQImQgZL2u5J3qHyUHcUbMiM8UwyVky4zy8XyGHBFFSvmIh3OygZOTofjkBuVZU78x0lbd-5xkf-UGRfm9bQLyHilkPWhulkTXE2M8XUYTbfJEfrwUyZi94%7EqXEqn7kX37bkywoVTOgmO-yBTF0R6uFjbm3r8lz7fM7Ww5wrblit2Clim6TTprww__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", "--2023-09-05 20:03:22-- 
https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/5f93b1f6f6f7fb2193130a3a51f8ed41a0541b1b5eab100ca9318c8218d481fa?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D4096-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D4096-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203402&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzQwMn19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwLzVmOTNiMWY2ZjZmN2ZiMjE5MzEzMGEzYTUxZjhlZDQxYTA1NDFiMWI1ZWFiMTAwY2E5MzE4YzgyMThkNDgxZmE%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=kCsh5tzkI71pVRmfZsPhC0oiMlNdvC32eUOBVomz04o7staDhD2mIy6e9QqNHRsXMGyb1w1x8zQwRSuXSfWfo1LvvIkiIevIPEm6FGcRQhtkf9erytEqdKZatuYT-PBOlLBy%7EDrXG96JnUuXbDo9CTezywZTuYWQImQgZL2u5J3qHyUHcUbMiM8UwyVky4zy8XyGHBFFSvmIh3OygZOTofjkBuVZU78x0lbd-5xkf-UGRfm9bQLyHilkPWhulkTXE2M8XUYTbfJEfrwUyZi94%7EqXEqn7kX37bkywoVTOgmO-yBTF0R6uFjbm3r8lz7fM7Ww5wrblit2Clim6TTprww__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.36, 108.138.64.49, 108.138.64.111, ...\r\n", "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.36|:443... connected.\r\n", "HTTP request sent, awaiting response... 
" ] }, { "name": "stdout", "output_type": "stream", "text": [ "200 OK\r\n", "Length: 3441599237 (3.2G) [binary/octet-stream]\r\n", "Saving to: ‘v5-L6-D4096-E0_1-mem-ctx-8k.pth’\r\n", "\r\n", "\r", " v5-L6-D40 0%[ ] 0 --.-KB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D409 0%[ ] 13.43M 62.3MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096 0%[ ] 28.00M 67.3MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096- 0%[ ] 30.52M 42.9MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E 1%[ ] 45.78M 43.6MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0 1%[ ] 61.03M 43.9MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_ 2%[ ] 71.57M 45.0MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1 2%[ ] 85.74M 47.9MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1- 2%[ ] 91.55M 44.8MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1-m 3%[ ] 106.77M 47.6MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "v5-L6-D4096-E0_1-me 3%[ ] 115.21M 47.2MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-L6-D4096-E0_1-mem 3%[ ] 120.25M 44.1MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-L6-D4096-E0_1-mem- 3%[ ] 129.42M 44.2MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "L6-D4096-E0_1-mem-c 4%[ ] 137.33M 41.8MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-D4096-E0_1-mem-ct 4%[ ] 152.59M 42.4MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-D4096-E0_1-mem-ctx 5%[> ] 167.33M 43.6MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "D4096-E0_1-mem-ctx- 5%[> ] 174.16M 42.9MB/s 
eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "4096-E0_1-mem-ctx-8 5%[> ] 182.59M 42.8MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "096-E0_1-mem-ctx-8k 5%[> ] 185.73M 41.5MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "96-E0_1-mem-ctx-8k. 6%[> ] 198.36M 40.7MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-E0_1-mem-ctx-8k.p 6%[> ] 213.62M 41.7MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 6%[> ] 228.87M 42.3MB/s eta 75s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 7%[> ] 243.63M 43.6MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 7%[> ] 258.62M 46.3MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 7%[> ] 259.40M 41.1MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 8%[> ] 274.66M 40.4MB/s eta 70s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 8%[> ] 289.92M 42.5MB/s eta 69s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 9%[> ] 305.18M 43.4MB/s eta 69s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 9%[> ] 320.43M 43.6MB/s eta 69s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 10%[=> ] 335.69M 44.6MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 10%[=> ] 350.44M 43.4MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 10%[=> ] 359.99M 42.6MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 11%[=> ] 366.20M 42.2MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 11%[=> ] 381.47M 
42.4MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 12%[=> ] 396.22M 43.9MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 12%[=> ] 396.73M 40.1MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 12%[=> ] 410.16M 42.8MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 13%[=> ] 426.73M 43.4MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 13%[=> ] 427.25M 40.1MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 13%[=> ] 441.98M 42.4MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 13%[=> ] 442.51M 39.2MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 13%[=> ] 457.24M 42.1MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v 14%[=> ] 465.94M 41.5MB/s eta 68s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5 14%[=> ] 482.89M 42.7MB/s eta 65s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5- 14%[=> ] 488.28M 38.8MB/s eta 65s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L 15%[==> ] 503.54M 41.0MB/s eta 65s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6 15%[==> ] 518.80M 41.1MB/s eta 65s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6- 16%[==> ] 534.05M 42.8MB/s eta 64s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D 16%[==> ] 548.80M 45.4MB/s eta 64s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4 16%[==> ] 557.75M 43.5MB/s eta 64s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D40 17%[==> ] 564.58M 43.4MB/s eta 64s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D409 17%[==> ] 579.31M 44.7MB/s eta 64s " ] }, { 
"name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096 17%[==> ] 582.81M 43.2MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096- 18%[==> ] 594.57M 44.6MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E 18%[==> ] 597.15M 41.9MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0 18%[==> ] 609.84M 41.8MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_ 18%[==> ] 615.55M 42.3MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1 19%[==> ] 625.61M 40.8MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1- 19%[==> ] 640.87M 42.8MB/s eta 63s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1-m 19%[==> ] 656.13M 39.5MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "v5-L6-D4096-E0_1-me 20%[===> ] 670.87M 42.4MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-L6-D4096-E0_1-mem 20%[===> ] 671.38M 38.6MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-L6-D4096-E0_1-mem- 20%[===> ] 686.13M 39.8MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "L6-D4096-E0_1-mem-c 21%[===> ] 700.08M 40.0MB/s eta 62s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-D4096-E0_1-mem-ct 21%[===> ] 708.71M 38.7MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-D4096-E0_1-mem-ctx 21%[===> ] 717.16M 37.1MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "D4096-E0_1-mem-ctx- 22%[===> ] 732.42M 37.2MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "4096-E0_1-mem-ctx-8 22%[===> ] 747.69M 38.9MB/s eta 61s " ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "\r", "096-E0_1-mem-ctx-8k 23%[===> ] 764.04M 40.8MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "96-E0_1-mem-ctx-8k. 23%[===> ] 777.68M 43.5MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-E0_1-mem-ctx-8k.p 23%[===> ] 784.89M 41.8MB/s eta 61s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 24%[===> ] 793.46M 40.1MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 24%[===> ] 808.71M 42.5MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 25%[====> ] 823.97M 41.8MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 25%[====> ] 839.23M 45.2MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 26%[====> ] 854.49M 46.2MB/s eta 59s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 26%[====> ] 869.75M 48.8MB/s eta 56s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 26%[====> ] 885.47M 49.5MB/s eta 56s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 27%[====> ] 899.75M 48.8MB/s eta 56s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 27%[====> ] 900.27M 46.6MB/s eta 56s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 27%[====> ] 915.53M 47.1MB/s eta 55s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 28%[====> ] 930.78M 45.8MB/s eta 55s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 28%[====> ] 946.04M 48.0MB/s eta 55s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 29%[====> ] 961.30M 48.8MB/s eta 55s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 29%[====> ] 975.91M 
48.0MB/s eta 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 29%[====> ] 976.05M 46.0MB/s eta 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 29%[====> ] 983.00M 46.1MB/s eta 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 30%[=====> ] 993.36M 48.3MB/s eta 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 30%[=====> ] 1007M 45.6MB/s eta 53s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 31%[=====> ] 1022M 44.8MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 31%[=====> ] 1.00G 43.5MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 31%[=====> ] 1.01G 40.3MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v 32%[=====> ] 1.03G 42.6MB/s eta 52s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5 32%[=====> ] 1.04G 41.7MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5- 32%[=====> ] 1.06G 42.3MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L 33%[=====> ] 1.07G 45.0MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6 33%[=====> ] 1.08G 43.0MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6- 33%[=====> ] 1.08G 43.7MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D 33%[=====> ] 1.09G 41.8MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4 33%[=====> ] 1.09G 37.4MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D40 34%[=====> ] 1.09G 36.0MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D409 34%[=====> ] 1.10G 37.4MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096 
34%[=====> ] 1.11G 37.0MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096- 34%[=====> ] 1.12G 37.6MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E 35%[======> ] 1.12G 38.8MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0 35%[======> ] 1.13G 36.8MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_ 35%[======> ] 1.15G 36.2MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1 35%[======> ] 1.15G 35.6MB/s eta 51s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1- 36%[======> ] 1.16G 35.8MB/s eta 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1-m 36%[======> ] 1.18G 35.6MB/s eta 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "v5-L6-D4096-E0_1-me 37%[======> ] 1.19G 36.5MB/s eta 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-L6-D4096-E0_1-mem 37%[======> ] 1.20G 34.6MB/s eta 50s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-L6-D4096-E0_1-mem- 37%[======> ] 1.20G 32.8MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "L6-D4096-E0_1-mem-c 37%[======> ] 1.21G 31.2MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-D4096-E0_1-mem-ct 37%[======> ] 1.21G 30.9MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-D4096-E0_1-mem-ctx 38%[======> ] 1.22G 32.1MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "D4096-E0_1-mem-ctx- 38%[======> ] 1.24G 35.1MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "4096-E0_1-mem-ctx-8 39%[======> ] 1.25G 36.4MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "096-E0_1-mem-ctx-8k 
39%[======> ] 1.26G 36.2MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "96-E0_1-mem-ctx-8k. 39%[======> ] 1.27G 34.4MB/s eta 49s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-E0_1-mem-ctx-8k.p 39%[======> ] 1.28G 35.1MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 40%[=======> ] 1.30G 36.5MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 40%[=======> ] 1.31G 36.8MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 41%[=======> ] 1.33G 37.7MB/s eta 48s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 41%[=======> ] 1.34G 40.4MB/s eta 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 41%[=======> ] 1.34G 38.4MB/s eta 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 42%[=======> ] 1.36G 38.0MB/s eta 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 42%[=======> ] 1.37G 40.6MB/s eta 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 43%[=======> ] 1.38G 41.0MB/s eta 46s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 43%[=======> ] 1.38G 40.6MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 43%[=======> ] 1.39G 39.5MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 43%[=======> ] 1.40G 39.8MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 44%[=======> ] 1.41G 41.9MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 44%[=======> ] 1.42G 40.2MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 44%[=======> ] 1.43G 41.6MB/s eta 45s " ] }, { 
"name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 45%[========> ] 1.44G 42.3MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 45%[========> ] 1.45G 43.1MB/s eta 45s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 45%[========> ] 1.46G 42.1MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 46%[========> ] 1.47G 40.9MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 46%[========> ] 1.49G 41.6MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 46%[========> ] 1.50G 44.1MB/s eta 43s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 47%[========> ] 1.52G 44.3MB/s eta 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v 47%[========> ] 1.52G 41.0MB/s eta 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5 47%[========> ] 1.53G 38.9MB/s eta 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5- 48%[========> ] 1.55G 40.5MB/s eta 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L 48%[========> ] 1.55G 40.3MB/s eta 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6 48%[========> ] 1.56G 40.4MB/s eta 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6- 49%[========> ] 1.57G 42.1MB/s eta 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D 49%[========> ] 1.58G 39.5MB/s eta 41s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4 49%[========> ] 1.59G 41.8MB/s eta 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D40 50%[=========> ] 1.61G 41.3MB/s eta 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D409 50%[=========> ] 1.62G 43.3MB/s eta 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", 
" v5-L6-D4096 50%[=========> ] 1.62G 41.8MB/s eta 40s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096- 51%[=========> ] 1.64G 41.1MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E 51%[=========> ] 1.65G 40.7MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0 51%[=========> ] 1.65G 40.6MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_ 51%[=========> ] 1.66G 40.7MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1 52%[=========> ] 1.67G 39.4MB/s eta 39s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1- 52%[=========> ] 1.69G 41.3MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1-m 52%[=========> ] 1.70G 38.2MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "v5-L6-D4096-E0_1-me 53%[=========> ] 1.71G 41.2MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-L6-D4096-E0_1-mem 53%[=========> ] 1.73G 39.5MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-L6-D4096-E0_1-mem- 54%[=========> ] 1.74G 41.7MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "L6-D4096-E0_1-mem-c 54%[=========> ] 1.76G 42.1MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-D4096-E0_1-mem-ct 55%[==========> ] 1.77G 44.3MB/s eta 37s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-D4096-E0_1-mem-ctx 55%[==========> ] 1.79G 45.5MB/s eta 35s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "D4096-E0_1-mem-ctx- 56%[==========> ] 1.80G 46.7MB/s eta 35s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "4096-E0_1-mem-ctx-8 56%[==========> ] 1.80G 44.7MB/s eta 35s " ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "\r", "096-E0_1-mem-ctx-8k 56%[==========> ] 1.82G 44.8MB/s eta 35s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "96-E0_1-mem-ctx-8k. 57%[==========> ] 1.83G 45.5MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-E0_1-mem-ctx-8k.p 57%[==========> ] 1.85G 47.3MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 58%[==========> ] 1.86G 47.2MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 58%[==========> ] 1.88G 47.7MB/s eta 34s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 58%[==========> ] 1.88G 48.2MB/s eta 33s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 59%[==========> ] 1.89G 47.2MB/s eta 33s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 59%[==========> ] 1.90G 47.3MB/s eta 33s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 59%[==========> ] 1.91G 45.4MB/s eta 33s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 59%[==========> ] 1.92G 46.5MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 60%[===========> ] 1.94G 45.2MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 60%[===========> ] 1.95G 44.7MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 61%[===========> ] 1.96G 45.6MB/s eta 31s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 61%[===========> ] 1.97G 43.7MB/s eta 30s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 61%[===========> ] 1.98G 42.8MB/s eta 30s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 62%[===========> ] 2.00G 45.3MB/s eta 30s " ] }, 
{ "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 62%[===========> ] 2.01G 45.1MB/s eta 30s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 62%[===========> ] 2.01G 43.6MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 63%[===========> ] 2.03G 45.2MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 63%[===========> ] 2.04G 43.8MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 63%[===========> ] 2.04G 43.4MB/s eta 29s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 64%[===========> ] 2.06G 43.6MB/s eta 28s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 64%[===========> ] 2.06G 40.5MB/s eta 28s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 64%[===========> ] 2.07G 40.8MB/s eta 28s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v 65%[============> ] 2.09G 42.1MB/s eta 27s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5 65%[============> ] 2.10G 43.8MB/s eta 27s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5- 65%[============> ] 2.11G 43.3MB/s eta 27s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L 66%[============> ] 2.12G 41.7MB/s eta 27s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6 66%[============> ] 2.13G 39.8MB/s eta 26s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6- 66%[============> ] 2.15G 41.2MB/s eta 26s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D 67%[============> ] 2.16G 41.3MB/s eta 26s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4 67%[============> ] 2.16G 38.0MB/s eta 26s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D40 67%[============> ] 2.17G 39.9MB/s eta 25s " ] }, { 
"name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D409 67%[============> ] 2.17G 37.1MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096 68%[============> ] 2.19G 40.4MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096- 68%[============> ] 2.20G 39.8MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E 68%[============> ] 2.21G 38.9MB/s eta 25s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0 69%[============> ] 2.21G 37.6MB/s eta 24s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_ 69%[============> ] 2.22G 38.7MB/s eta 24s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1 69%[============> ] 2.23G 39.7MB/s eta 24s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1- 70%[=============> ] 2.25G 39.6MB/s eta 24s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1-m 70%[=============> ] 2.26G 41.4MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "v5-L6-D4096-E0_1-me 70%[=============> ] 2.27G 38.7MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-L6-D4096-E0_1-mem 70%[=============> ] 2.27G 39.1MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-L6-D4096-E0_1-mem- 70%[=============> ] 2.27G 36.0MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "L6-D4096-E0_1-mem-c 71%[=============> ] 2.28G 34.9MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-D4096-E0_1-mem-ct 71%[=============> ] 2.28G 35.7MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-D4096-E0_1-mem-ctx 71%[=============> ] 2.29G 35.5MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", 
"text": [ "\r", "D4096-E0_1-mem-ctx- 72%[=============> ] 2.31G 35.1MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "4096-E0_1-mem-ctx-8 72%[=============> ] 2.32G 37.5MB/s eta 23s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "096-E0_1-mem-ctx-8k 72%[=============> ] 2.34G 38.4MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "96-E0_1-mem-ctx-8k. 73%[=============> ] 2.35G 37.5MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-E0_1-mem-ctx-8k.p 73%[=============> ] 2.35G 34.7MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 73%[=============> ] 2.37G 37.5MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 73%[=============> ] 2.37G 36.1MB/s eta 21s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 74%[=============> ] 2.38G 37.7MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 74%[=============> ] 2.38G 37.2MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 74%[=============> ] 2.39G 36.3MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 74%[=============> ] 2.40G 35.1MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 75%[==============> ] 2.41G 33.7MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 75%[==============> ] 2.41G 33.1MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 76%[==============> ] 2.44G 37.2MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 76%[==============> ] 2.46G 39.9MB/s eta 20s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 
76%[==============> ] 2.46G 40.2MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 77%[==============> ] 2.47G 39.3MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 77%[==============> ] 2.49G 39.9MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 77%[==============> ] 2.49G 38.9MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 77%[==============> ] 2.50G 35.8MB/s eta 19s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 78%[==============> ] 2.50G 37.2MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 78%[==============> ] 2.51G 38.4MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 78%[==============> ] 2.52G 36.4MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 78%[==============> ] 2.53G 39.8MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 79%[==============> ] 2.53G 37.3MB/s eta 17s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 79%[==============> ] 2.55G 41.2MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v 79%[==============> ] 2.56G 42.5MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5 80%[===============> ] 2.58G 42.3MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5- 80%[===============> ] 2.59G 44.0MB/s eta 16s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L 80%[===============> ] 2.59G 44.4MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6 81%[===============> ] 2.60G 42.2MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6- 81%[===============> ] 2.61G 40.7MB/s eta 15s " ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "\r", " v5-L6-D 81%[===============> ] 2.62G 40.1MB/s eta 15s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4 82%[===============> ] 2.64G 42.8MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D40 82%[===============> ] 2.65G 44.0MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D409 83%[===============> ] 2.67G 45.4MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096 83%[===============> ] 2.68G 46.1MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096- 84%[===============> ] 2.70G 47.0MB/s eta 14s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E 84%[===============> ] 2.70G 45.7MB/s eta 13s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0 84%[===============> ] 2.71G 47.0MB/s eta 13s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_ 85%[================> ] 2.72G 48.7MB/s eta 13s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1 85%[================> ] 2.73G 47.7MB/s eta 13s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1- 85%[================> ] 2.74G 47.2MB/s eta 13s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D4096-E0_1-m 85%[================> ] 2.76G 47.5MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "v5-L6-D4096-E0_1-me 86%[================> ] 2.77G 47.3MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "5-L6-D4096-E0_1-mem 86%[================> ] 2.79G 48.7MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-L6-D4096-E0_1-mem- 87%[================> ] 2.80G 48.9MB/s eta 11s " ] }, { "name": "stdout", "output_type": "stream", "text": 
[ "\r", "L6-D4096-E0_1-mem-c 87%[================> ] 2.80G 47.7MB/s eta 10s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-D4096-E0_1-mem-ct 87%[================> ] 2.82G 48.5MB/s eta 10s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-D4096-E0_1-mem-ctx 88%[================> ] 2.83G 49.5MB/s eta 10s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "D4096-E0_1-mem-ctx- 88%[================> ] 2.84G 48.0MB/s eta 10s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "4096-E0_1-mem-ctx-8 89%[================> ] 2.86G 44.8MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "096-E0_1-mem-ctx-8k 89%[================> ] 2.86G 44.1MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "96-E0_1-mem-ctx-8k. 89%[================> ] 2.88G 44.7MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "6-E0_1-mem-ctx-8k.p 90%[=================> ] 2.89G 44.2MB/s eta 9s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-E0_1-mem-ctx-8k.pt 90%[=================> ] 2.91G 45.9MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "E0_1-mem-ctx-8k.pth 91%[=================> ] 2.92G 47.9MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "0_1-mem-ctx-8k.pth 91%[=================> ] 2.93G 48.7MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "_1-mem-ctx-8k.pth 91%[=================> ] 2.95G 48.0MB/s eta 7s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "1-mem-ctx-8k.pth 92%[=================> ] 2.95G 41.6MB/s eta 6s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-mem-ctx-8k.pth 92%[=================> ] 2.96G 43.9MB/s eta 6s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "mem-ctx-8k.pth 92%[=================> ] 2.98G 45.1MB/s eta 6s " ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "\r", "em-ctx-8k.pth 92%[=================> ] 2.98G 40.2MB/s eta 6s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "m-ctx-8k.pth 93%[=================> ] 2.99G 41.2MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-ctx-8k.pth 93%[=================> ] 3.00G 40.6MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "ctx-8k.pth 93%[=================> ] 3.01G 39.8MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "tx-8k.pth 94%[=================> ] 3.02G 42.2MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "x-8k.pth 94%[=================> ] 3.03G 41.7MB/s eta 5s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "-8k.pth 95%[==================> ] 3.05G 45.1MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "8k.pth 95%[==================> ] 3.05G 43.7MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "k.pth 95%[==================> ] 3.07G 43.3MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", ".pth 96%[==================> ] 3.08G 44.7MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "pth 96%[==================> ] 3.09G 43.9MB/s eta 4s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "th 96%[==================> ] 3.10G 44.3MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "h 97%[==================> ] 3.11G 42.7MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " 97%[==================> ] 3.13G 42.3MB/s eta 3s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v 98%[==================> ] 3.14G 42.7MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5 98%[==================> ] 3.16G 45.0MB/s eta 1s " ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "\r", " v5- 98%[==================> ] 3.16G 42.3MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L 99%[==================> ] 3.17G 46.3MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6 99%[==================> ] 3.18G 44.5MB/s eta 1s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6- 99%[==================> ] 3.19G 44.6MB/s eta 0s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", " v5-L6-D 99%[==================> ] 3.20G 46.1MB/s eta 0s " ] }, { "name": "stdout", "output_type": "stream", "text": [ "\r", "v5-L6-D4096-E0_1-me 100%[===================>] 3.21G 45.1MB/s in 78s \r\n", "\r\n", "2023-09-05 20:04:40 (41.9 MB/s) - ‘v5-L6-D4096-E0_1-mem-ctx-8k.pth’ saved [3441599237/3441599237]\r\n", "\r\n" ] } ], "source": [ "# Lets download the custom models\n", "!mkdir -p ../../../model/\n", "!cd ../../../model/ && wget -nc \"https://huggingface.co/picocreator/memory-size-experiment-for-rwkv/resolve/main/RWKV-v5-baseline/BaseV5-C-Tune5.pth\"\n", "!cd ../../../model/ && wget -nc \"https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/EWR-1B5-E0_1-mem-ctx-8k.pth\"\n", "!cd ../../../model/ && wget -nc \"https://huggingface.co/rwkv-x-dev/rwkv-x-playground/resolve/main/experiment/rwkv-x-exp/v5-slim-memory/v5-L6-D1024-E0_1-mem-ctx-8k.pth\"\n", "!cd ../../../model/ && wget -nc \"https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/v5-L6-D2048-E0_1-mem-ctx-8k.pth\"\n", "!cd ../../../model/ && wget -nc \"https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/v5-L6-D4096-E0_1-mem-ctx-8k.pth\"" ] }, { "cell_type": "code", "execution_count": 2, "id": "c1d4920e", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T20:04:41.200276Z", "iopub.status.busy": "2023-09-05T20:04:41.199672Z", "iopub.status.idle": "2023-09-05T20:04:41.455126Z", "shell.execute_reply": 
"2023-09-05T20:04:41.454090Z" }, "papermill": { "duration": 0.340242, "end_time": "2023-09-05T20:04:41.457583", "exception": false, "start_time": "2023-09-05T20:04:41.117341", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "total 16G\r\n", "-rw-r--r-- 1 root root 5.7G Aug 11 12:48 BaseV5-C-Tune5.pth\r\n", "-rw-r--r-- 1 root root 5.7G Aug 17 14:38 EWR-1B5-E0_1-mem-ctx-8k.pth\r\n", "-rw-r--r-- 1 root root 353M Sep 5 14:40 v5-L6-D1024-E0_1-mem-ctx-8k.pth\r\n", "-rw-r--r-- 1 root root 1018M Aug 19 08:33 v5-L6-D2048-E0_1-mem-ctx-8k.pth\r\n", "-rw-r--r-- 1 root root 3.3G Aug 20 14:58 v5-L6-D4096-E0_1-mem-ctx-8k.pth\r\n" ] } ], "source": [ "!ls -lh ../../../model/" ] }, { "cell_type": "code", "execution_count": 3, "id": "836e432a", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T20:04:41.617951Z", "iopub.status.busy": "2023-09-05T20:04:41.617377Z", "iopub.status.idle": "2023-09-05T20:04:44.887019Z", "shell.execute_reply": "2023-09-05T20:04:44.885854Z" }, "papermill": { "duration": 3.352332, "end_time": "2023-09-05T20:04:44.889387", "exception": false, "start_time": "2023-09-05T20:04:41.537055", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Requirement already satisfied: aiocsv in /usr/local/lib/python3.10/dist-packages (1.2.4)\r\n", "Requirement already satisfied: aiofiles in /usr/local/lib/python3.10/dist-packages (23.2.1)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "\u001b[33mWARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. 
It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\u001b[0m\u001b[33m\r\n", "\u001b[0m" ] } ], "source": [ "!python3 -m pip install aiocsv aiofiles" ] }, { "cell_type": "markdown", "id": "2e58126b", "metadata": { "papermill": { "duration": 0.079405, "end_time": "2023-09-05T20:04:45.048270", "exception": false, "start_time": "2023-09-05T20:04:44.968865", "status": "completed" }, "tags": [] }, "source": [ "# 1B5 V5 benchmark" ] }, { "cell_type": "code", "execution_count": 4, "id": "ac23fcab", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T20:04:45.210262Z", "iopub.status.busy": "2023-09-05T20:04:45.209384Z", "iopub.status.idle": "2023-09-05T20:06:04.241980Z", "shell.execute_reply": "2023-09-05T20:06:04.240702Z" }, "papermill": { "duration": 79.11701, "end_time": "2023-09-05T20:06:04.244895", "exception": false, "start_time": "2023-09-05T20:04:45.127885", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 20:04:49,621] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation start ###\r\n", "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5 tokens : 100.0% similarity, with 5 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10 tokens : 100.0% similarity, with 10 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15 tokens : 100.0% similarity, with 15 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 20 
tokens : 100.0% similarity, with 20 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 25 tokens : 100.0% similarity, with 25 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 30 tokens : 100.0% similarity, with 30 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 35 tokens : 100.0% similarity, with 35 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 40 tokens : 100.0% similarity, with 40 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 45 tokens : 100.0% similarity, with 45 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 50 tokens : 100.0% similarity, with 50 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 55 tokens : 100.0% similarity, with 55 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 60 tokens : 100.0% similarity, with 60 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 65 tokens : 100.0% similarity, with 65 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 70 tokens : 100.0% similarity, with 70 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 75 tokens : 100.0% similarity, with 75 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 80 tokens : 100.0% 
similarity, with 80 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 85 tokens : 100.0% similarity, with 85 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 90 tokens : 100.0% similarity, with 90 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 95 tokens : 100.0% similarity, with 95 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 100 tokens : 100.0% similarity, with 100 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 105 tokens : 100.0% similarity, with 105 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 110 tokens : 100.0% similarity, with 110 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 115 tokens : 100.0% similarity, with 115 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 120 tokens : 100.0% similarity, with 120 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 125 tokens : 100.0% similarity, with 125 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 130 tokens : 100.0% similarity, with 130 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 135 tokens : 100.0% similarity, with 135 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 140 tokens : 100.0% 
similarity, with 140 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 145 tokens : 100.0% similarity, with 145 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 150 tokens : 100.0% similarity, with 150 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 160 tokens : 100.0% similarity, with 160 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 170 tokens : 100.0% similarity, with 170 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 180 tokens : 100.0% similarity, with 180 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 190 tokens : 99.47368421052632% similarity, with 189 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 200 tokens : 100.0% similarity, with 200 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 210 tokens : 100.0% similarity, with 210 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 220 tokens : 100.0% similarity, with 220 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 230 tokens : 100.0% similarity, with 230 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 240 tokens : 100.0% similarity, with 240 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 250 
tokens : 100.0% similarity, with 250 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 260 tokens : 100.0% similarity, with 260 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 270 tokens : 100.0% similarity, with 270 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 280 tokens : 99.64285714285714% similarity, with 279 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 290 tokens : 100.0% similarity, with 290 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 300 tokens : 99.66666666666667% similarity, with 299 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 325 tokens : 100.0% similarity, with 325 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 350 tokens : 100.0% similarity, with 350 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 375 tokens : 99.46666666666667% similarity, with 373 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 400 tokens : 99.75% similarity, with 399 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 425 tokens : 99.76470588235294% similarity, with 424 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 450 tokens : 99.55555555555556% similarity, with 448 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "## Model validation for 475 tokens : 99.36842105263159% similarity, with 472 matched token, and 3 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 500 tokens : 99.6% similarity, with 498 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 525 tokens : 99.61904761904762% similarity, with 523 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 550 tokens : 99.27272727272727% similarity, with 546 matched token, and 4 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 575 tokens : 99.30434782608695% similarity, with 571 matched token, and 4 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 600 tokens : 99.33333333333333% similarity, with 596 matched token, and 4 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 625 tokens : 99.03999999999999% similarity, with 619 matched token, and 6 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 650 tokens : 99.07692307692308% similarity, with 644 matched token, and 6 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 675 tokens : 99.11111111111111% similarity, with 669 matched token, and 6 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 700 tokens : 99.0% similarity, with 693 matched token, and 7 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 750 tokens : 99.06666666666666% similarity, with 743 matched token, and 7 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation 
for 800 tokens : 99.0% similarity, with 792 matched token, and 8 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 850 tokens : 99.05882352941177% similarity, with 842 matched token, and 8 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 900 tokens : 99.0% similarity, with 891 matched token, and 9 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 950 tokens : 99.1578947368421% similarity, with 942 matched token, and 8 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1000 tokens : 99.2% similarity, with 992 matched token, and 8 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Finished baseline model to eval output predictive matching (aka 0 memory?), for 1000 tokens\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation end ###\r\n", "###\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/BaseV5-C-Tune5.pth\" \"./logs/BaseV5-C-Tune5-1k.csv\"" ] }, { "cell_type": "code", "execution_count": 5, "id": "534dc178", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T20:06:04.432032Z", "iopub.status.busy": "2023-09-05T20:06:04.431202Z", "iopub.status.idle": "2023-09-05T20:10:29.967568Z", "shell.execute_reply": "2023-09-05T20:10:29.966188Z" }, "papermill": { "duration": 265.629775, "end_time": "2023-09-05T20:10:29.969793", "exception": false, "start_time": "2023-09-05T20:06:04.340018", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 20:06:08,978] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with 
torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation start ###\r\n", "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1100 tokens : 98.63636363636363% similarity, with 1085 matched token, and 15 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1150 tokens : 98.52173913043478% similarity, with 1133 matched token, and 17 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1200 tokens : 98.75% similarity, with 1185 matched token, and 15 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1250 tokens : 98.72% similarity, with 1234 matched token, and 16 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1300 tokens : 98.61538461538461% similarity, with 1282 matched token, and 18 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1350 tokens : 98.44444444444444% similarity, with 1329 matched token, and 21 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1400 tokens : 98.5% similarity, with 1379 matched token, and 21 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1450 tokens : 98.20689655172414% similarity, with 1424 matched token, and 26 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1500 tokens : 97.86666666666667% similarity, with 1468 matched token, and 32 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1550 tokens : 97.67741935483872% similarity, with 1514 matched token, and 36 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model 
validation for 1600 tokens : 97.8125% similarity, with 1565 matched token, and 35 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1650 tokens : 97.57575757575758% similarity, with 1610 matched token, and 40 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1700 tokens : 97.6470588235294% similarity, with 1660 matched token, and 40 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1750 tokens : 97.94285714285714% similarity, with 1714 matched token, and 36 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1800 tokens : 97.72222222222223% similarity, with 1759 matched token, and 41 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1850 tokens : 96.86486486486487% similarity, with 1792 matched token, and 58 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1900 tokens : 96.36842105263158% similarity, with 1831 matched token, and 69 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1950 tokens : 95.17948717948718% similarity, with 1856 matched token, and 94 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2000 tokens : 94.75% similarity, with 1895 matched token, and 105 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2050 tokens : 93.26829268292684% similarity, with 1912 matched token, and 138 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2100 tokens : 91.33333333333333% similarity, with 1918 matched token, and 182 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 
2150 tokens : 90.09302325581395% similarity, with 1937 matched token, and 213 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2200 tokens : 88.77272727272727% similarity, with 1953 matched token, and 247 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2250 tokens : 86.53333333333333% similarity, with 1947 matched token, and 303 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2300 tokens : 84.78260869565217% similarity, with 1950 matched token, and 350 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2350 tokens : 82.08510638297872% similarity, with 1929 matched token, and 421 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2400 tokens : 80.625% similarity, with 1935 matched token, and 465 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2450 tokens : 78.61224489795919% similarity, with 1926 matched token, and 524 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2500 tokens : 77.08% similarity, with 1927 matched token, and 573 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2550 tokens : 75.29411764705883% similarity, with 1920 matched token, and 630 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2600 tokens : 73.88461538461539% similarity, with 1921 matched token, and 679 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2650 tokens : 72.75471698113208% similarity, with 1928 matched token, and 722 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2700 
tokens : 71.4074074074074% similarity, with 1928 matched token, and 772 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2750 tokens : 70.10909090909091% similarity, with 1928 matched token, and 822 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2800 tokens : 68.85714285714286% similarity, with 1928 matched token, and 872 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2850 tokens : 67.89473684210526% similarity, with 1935 matched token, and 915 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2900 tokens : 66.6896551724138% similarity, with 1934 matched token, and 966 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2950 tokens : 65.5593220338983% similarity, with 1934 matched token, and 1016 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3000 tokens : 64.36666666666667% similarity, with 1931 matched token, and 1069 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3050 tokens : 63.278688524590166% similarity, with 1930 matched token, and 1120 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3100 tokens : 62.096774193548384% similarity, with 1925 matched token, and 1175 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3150 tokens : 61.17460317460317% similarity, with 1927 matched token, and 1223 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3200 tokens : 60.21875% similarity, with 1927 matched token, and 1273 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation 
for 3250 tokens : 59.199999999999996% similarity, with 1924 matched token, and 1326 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3300 tokens : 58.151515151515156% similarity, with 1919 matched token, and 1381 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3350 tokens : 57.16417910447761% similarity, with 1915 matched token, and 1435 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3400 tokens : 56.294117647058826% similarity, with 1914 matched token, and 1486 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3450 tokens : 55.362318840579704% similarity, with 1910 matched token, and 1540 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3500 tokens : 54.400000000000006% similarity, with 1904 matched token, and 1596 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3550 tokens : 53.5774647887324% similarity, with 1902 matched token, and 1648 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3600 tokens : 52.77777777777778% similarity, with 1900 matched token, and 1700 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3650 tokens : 51.89041095890411% similarity, with 1894 matched token, and 1756 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3700 tokens : 51.08108108108108% similarity, with 1890 matched token, and 1810 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3750 tokens : 50.160000000000004% similarity, with 1881 matched token, and 1869 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", 
"text": [ "## Model validation for 3800 tokens : 49.34210526315789% similarity, with 1875 matched token, and 1925 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3850 tokens : 48.51948051948052% similarity, with 1868 matched token, and 1982 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3900 tokens : 47.51282051282051% similarity, with 1853 matched token, and 2047 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3950 tokens : 46.607594936708864% similarity, with 1841 matched token, and 2109 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4000 tokens : 45.574999999999996% similarity, with 1823 matched token, and 2177 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation end ###\r\n", "###\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/BaseV5-C-Tune5.pth\" \"./logs/BaseV5-C-Tune5-4k.csv\" 1100 4000" ] }, { "cell_type": "code", "execution_count": 6, "id": "99f322eb", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T20:10:30.144675Z", "iopub.status.busy": "2023-09-05T20:10:30.144153Z", "iopub.status.idle": "2023-09-05T21:13:05.936146Z", "shell.execute_reply": "2023-09-05T21:13:05.934942Z" }, "papermill": { "duration": 3755.883001, "end_time": "2023-09-05T21:13:05.938991", "exception": false, "start_time": "2023-09-05T20:10:30.055990", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 20:10:34,716] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "###\r\n", "### Model validation start ###\r\n", "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4100 tokens : 44.0% similarity, with 1804 matched token, and 2296 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4200 tokens : 42.11904761904762% similarity, with 1769 matched token, and 2431 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4300 tokens : 40.27906976744186% similarity, with 1732 matched token, and 2568 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4400 tokens : 38.27272727272727% similarity, with 1684 matched token, and 2716 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4500 tokens : 35.8% similarity, with 1611 matched token, and 2889 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4600 tokens : 33.73913043478261% similarity, with 1552 matched token, and 3048 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4700 tokens : 31.06382978723404% similarity, with 1460 matched token, and 3240 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4800 tokens : 28.3125% similarity, with 1359 matched token, and 3441 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4900 tokens : 25.857142857142858% similarity, with 1267 matched token, and 3633 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5000 tokens : 23.04% similarity, with 1152 matched token, and 3848 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5100 tokens : 
20.764705882352942% similarity, with 1059 matched token, and 4041 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5200 tokens : 18.5% similarity, with 962 matched token, and 4238 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5300 tokens : 16.88679245283019% similarity, with 895 matched token, and 4405 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5400 tokens : 15.222222222222223% similarity, with 822 matched token, and 4578 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5500 tokens : 13.418181818181818% similarity, with 738 matched token, and 4762 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5600 tokens : 11.625% similarity, with 651 matched token, and 4949 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5700 tokens : 10.421052631578947% similarity, with 594 matched token, and 5106 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5800 tokens : 9.344827586206897% similarity, with 542 matched token, and 5258 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5900 tokens : 8.305084745762711% similarity, with 490 matched token, and 5410 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6000 tokens : 7.449999999999999% similarity, with 447 matched token, and 5553 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6100 tokens : 6.655737704918033% similarity, with 406 matched token, and 5694 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6200 tokens : 
6.064516129032258% similarity, with 376 matched token, and 5824 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6300 tokens : 5.65079365079365% similarity, with 356 matched token, and 5944 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6400 tokens : 5.328125% similarity, with 341 matched token, and 6059 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6500 tokens : 4.984615384615385% similarity, with 324 matched token, and 6176 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6600 tokens : 4.6818181818181825% similarity, with 309 matched token, and 6291 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6700 tokens : 4.432835820895523% similarity, with 297 matched token, and 6403 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6800 tokens : 4.25% similarity, with 289 matched token, and 6511 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6900 tokens : 4.08695652173913% similarity, with 282 matched token, and 6618 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7000 tokens : 4.0% similarity, with 280 matched token, and 6720 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7100 tokens : 3.943661971830986% similarity, with 280 matched token, and 6820 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7200 tokens : 3.75% similarity, with 270 matched token, and 6930 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7300 tokens : 3.767123287671233% similarity, with 
275 matched token, and 7025 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7400 tokens : 3.689189189189189% similarity, with 273 matched token, and 7127 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7500 tokens : 3.64% similarity, with 273 matched token, and 7227 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7600 tokens : 3.578947368421052% similarity, with 272 matched token, and 7328 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7700 tokens : 3.5844155844155843% similarity, with 276 matched token, and 7424 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7800 tokens : 3.5641025641025643% similarity, with 278 matched token, and 7522 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7900 tokens : 3.468354430379747% similarity, with 274 matched token, and 7626 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8000 tokens : 3.4250000000000003% similarity, with 274 matched token, and 7726 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8100 tokens : 3.432098765432099% similarity, with 278 matched token, and 7822 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8200 tokens : 3.414634146341464% similarity, with 280 matched token, and 7920 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8300 tokens : 3.36144578313253% similarity, with 279 matched token, and 8021 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8400 tokens : 3.3690476190476186% similarity, 
with 283 matched token, and 8117 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8500 tokens : 3.3411764705882354% similarity, with 284 matched token, and 8216 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8600 tokens : 3.3488372093023258% similarity, with 288 matched token, and 8312 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8700 tokens : 3.3678160919540225% similarity, with 293 matched token, and 8407 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8800 tokens : 3.3295454545454546% similarity, with 293 matched token, and 8507 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8900 tokens : 3.348314606741573% similarity, with 298 matched token, and 8602 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9000 tokens : 3.3333333333333335% similarity, with 300 matched token, and 8700 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9100 tokens : 3.3406593406593412% similarity, with 304 matched token, and 8796 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9200 tokens : 3.3260869565217392% similarity, with 306 matched token, and 8894 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9300 tokens : 3.3010752688172045% similarity, with 307 matched token, and 8993 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9400 tokens : 3.2978723404255317% similarity, with 310 matched token, and 9090 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9500 tokens : 
3.3157894736842106% similarity, with 315 matched token, and 9185 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9600 tokens : 3.3229166666666665% similarity, with 319 matched token, and 9281 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9700 tokens : 3.3195876288659796% similarity, with 322 matched token, and 9378 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9800 tokens : 3.316326530612245% similarity, with 325 matched token, and 9475 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9900 tokens : 3.3333333333333335% similarity, with 330 matched token, and 9570 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10000 tokens : 3.37% similarity, with 337 matched token, and 9663 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10100 tokens : 3.3861386138613865% similarity, with 342 matched token, and 9758 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10200 tokens : 3.3725490196078427% similarity, with 344 matched token, and 9856 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10300 tokens : 3.349514563106796% similarity, with 345 matched token, and 9955 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10400 tokens : 3.355769230769231% similarity, with 349 matched token, and 10051 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10500 tokens : 3.371428571428572% similarity, with 354 matched token, and 10146 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 
10600 tokens : 3.3584905660377355% similarity, with 356 matched token, and 10244 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10700 tokens : 3.392523364485981% similarity, with 363 matched token, and 10337 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10800 tokens : 3.4074074074074074% similarity, with 368 matched token, and 10432 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10900 tokens : 3.3853211009174315% similarity, with 369 matched token, and 10531 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11000 tokens : 3.390909090909091% similarity, with 373 matched token, and 10627 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11100 tokens : 3.3963963963963963% similarity, with 377 matched token, and 10723 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11200 tokens : 3.3839285714285716% similarity, with 379 matched token, and 10821 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11300 tokens : 3.4070796460176993% similarity, with 385 matched token, and 10915 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11400 tokens : 3.43859649122807% similarity, with 392 matched token, and 11008 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11500 tokens : 3.4434782608695653% similarity, with 396 matched token, and 11104 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11600 tokens : 3.4568965517241383% similarity, with 401 matched token, and 11199 token mismatch\r\n" ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "## Model validation for 11700 tokens : 3.4444444444444446% similarity, with 403 matched token, and 11297 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11800 tokens : 3.457627118644068% similarity, with 408 matched token, and 11392 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11900 tokens : 3.46218487394958% similarity, with 412 matched token, and 11488 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12000 tokens : 3.4750000000000005% similarity, with 417 matched token, and 11583 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12100 tokens : 3.487603305785124% similarity, with 422 matched token, and 11678 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12200 tokens : 3.475409836065574% similarity, with 424 matched token, and 11776 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12300 tokens : 3.487804878048781% similarity, with 429 matched token, and 11871 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12400 tokens : 3.491935483870968% similarity, with 433 matched token, and 11967 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12500 tokens : 3.488% similarity, with 436 matched token, and 12064 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12600 tokens : 3.484126984126984% similarity, with 439 matched token, and 12161 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12700 tokens : 3.4881889763779523% similarity, with 443 matched token, and 12257 token mismatch\r\n" ] }, { "name": 
"stdout", "output_type": "stream", "text": [ "## Model validation for 12800 tokens : 3.484375% similarity, with 446 matched token, and 12354 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12900 tokens : 3.488372093023256% similarity, with 450 matched token, and 12450 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13000 tokens : 3.5000000000000004% similarity, with 455 matched token, and 12545 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13100 tokens : 3.5038167938931295% similarity, with 459 matched token, and 12641 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13200 tokens : 3.5000000000000004% similarity, with 462 matched token, and 12738 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13300 tokens : 3.488721804511278% similarity, with 464 matched token, and 12836 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13400 tokens : 3.514925373134328% similarity, with 471 matched token, and 12929 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13500 tokens : 3.503703703703704% similarity, with 473 matched token, and 13027 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13600 tokens : 3.514705882352941% similarity, with 478 matched token, and 13122 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13700 tokens : 3.510948905109489% similarity, with 481 matched token, and 13219 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13800 tokens : 3.5144927536231885% similarity, with 485 matched token, and 13315 
token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13900 tokens : 3.5251798561151078% similarity, with 490 matched token, and 13410 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14000 tokens : 3.55% similarity, with 497 matched token, and 13503 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14100 tokens : 3.546099290780142% similarity, with 500 matched token, and 13600 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14200 tokens : 3.535211267605634% similarity, with 502 matched token, and 13698 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14300 tokens : 3.5454545454545454% similarity, with 507 matched token, and 13793 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14400 tokens : 3.5555555555555554% similarity, with 512 matched token, and 13888 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14500 tokens : 3.537931034482759% similarity, with 513 matched token, and 13987 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14600 tokens : 3.5273972602739727% similarity, with 515 matched token, and 14085 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14700 tokens : 3.5646258503401365% similarity, with 524 matched token, and 14176 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14800 tokens : 3.5472972972972974% similarity, with 525 matched token, and 14275 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14900 tokens : 3.550335570469799% similarity, with 
529 matched token, and 14371 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15000 tokens : 3.5533333333333332% similarity, with 533 matched token, and 14467 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15100 tokens : 3.576158940397351% similarity, with 540 matched token, and 14560 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15200 tokens : 3.56578947368421% similarity, with 542 matched token, and 14658 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15300 tokens : 3.5490196078431375% similarity, with 543 matched token, and 14757 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15400 tokens : 3.551948051948052% similarity, with 547 matched token, and 14853 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15500 tokens : 3.5483870967741935% similarity, with 550 matched token, and 14950 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15600 tokens : 3.5448717948717947% similarity, with 553 matched token, and 15047 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15700 tokens : 3.5605095541401273% similarity, with 559 matched token, and 15141 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15800 tokens : 3.5506329113924053% similarity, with 561 matched token, and 15239 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15900 tokens : 3.547169811320755% similarity, with 564 matched token, and 15336 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 16000 
tokens : 3.5437499999999997% similarity, with 567 matched token, and 15433 token mismatch\r\n", "###\r\n", "### Model validation end ###\r\n", "###\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/BaseV5-C-Tune5.pth\" \"./logs/BaseV5-C-Tune5-16k.csv\" 4100 16000" ] }, { "cell_type": "markdown", "id": "a74e51c9", "metadata": { "papermill": { "duration": 0.09516, "end_time": "2023-09-05T21:13:06.131143", "exception": false, "start_time": "2023-09-05T21:13:06.035983", "status": "completed" }, "tags": [] }, "source": [ "# EWR V5 benchmark" ] }, { "cell_type": "code", "execution_count": 7, "id": "9d25dfe2", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T21:13:06.323309Z", "iopub.status.busy": "2023-09-05T21:13:06.322372Z", "iopub.status.idle": "2023-09-05T21:13:12.951333Z", "shell.execute_reply": "2023-09-05T21:13:12.950224Z" }, "papermill": { "duration": 6.72745, "end_time": "2023-09-05T21:13:12.953705", "exception": false, "start_time": "2023-09-05T21:13:06.226255", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 21:13:10,829] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Traceback (most recent call last):\r\n", " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 366, in \r\n", " asyncio.run(main_function())\r\n", " File \"/usr/lib/python3.10/asyncio/runners.py\", line 44, in run\r\n", " return loop.run_until_complete(main)\r\n", " File \"/usr/lib/python3.10/asyncio/base_events.py\", line 649, in run_until_complete\r\n", " return future.result()\r\n", " File 
\"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 58, in main_function\r\n", " model = SimpleRWKV(model_path, device=\"cuda\")\r\n", " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 1378, in __init__\r\n", " self.model = RWKV(**model_config)\r\n", " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 553, in __init__\r\n", " raise ValueError(f\"load_model file '{load_model}' does not exist\")\r\n", "ValueError: load_model file '../../../model/EWR-1B5-E0_1.pth' does not exist\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/EWR-1B5-E0_1.pth\" \"./logs/v5-EWR-1B5-E0_1-1k.csv\"" ] }, { "cell_type": "code", "execution_count": 8, "id": "3fcf3d9c", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T21:13:13.146654Z", "iopub.status.busy": "2023-09-05T21:13:13.146064Z", "iopub.status.idle": "2023-09-05T21:13:19.792768Z", "shell.execute_reply": "2023-09-05T21:13:19.791667Z" }, "papermill": { "duration": 6.745739, "end_time": "2023-09-05T21:13:19.795146", "exception": false, "start_time": "2023-09-05T21:13:13.049407", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 21:13:17,653] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n", "Traceback (most recent call last):\r\n", " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 366, in \r\n", " asyncio.run(main_function())\r\n", " File \"/usr/lib/python3.10/asyncio/runners.py\", line 44, in run\r\n", " return 
loop.run_until_complete(main)\r\n", " File \"/usr/lib/python3.10/asyncio/base_events.py\", line 649, in run_until_complete\r\n", " return future.result()\r\n", " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 58, in main_function\r\n", " model = SimpleRWKV(model_path, device=\"cuda\")\r\n", " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 1378, in __init__\r\n", " self.model = RWKV(**model_config)\r\n", " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 553, in __init__\r\n", " raise ValueError(f\"load_model file '{load_model}' does not exist\")\r\n", "ValueError: load_model file '../../../model/EWR-1B5-E0_1.pth' does not exist\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/EWR-1B5-E0_1.pth\" \"./logs/v5-EWR-1B5-E0_1-4k.csv\" 1100 4000" ] }, { "cell_type": "code", "execution_count": 9, "id": "b6a68042", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T21:13:19.986694Z", "iopub.status.busy": "2023-09-05T21:13:19.986046Z", "iopub.status.idle": "2023-09-05T21:13:26.675895Z", "shell.execute_reply": "2023-09-05T21:13:26.674749Z" }, "papermill": { "duration": 6.789014, "end_time": "2023-09-05T21:13:26.678244", "exception": false, "start_time": "2023-09-05T21:13:19.889230", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 21:13:24,542] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Traceback (most recent call last):\r\n", " File 
\"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 366, in \r\n", " asyncio.run(main_function())\r\n", " File \"/usr/lib/python3.10/asyncio/runners.py\", line 44, in run\r\n", " return loop.run_until_complete(main)\r\n", " File \"/usr/lib/python3.10/asyncio/base_events.py\", line 649, in run_until_complete\r\n", " return future.result()\r\n", " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 58, in main_function\r\n", " model = SimpleRWKV(model_path, device=\"cuda\")\r\n", " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 1378, in __init__\r\n", " self.model = RWKV(**model_config)\r\n", " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 553, in __init__\r\n", " raise ValueError(f\"load_model file '{load_model}' does not exist\")\r\n", "ValueError: load_model file '../../../model/EWR-1B5-E0_1.pth' does not exist\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/EWR-1B5-E0_1.pth\" \"./logs/v5-EWR-1B5-E0_1-16k.csv\" 4100 16000" ] }, { "cell_type": "markdown", "id": "6ecfc74c", "metadata": { "papermill": { "duration": 0.093639, "end_time": "2023-09-05T21:13:26.866949", "exception": false, "start_time": "2023-09-05T21:13:26.773310", "status": "completed" }, "tags": [] }, "source": [ "# v5-L6-D1024-E0_1-mem-ctx-8k.pth" ] }, { "cell_type": "code", "execution_count": 10, "id": "d480f218", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T21:13:27.058397Z", "iopub.status.busy": "2023-09-05T21:13:27.057750Z", "iopub.status.idle": "2023-09-05T21:14:20.632357Z", "shell.execute_reply": "2023-09-05T21:14:20.631176Z" }, "papermill": { "duration": 53.673513, "end_time": "2023-09-05T21:14:20.634750", "exception": false, "start_time": 
"2023-09-05T21:13:26.961237", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 21:13:31,592] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation start ###\r\n", "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5 tokens : 100.0% similarity, with 5 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10 tokens : 100.0% similarity, with 10 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15 tokens : 100.0% similarity, with 15 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 20 tokens : 100.0% similarity, with 20 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 25 tokens : 100.0% similarity, with 25 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 30 tokens : 100.0% similarity, with 30 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 35 tokens : 100.0% similarity, with 35 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 40 tokens : 97.5% similarity, with 39 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 45 tokens : 97.77777777777777% similarity, with 44 matched token, and 1 
token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 50 tokens : 94.0% similarity, with 47 matched token, and 3 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 55 tokens : 85.45454545454545% similarity, with 47 matched token, and 8 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 60 tokens : 83.33333333333334% similarity, with 50 matched token, and 10 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 65 tokens : 81.53846153846153% similarity, with 53 matched token, and 12 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 70 tokens : 72.85714285714285% similarity, with 51 matched token, and 19 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 75 tokens : 68.0% similarity, with 51 matched token, and 24 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 80 tokens : 63.74999999999999% similarity, with 51 matched token, and 29 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 85 tokens : 57.647058823529406% similarity, with 49 matched token, and 36 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 90 tokens : 58.88888888888889% similarity, with 53 matched token, and 37 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 95 tokens : 54.736842105263165% similarity, with 52 matched token, and 43 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 100 tokens : 55.00000000000001% similarity, with 55 matched token, and 45 token mismatch\r\n" ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "## Model validation for 105 tokens : 56.19047619047619% similarity, with 59 matched token, and 46 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 110 tokens : 55.45454545454545% similarity, with 61 matched token, and 49 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 115 tokens : 53.04347826086957% similarity, with 61 matched token, and 54 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 120 tokens : 48.333333333333336% similarity, with 58 matched token, and 62 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 125 tokens : 46.400000000000006% similarity, with 58 matched token, and 67 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 130 tokens : 45.38461538461539% similarity, with 59 matched token, and 71 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 135 tokens : 44.44444444444444% similarity, with 60 matched token, and 75 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 140 tokens : 42.142857142857146% similarity, with 59 matched token, and 81 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 145 tokens : 42.758620689655174% similarity, with 62 matched token, and 83 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 150 tokens : 41.333333333333336% similarity, with 62 matched token, and 88 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 160 tokens : 35.0% similarity, with 56 matched token, and 104 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model 
validation for 170 tokens : 33.52941176470588% similarity, with 57 matched token, and 113 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 180 tokens : 32.77777777777778% similarity, with 59 matched token, and 121 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 190 tokens : 32.631578947368425% similarity, with 62 matched token, and 128 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 200 tokens : 33.0% similarity, with 66 matched token, and 134 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 210 tokens : 32.38095238095238% similarity, with 68 matched token, and 142 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 220 tokens : 29.09090909090909% similarity, with 64 matched token, and 156 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 230 tokens : 28.695652173913043% similarity, with 66 matched token, and 164 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 240 tokens : 30.833333333333336% similarity, with 74 matched token, and 166 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 250 tokens : 30.8% similarity, with 77 matched token, and 173 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 260 tokens : 31.153846153846153% similarity, with 81 matched token, and 179 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 270 tokens : 28.51851851851852% similarity, with 77 matched token, and 193 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 280 tokens : 30.0% 
similarity, with 84 matched token, and 196 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 290 tokens : 27.586206896551722% similarity, with 80 matched token, and 210 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 300 tokens : 28.000000000000004% similarity, with 84 matched token, and 216 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 325 tokens : 26.153846153846157% similarity, with 85 matched token, and 240 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 350 tokens : 25.142857142857146% similarity, with 88 matched token, and 262 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 375 tokens : 22.933333333333334% similarity, with 86 matched token, and 289 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 400 tokens : 22.75% similarity, with 91 matched token, and 309 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 425 tokens : 22.58823529411765% similarity, with 96 matched token, and 329 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 450 tokens : 20.88888888888889% similarity, with 94 matched token, and 356 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 475 tokens : 19.789473684210527% similarity, with 94 matched token, and 381 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 500 tokens : 18.8% similarity, with 94 matched token, and 406 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 525 tokens : 18.285714285714285% similarity, with 96 matched token, 
and 429 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 550 tokens : 17.636363636363637% similarity, with 97 matched token, and 453 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 575 tokens : 18.086956521739133% similarity, with 104 matched token, and 471 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 600 tokens : 17.0% similarity, with 102 matched token, and 498 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 625 tokens : 16.96% similarity, with 106 matched token, and 519 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 650 tokens : 15.384615384615385% similarity, with 100 matched token, and 550 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 675 tokens : 15.851851851851853% similarity, with 107 matched token, and 568 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 700 tokens : 14.285714285714285% similarity, with 100 matched token, and 600 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 750 tokens : 14.266666666666666% similarity, with 107 matched token, and 643 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 800 tokens : 13.375% similarity, with 107 matched token, and 693 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 850 tokens : 13.529411764705882% similarity, with 115 matched token, and 735 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 900 tokens : 13.0% similarity, with 117 matched token, and 783 token mismatch\r\n" ] }, { "name": 
"stdout", "output_type": "stream", "text": [ "## Model validation for 950 tokens : 12.0% similarity, with 114 matched token, and 836 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1000 tokens : 11.1% similarity, with 111 matched token, and 889 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Finished baseline model to eval output predictive matching (aka 0 memory?), for 1000 tokens\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation end ###\r\n", "###\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/v5-L6-D1024-E0_1-mem-ctx-8k.pth\" \"./logs/v5-L6-D1024-E0_1-1k.csv\"" ] }, { "cell_type": "code", "execution_count": 11, "id": "50bc6985", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T21:14:20.832876Z", "iopub.status.busy": "2023-09-05T21:14:20.832220Z", "iopub.status.idle": "2023-09-05T21:17:59.733915Z", "shell.execute_reply": "2023-09-05T21:17:59.732622Z" }, "papermill": { "duration": 219.003796, "end_time": "2023-09-05T21:17:59.736377", "exception": false, "start_time": "2023-09-05T21:14:20.732581", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 21:14:25,362] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation start ###\r\n", "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1100 tokens : 10.363636363636363% similarity, with 114 matched token, and 986 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1150 tokens : 
9.826086956521738% similarity, with 113 matched token, and 1037 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1200 tokens : 9.75% similarity, with 117 matched token, and 1083 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1250 tokens : 9.6% similarity, with 120 matched token, and 1130 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1300 tokens : 9.230769230769232% similarity, with 120 matched token, and 1180 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1350 tokens : 8.592592592592592% similarity, with 116 matched token, and 1234 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1400 tokens : 9.071428571428571% similarity, with 127 matched token, and 1273 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1450 tokens : 8.827586206896552% similarity, with 128 matched token, and 1322 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1500 tokens : 7.933333333333334% similarity, with 119 matched token, and 1381 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1550 tokens : 7.677419354838709% similarity, with 119 matched token, and 1431 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1600 tokens : 7.9375% similarity, with 127 matched token, and 1473 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1650 tokens : 7.212121212121213% similarity, with 119 matched token, and 1531 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1700 tokens : 6.88235294117647% 
similarity, with 117 matched token, and 1583 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1750 tokens : 6.800000000000001% similarity, with 119 matched token, and 1631 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1800 tokens : 6.888888888888889% similarity, with 124 matched token, and 1676 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1850 tokens : 6.594594594594596% similarity, with 122 matched token, and 1728 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1900 tokens : 6.368421052631579% similarity, with 121 matched token, and 1779 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1950 tokens : 6.102564102564102% similarity, with 119 matched token, and 1831 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2000 tokens : 6.0% similarity, with 120 matched token, and 1880 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2050 tokens : 5.951219512195122% similarity, with 122 matched token, and 1928 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2100 tokens : 5.714285714285714% similarity, with 120 matched token, and 1980 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2150 tokens : 5.627906976744186% similarity, with 121 matched token, and 2029 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2200 tokens : 5.227272727272727% similarity, with 115 matched token, and 2085 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2250 tokens : 5.066666666666666% 
similarity, with 114 matched token, and 2136 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2300 tokens : 5.043478260869565% similarity, with 116 matched token, and 2184 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2350 tokens : 4.808510638297872% similarity, with 113 matched token, and 2237 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2400 tokens : 4.75% similarity, with 114 matched token, and 2286 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2450 tokens : 4.775510204081632% similarity, with 117 matched token, and 2333 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2500 tokens : 4.68% similarity, with 117 matched token, and 2383 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2550 tokens : 4.627450980392156% similarity, with 118 matched token, and 2432 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2600 tokens : 4.576923076923077% similarity, with 119 matched token, and 2481 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2650 tokens : 4.60377358490566% similarity, with 122 matched token, and 2528 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2700 tokens : 4.62962962962963% similarity, with 125 matched token, and 2575 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2750 tokens : 4.618181818181818% similarity, with 127 matched token, and 2623 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2800 tokens : 4.5% similarity, with 126 matched 
token, and 2674 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2850 tokens : 4.456140350877193% similarity, with 127 matched token, and 2723 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2900 tokens : 4.344827586206897% similarity, with 126 matched token, and 2774 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2950 tokens : 4.372881355932203% similarity, with 129 matched token, and 2821 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3000 tokens : 4.233333333333333% similarity, with 127 matched token, and 2873 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3050 tokens : 4.19672131147541% similarity, with 128 matched token, and 2922 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3100 tokens : 4.161290322580645% similarity, with 129 matched token, and 2971 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3150 tokens : 4.1269841269841265% similarity, with 130 matched token, and 3020 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3200 tokens : 4.125% similarity, with 132 matched token, and 3068 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3250 tokens : 4.153846153846154% similarity, with 135 matched token, and 3115 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3300 tokens : 4.121212121212121% similarity, with 136 matched token, and 3164 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3350 tokens : 3.940298507462687% similarity, with 132 
matched token, and 3218 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3400 tokens : 3.9411764705882355% similarity, with 134 matched token, and 3266 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3450 tokens : 3.91304347826087% similarity, with 135 matched token, and 3315 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3500 tokens : 3.9142857142857146% similarity, with 137 matched token, and 3363 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3550 tokens : 3.859154929577465% similarity, with 137 matched token, and 3413 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3600 tokens : 3.888888888888889% similarity, with 140 matched token, and 3460 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3650 tokens : 3.863013698630137% similarity, with 141 matched token, and 3509 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3700 tokens : 3.8108108108108105% similarity, with 141 matched token, and 3559 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3750 tokens : 3.7600000000000002% similarity, with 141 matched token, and 3609 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3800 tokens : 3.763157894736842% similarity, with 143 matched token, and 3657 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3850 tokens : 3.766233766233766% similarity, with 145 matched token, and 3705 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3900 tokens : 3.717948717948718% 
similarity, with 145 matched token, and 3755 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3950 tokens : 3.645569620253165% similarity, with 144 matched token, and 3806 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4000 tokens : 3.6249999999999996% similarity, with 145 matched token, and 3855 token mismatch\r\n", "###\r\n", "### Model validation end ###\r\n", "###\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/v5-L6-D1024-E0_1-mem-ctx-8k.pth\" \"./logs/v5-L6-D1024-E0_1-4k.csv\" 1100 4000" ] }, { "cell_type": "code", "execution_count": 12, "id": "488296d3", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T21:17:59.942749Z", "iopub.status.busy": "2023-09-05T21:17:59.941792Z", "iopub.status.idle": "2023-09-05T22:15:37.866692Z", "shell.execute_reply": "2023-09-05T22:15:37.865420Z" }, "papermill": { "duration": 3458.031609, "end_time": "2023-09-05T22:15:37.869014", "exception": false, "start_time": "2023-09-05T21:17:59.837405", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 21:18:04,474] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation start ###\r\n", "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4100 tokens : 3.6585365853658534% similarity, with 150 matched token, and 3950 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4200 tokens : 3.571428571428571% similarity, with 150 matched token, and 4050 token mismatch\r\n" ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "## Model validation for 4300 tokens : 3.5348837209302326% similarity, with 152 matched token, and 4148 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4400 tokens : 3.5227272727272725% similarity, with 155 matched token, and 4245 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4500 tokens : 3.4888888888888885% similarity, with 157 matched token, and 4343 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4600 tokens : 3.5000000000000004% similarity, with 161 matched token, and 4439 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4700 tokens : 3.5106382978723407% similarity, with 165 matched token, and 4535 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4800 tokens : 3.4583333333333335% similarity, with 166 matched token, and 4634 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4900 tokens : 3.4489795918367343% similarity, with 169 matched token, and 4731 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5000 tokens : 3.38% similarity, with 169 matched token, and 4831 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5100 tokens : 3.392156862745098% similarity, with 173 matched token, and 4927 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5200 tokens : 3.307692307692308% similarity, with 172 matched token, and 5028 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5300 tokens : 3.3207547169811322% similarity, with 176 matched token, and 5124 token mismatch\r\n" ] }, { "name": 
"stdout", "output_type": "stream", "text": [ "## Model validation for 5400 tokens : 3.2407407407407405% similarity, with 175 matched token, and 5225 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5500 tokens : 3.272727272727273% similarity, with 180 matched token, and 5320 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5600 tokens : 3.2857142857142856% similarity, with 184 matched token, and 5416 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5700 tokens : 3.263157894736842% similarity, with 186 matched token, and 5514 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5800 tokens : 3.2241379310344827% similarity, with 187 matched token, and 5613 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5900 tokens : 3.2542372881355934% similarity, with 192 matched token, and 5708 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6000 tokens : 3.2333333333333334% similarity, with 194 matched token, and 5806 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6100 tokens : 3.245901639344263% similarity, with 198 matched token, and 5902 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6200 tokens : 3.225806451612903% similarity, with 200 matched token, and 6000 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6300 tokens : 3.2380952380952377% similarity, with 204 matched token, and 6096 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6400 tokens : 3.2343749999999996% similarity, with 207 matched token, and 6193 token 
mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6500 tokens : 3.2615384615384615% similarity, with 212 matched token, and 6288 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6600 tokens : 3.2424242424242427% similarity, with 214 matched token, and 6386 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6700 tokens : 3.268656716417911% similarity, with 219 matched token, and 6481 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6800 tokens : 3.25% similarity, with 221 matched token, and 6579 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6900 tokens : 3.27536231884058% similarity, with 226 matched token, and 6674 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7000 tokens : 3.257142857142857% similarity, with 228 matched token, and 6772 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7100 tokens : 3.2394366197183095% similarity, with 230 matched token, and 6870 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7200 tokens : 3.236111111111111% similarity, with 233 matched token, and 6967 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7300 tokens : 3.2602739726027394% similarity, with 238 matched token, and 7062 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7400 tokens : 3.256756756756757% similarity, with 241 matched token, and 7159 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7500 tokens : 3.2399999999999998% similarity, with 243 matched token, and 7257 
token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7600 tokens : 3.25% similarity, with 247 matched token, and 7353 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7700 tokens : 3.25974025974026% similarity, with 251 matched token, and 7449 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7800 tokens : 3.2435897435897436% similarity, with 253 matched token, and 7547 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7900 tokens : 3.2405063291139244% similarity, with 256 matched token, and 7644 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8000 tokens : 3.2375000000000003% similarity, with 259 matched token, and 7741 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8100 tokens : 3.2839506172839505% similarity, with 266 matched token, and 7834 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8200 tokens : 3.2682926829268295% similarity, with 268 matched token, and 7932 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8300 tokens : 3.2530120481927707% similarity, with 270 matched token, and 8030 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8400 tokens : 3.2380952380952377% similarity, with 272 matched token, and 8128 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8500 tokens : 3.2705882352941176% similarity, with 278 matched token, and 8222 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8600 tokens : 3.2674418604651168% similarity, with 281 matched token, 
and 8319 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8700 tokens : 3.2758620689655173% similarity, with 285 matched token, and 8415 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8800 tokens : 3.25% similarity, with 286 matched token, and 8514 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8900 tokens : 3.258426966292135% similarity, with 290 matched token, and 8610 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9000 tokens : 3.255555555555555% similarity, with 293 matched token, and 8707 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9100 tokens : 3.274725274725275% similarity, with 298 matched token, and 8802 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9200 tokens : 3.2717391304347823% similarity, with 301 matched token, and 8899 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9300 tokens : 3.258064516129032% similarity, with 303 matched token, and 8997 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9400 tokens : 3.2446808510638294% similarity, with 305 matched token, and 9095 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9500 tokens : 3.263157894736842% similarity, with 310 matched token, and 9190 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9600 tokens : 3.2604166666666665% similarity, with 313 matched token, and 9287 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9700 tokens : 3.257731958762886% similarity, with 316 matched 
token, and 9384 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9800 tokens : 3.2448979591836737% similarity, with 318 matched token, and 9482 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9900 tokens : 3.262626262626263% similarity, with 323 matched token, and 9577 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10000 tokens : 3.29% similarity, with 329 matched token, and 9671 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10100 tokens : 3.306930693069307% similarity, with 334 matched token, and 9766 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10200 tokens : 3.294117647058824% similarity, with 336 matched token, and 9864 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10300 tokens : 3.2815533980582527% similarity, with 338 matched token, and 9962 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10400 tokens : 3.2884615384615388% similarity, with 342 matched token, and 10058 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10500 tokens : 3.3047619047619046% similarity, with 347 matched token, and 10153 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10600 tokens : 3.2924528301886795% similarity, with 349 matched token, and 10251 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10700 tokens : 3.3177570093457946% similarity, with 355 matched token, and 10345 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10800 tokens : 3.3240740740740735% 
similarity, with 359 matched token, and 10441 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10900 tokens : 3.311926605504587% similarity, with 361 matched token, and 10539 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11000 tokens : 3.327272727272727% similarity, with 366 matched token, and 10634 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11100 tokens : 3.3153153153153156% similarity, with 368 matched token, and 10732 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11200 tokens : 3.303571428571429% similarity, with 370 matched token, and 10830 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11300 tokens : 3.3097345132743365% similarity, with 374 matched token, and 10926 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11400 tokens : 3.3421052631578947% similarity, with 381 matched token, and 11019 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11500 tokens : 3.3304347826086955% similarity, with 383 matched token, and 11117 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11600 tokens : 3.3448275862068964% similarity, with 388 matched token, and 11212 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11700 tokens : 3.3333333333333335% similarity, with 390 matched token, and 11310 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11800 tokens : 3.347457627118644% similarity, with 395 matched token, and 11405 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model 
validation for 11900 tokens : 3.34453781512605% similarity, with 398 matched token, and 11502 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12000 tokens : 3.3583333333333334% similarity, with 403 matched token, and 11597 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12100 tokens : 3.3636363636363638% similarity, with 407 matched token, and 11693 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12200 tokens : 3.3524590163934427% similarity, with 409 matched token, and 11791 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12300 tokens : 3.3577235772357725% similarity, with 413 matched token, and 11887 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12400 tokens : 3.354838709677419% similarity, with 416 matched token, and 11984 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12500 tokens : 3.3520000000000003% similarity, with 419 matched token, and 12081 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12600 tokens : 3.349206349206349% similarity, with 422 matched token, and 12178 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12700 tokens : 3.362204724409449% similarity, with 427 matched token, and 12273 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12800 tokens : 3.3515625% similarity, with 429 matched token, and 12371 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12900 tokens : 3.356589147286822% similarity, with 433 matched token, and 12467 token mismatch\r\n" ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "## Model validation for 13000 tokens : 3.3692307692307697% similarity, with 438 matched token, and 12562 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13100 tokens : 3.3587786259541987% similarity, with 440 matched token, and 12660 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13200 tokens : 3.3636363636363638% similarity, with 444 matched token, and 12756 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13300 tokens : 3.3533834586466167% similarity, with 446 matched token, and 12854 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13400 tokens : 3.3731343283582094% similarity, with 452 matched token, and 12948 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13500 tokens : 3.355555555555555% similarity, with 453 matched token, and 13047 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13600 tokens : 3.3602941176470584% similarity, with 457 matched token, and 13143 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13700 tokens : 3.343065693430657% similarity, with 458 matched token, and 13242 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13800 tokens : 3.355072463768116% similarity, with 463 matched token, and 13337 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13900 tokens : 3.3741007194244603% similarity, with 469 matched token, and 13431 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14000 tokens : 3.3857142857142857% similarity, with 474 matched token, and 13526 
token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14100 tokens : 3.3829787234042556% similarity, with 477 matched token, and 13623 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14200 tokens : 3.373239436619718% similarity, with 479 matched token, and 13721 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14300 tokens : 3.3636363636363638% similarity, with 481 matched token, and 13819 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14400 tokens : 3.375% similarity, with 486 matched token, and 13914 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14500 tokens : 3.36551724137931% similarity, with 488 matched token, and 14012 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14600 tokens : 3.356164383561644% similarity, with 490 matched token, and 14110 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14700 tokens : 3.387755102040816% similarity, with 498 matched token, and 14202 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14800 tokens : 3.371621621621622% similarity, with 499 matched token, and 14301 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14900 tokens : 3.3758389261744965% similarity, with 503 matched token, and 14397 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15000 tokens : 3.373333333333333% similarity, with 506 matched token, and 14494 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15100 tokens : 3.357615894039735% similarity, with 507 
matched token, and 14593 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15200 tokens : 3.3486842105263155% similarity, with 509 matched token, and 14691 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15300 tokens : 3.3529411764705883% similarity, with 513 matched token, and 14787 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15400 tokens : 3.3441558441558437% similarity, with 515 matched token, and 14885 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15500 tokens : 3.3419354838709676% similarity, with 518 matched token, and 14982 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15600 tokens : 3.346153846153846% similarity, with 522 matched token, and 15078 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15700 tokens : 3.3503184713375793% similarity, with 526 matched token, and 15174 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15800 tokens : 3.3417721518987342% similarity, with 528 matched token, and 15272 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15900 tokens : 3.3333333333333335% similarity, with 530 matched token, and 15370 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 16000 tokens : 3.325% similarity, with 532 matched token, and 15468 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation end ###\r\n", "###\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/v5-L6-D1024-E0_1-mem-ctx-8k.pth\" \"./logs/v5-L6-D1024-E0_1-16k.csv\" 4100 16000" ] }, { 
"cell_type": "markdown", "id": "579317b2", "metadata": { "papermill": { "duration": 0.104356, "end_time": "2023-09-05T22:15:38.079271", "exception": false, "start_time": "2023-09-05T22:15:37.974915", "status": "completed" }, "tags": [] }, "source": [ "# v5-L6-D2048-E0_1-mem-ctx-8k.pth" ] }, { "cell_type": "code", "execution_count": 13, "id": "a3bc5e5c", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T22:15:38.293951Z", "iopub.status.busy": "2023-09-05T22:15:38.293240Z", "iopub.status.idle": "2023-09-05T22:16:30.929975Z", "shell.execute_reply": "2023-09-05T22:16:30.928742Z" }, "papermill": { "duration": 52.74712, "end_time": "2023-09-05T22:16:30.932428", "exception": false, "start_time": "2023-09-05T22:15:38.185308", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 22:15:42,702] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation start ###\r\n", "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5 tokens : 100.0% similarity, with 5 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10 tokens : 100.0% similarity, with 10 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15 tokens : 100.0% similarity, with 15 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 20 tokens : 100.0% similarity, with 20 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 25 tokens : 100.0% 
similarity, with 25 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 30 tokens : 100.0% similarity, with 30 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 35 tokens : 100.0% similarity, with 35 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 40 tokens : 100.0% similarity, with 40 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 45 tokens : 100.0% similarity, with 45 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 50 tokens : 100.0% similarity, with 50 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 55 tokens : 98.18181818181819% similarity, with 54 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 60 tokens : 100.0% similarity, with 60 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 65 tokens : 98.46153846153847% similarity, with 64 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 70 tokens : 98.57142857142858% similarity, with 69 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 75 tokens : 98.66666666666667% similarity, with 74 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 80 tokens : 100.0% similarity, with 80 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model 
validation for 85 tokens : 100.0% similarity, with 85 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 90 tokens : 97.77777777777777% similarity, with 88 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 95 tokens : 100.0% similarity, with 95 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 100 tokens : 99.0% similarity, with 99 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 105 tokens : 99.04761904761905% similarity, with 104 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 110 tokens : 99.0909090909091% similarity, with 109 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 115 tokens : 99.1304347826087% similarity, with 114 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 120 tokens : 99.16666666666667% similarity, with 119 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 125 tokens : 99.2% similarity, with 124 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 130 tokens : 99.23076923076923% similarity, with 129 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 135 tokens : 99.25925925925925% similarity, with 134 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 140 tokens : 99.28571428571429% similarity, with 139 matched token, and 1 
token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 145 tokens : 99.3103448275862% similarity, with 144 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 150 tokens : 99.33333333333333% similarity, with 149 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 160 tokens : 99.375% similarity, with 159 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 170 tokens : 99.41176470588235% similarity, with 169 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 180 tokens : 99.44444444444444% similarity, with 179 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 190 tokens : 97.89473684210527% similarity, with 186 matched token, and 4 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 200 tokens : 98.5% similarity, with 197 matched token, and 3 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 210 tokens : 98.09523809523809% similarity, with 206 matched token, and 4 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 220 tokens : 96.36363636363636% similarity, with 212 matched token, and 8 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 230 tokens : 97.3913043478261% similarity, with 224 matched token, and 6 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 240 tokens : 97.5% similarity, with 234 matched token, and 6 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", 
"text": [ "## Model validation for 250 tokens : 97.6% similarity, with 244 matched token, and 6 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 260 tokens : 97.3076923076923% similarity, with 253 matched token, and 7 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 270 tokens : 97.03703703703704% similarity, with 262 matched token, and 8 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 280 tokens : 95.35714285714286% similarity, with 267 matched token, and 13 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 290 tokens : 95.17241379310344% similarity, with 276 matched token, and 14 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 300 tokens : 95.33333333333334% similarity, with 286 matched token, and 14 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 325 tokens : 95.6923076923077% similarity, with 311 matched token, and 14 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 350 tokens : 95.14285714285714% similarity, with 333 matched token, and 17 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 375 tokens : 93.60000000000001% similarity, with 351 matched token, and 24 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 400 tokens : 91.75% similarity, with 367 matched token, and 33 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 425 tokens : 91.76470588235294% similarity, with 390 matched token, and 35 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 450 tokens : 
89.77777777777777% similarity, with 404 matched token, and 46 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 475 tokens : 89.47368421052632% similarity, with 425 matched token, and 50 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 500 tokens : 88.8% similarity, with 444 matched token, and 56 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 525 tokens : 87.80952380952381% similarity, with 461 matched token, and 64 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 550 tokens : 86.72727272727273% similarity, with 477 matched token, and 73 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 575 tokens : 86.08695652173914% similarity, with 495 matched token, and 80 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 600 tokens : 85.66666666666667% similarity, with 514 matched token, and 86 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 625 tokens : 84.48% similarity, with 528 matched token, and 97 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 650 tokens : 83.23076923076923% similarity, with 541 matched token, and 109 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 675 tokens : 82.07407407407408% similarity, with 554 matched token, and 121 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 700 tokens : 81.0% similarity, with 567 matched token, and 133 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 750 tokens : 78.53333333333333% similarity, with 589 matched token, 
and 161 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 800 tokens : 76.75% similarity, with 614 matched token, and 186 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 850 tokens : 73.76470588235294% similarity, with 627 matched token, and 223 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 900 tokens : 71.44444444444444% similarity, with 643 matched token, and 257 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 950 tokens : 68.84210526315789% similarity, with 654 matched token, and 296 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1000 tokens : 67.4% similarity, with 674 matched token, and 326 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Finished baseline model to eval output predictive matching (aka 0 memory?), for 1000 tokens\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation end ###\r\n", "###\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/v5-L6-D2048-E0_1-mem-ctx-8k.pth\" \"./logs/v5-L6-D2048-E0_1-1k.csv\"" ] }, { "cell_type": "code", "execution_count": 14, "id": "6bf21423", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T22:16:31.257032Z", "iopub.status.busy": "2023-09-05T22:16:31.256036Z", "iopub.status.idle": "2023-09-05T22:20:35.318227Z", "shell.execute_reply": "2023-09-05T22:20:35.316693Z" }, "papermill": { "duration": 244.178194, "end_time": "2023-09-05T22:20:35.320591", "exception": false, "start_time": "2023-09-05T22:16:31.142397", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 22:16:35,877] [INFO] [real_accelerator.py:133:get_accelerator] Setting 
ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation start ###\r\n", "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1100 tokens : 61.0% similarity, with 671 matched token, and 429 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1150 tokens : 58.26086956521739% similarity, with 670 matched token, and 480 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1200 tokens : 56.49999999999999% similarity, with 678 matched token, and 522 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1250 tokens : 54.400000000000006% similarity, with 680 matched token, and 570 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1300 tokens : 51.92307692307693% similarity, with 675 matched token, and 625 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1350 tokens : 50.37037037037037% similarity, with 680 matched token, and 670 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1400 tokens : 48.214285714285715% similarity, with 675 matched token, and 725 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1450 tokens : 45.03448275862069% similarity, with 653 matched token, and 797 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1500 tokens : 43.06666666666666% similarity, with 646 matched token, and 854 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model 
validation for 1550 tokens : 41.80645161290323% similarity, with 648 matched token, and 902 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1600 tokens : 41.125% similarity, with 658 matched token, and 942 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1650 tokens : 39.45454545454545% similarity, with 651 matched token, and 999 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1700 tokens : 38.23529411764706% similarity, with 650 matched token, and 1050 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1750 tokens : 36.22857142857143% similarity, with 634 matched token, and 1116 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1800 tokens : 35.388888888888886% similarity, with 637 matched token, and 1163 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1850 tokens : 33.4054054054054% similarity, with 618 matched token, and 1232 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1900 tokens : 32.315789473684205% similarity, with 614 matched token, and 1286 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1950 tokens : 31.538461538461537% similarity, with 615 matched token, and 1335 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2000 tokens : 30.75% similarity, with 615 matched token, and 1385 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2050 tokens : 30.097560975609756% similarity, with 617 matched token, and 1433 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model 
validation for 2100 tokens : 29.19047619047619% similarity, with 613 matched token, and 1487 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2150 tokens : 28.511627906976745% similarity, with 613 matched token, and 1537 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2200 tokens : 28.045454545454547% similarity, with 617 matched token, and 1583 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2250 tokens : 27.28888888888889% similarity, with 614 matched token, and 1636 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2300 tokens : 26.608695652173914% similarity, with 612 matched token, and 1688 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2350 tokens : 26.04255319148936% similarity, with 612 matched token, and 1738 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2400 tokens : 25.5% similarity, with 612 matched token, and 1788 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2450 tokens : 24.653061224489793% similarity, with 604 matched token, and 1846 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2500 tokens : 24.2% similarity, with 605 matched token, and 1895 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2550 tokens : 23.764705882352942% similarity, with 606 matched token, and 1944 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2600 tokens : 23.26923076923077% similarity, with 605 matched token, and 1995 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model 
validation for 2650 tokens : 22.79245283018868% similarity, with 604 matched token, and 2046 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2700 tokens : 22.25925925925926% similarity, with 601 matched token, and 2099 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2750 tokens : 21.818181818181817% similarity, with 600 matched token, and 2150 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2800 tokens : 21.464285714285715% similarity, with 601 matched token, and 2199 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2850 tokens : 21.157894736842106% similarity, with 603 matched token, and 2247 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2900 tokens : 20.620689655172413% similarity, with 598 matched token, and 2302 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2950 tokens : 20.30508474576271% similarity, with 599 matched token, and 2351 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3000 tokens : 19.933333333333334% similarity, with 598 matched token, and 2402 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3050 tokens : 19.540983606557376% similarity, with 596 matched token, and 2454 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3100 tokens : 19.193548387096772% similarity, with 595 matched token, and 2505 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3150 tokens : 18.88888888888889% similarity, with 595 matched token, and 2555 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", 
"text": [ "## Model validation for 3200 tokens : 18.53125% similarity, with 593 matched token, and 2607 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3250 tokens : 18.246153846153845% similarity, with 593 matched token, and 2657 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3300 tokens : 17.87878787878788% similarity, with 590 matched token, and 2710 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3350 tokens : 17.55223880597015% similarity, with 588 matched token, and 2762 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3400 tokens : 17.323529411764707% similarity, with 589 matched token, and 2811 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3450 tokens : 16.98550724637681% similarity, with 586 matched token, and 2864 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3500 tokens : 16.62857142857143% similarity, with 582 matched token, and 2918 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3550 tokens : 16.366197183098592% similarity, with 581 matched token, and 2969 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3600 tokens : 15.944444444444445% similarity, with 574 matched token, and 3026 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3650 tokens : 15.835616438356166% similarity, with 578 matched token, and 3072 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3700 tokens : 15.486486486486486% similarity, with 573 matched token, and 3127 token mismatch\r\n" ] }, { "name": "stdout", "output_type": 
"stream", "text": [ "## Model validation for 3750 tokens : 15.28% similarity, with 573 matched token, and 3177 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3800 tokens : 15.026315789473685% similarity, with 571 matched token, and 3229 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3850 tokens : 14.779220779220777% similarity, with 569 matched token, and 3281 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3900 tokens : 14.692307692307693% similarity, with 573 matched token, and 3327 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3950 tokens : 14.27848101265823% similarity, with 564 matched token, and 3386 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4000 tokens : 13.850000000000001% similarity, with 554 matched token, and 3446 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation end ###\r\n", "###\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/v5-L6-D2048-E0_1-mem-ctx-8k.pth\" \"./logs/v5-L6-D2048-E0_1-4k.csv\" 1100 4000" ] }, { "cell_type": "code", "execution_count": 15, "id": "44ea2959", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T22:20:35.545636Z", "iopub.status.busy": "2023-09-05T22:20:35.545083Z", "iopub.status.idle": "2023-09-05T23:20:17.504268Z", "shell.execute_reply": "2023-09-05T23:20:17.503356Z" }, "papermill": { "duration": 3582.074768, "end_time": "2023-09-05T23:20:17.506577", "exception": false, "start_time": "2023-09-05T22:20:35.431809", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 22:20:39,857] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator 
to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation start ###\r\n", "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4100 tokens : 13.390243902439025% similarity, with 549 matched token, and 3551 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4200 tokens : 12.547619047619046% similarity, with 527 matched token, and 3673 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4300 tokens : 11.906976744186046% similarity, with 512 matched token, and 3788 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4400 tokens : 10.772727272727273% similarity, with 474 matched token, and 3926 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4500 tokens : 9.88888888888889% similarity, with 445 matched token, and 4055 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4600 tokens : 8.782608695652174% similarity, with 404 matched token, and 4196 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4700 tokens : 8.085106382978724% similarity, with 380 matched token, and 4320 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4800 tokens : 7.208333333333333% similarity, with 346 matched token, and 4454 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4900 tokens : 6.346938775510204% similarity, with 311 matched token, and 4589 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ 
"## Model validation for 5000 tokens : 5.4399999999999995% similarity, with 272 matched token, and 4728 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5100 tokens : 4.96078431372549% similarity, with 253 matched token, and 4847 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5200 tokens : 4.5% similarity, with 234 matched token, and 4966 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5300 tokens : 4.377358490566038% similarity, with 232 matched token, and 5068 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5400 tokens : 4.092592592592593% similarity, with 221 matched token, and 5179 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5500 tokens : 4.0% similarity, with 220 matched token, and 5280 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5600 tokens : 3.8214285714285716% similarity, with 214 matched token, and 5386 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5700 tokens : 3.736842105263158% similarity, with 213 matched token, and 5487 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5800 tokens : 3.6551724137931036% similarity, with 212 matched token, and 5588 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5900 tokens : 3.6610169491525424% similarity, with 216 matched token, and 5684 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6000 tokens : 3.55% similarity, with 213 matched token, and 5787 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 
6100 tokens : 3.540983606557377% similarity, with 216 matched token, and 5884 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6200 tokens : 3.5000000000000004% similarity, with 217 matched token, and 5983 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6300 tokens : 3.492063492063492% similarity, with 220 matched token, and 6080 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6400 tokens : 3.453125% similarity, with 221 matched token, and 6179 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6500 tokens : 3.4615384615384617% similarity, with 225 matched token, and 6275 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6600 tokens : 3.424242424242424% similarity, with 226 matched token, and 6374 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6700 tokens : 3.4477611940298503% similarity, with 231 matched token, and 6469 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6800 tokens : 3.426470588235294% similarity, with 233 matched token, and 6567 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6900 tokens : 3.4492753623188404% similarity, with 238 matched token, and 6662 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7000 tokens : 3.4428571428571426% similarity, with 241 matched token, and 6759 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7100 tokens : 3.4225352112676055% similarity, with 243 matched token, and 6857 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model 
validation for 7200 tokens : 3.4027777777777777% similarity, with 245 matched token, and 6955 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7300 tokens : 3.4109589041095894% similarity, with 249 matched token, and 7051 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7400 tokens : 3.4054054054054053% similarity, with 252 matched token, and 7148 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7500 tokens : 3.4133333333333336% similarity, with 256 matched token, and 7244 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7600 tokens : 3.421052631578948% similarity, with 260 matched token, and 7340 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7700 tokens : 3.428571428571429% similarity, with 264 matched token, and 7436 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7800 tokens : 3.4102564102564106% similarity, with 266 matched token, and 7534 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7900 tokens : 3.4177215189873418% similarity, with 270 matched token, and 7630 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8000 tokens : 3.4125% similarity, with 273 matched token, and 7727 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8100 tokens : 3.45679012345679% similarity, with 280 matched token, and 7820 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8200 tokens : 3.439024390243903% similarity, with 282 matched token, and 7918 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ 
"## Model validation for 8300 tokens : 3.4216867469879517% similarity, with 284 matched token, and 8016 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8400 tokens : 3.428571428571429% similarity, with 288 matched token, and 8112 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8500 tokens : 3.458823529411765% similarity, with 294 matched token, and 8206 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8600 tokens : 3.4534883720930236% similarity, with 297 matched token, and 8303 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8700 tokens : 3.4482758620689653% similarity, with 300 matched token, and 8400 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8800 tokens : 3.4431818181818183% similarity, with 303 matched token, and 8497 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8900 tokens : 3.449438202247191% similarity, with 307 matched token, and 8593 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9000 tokens : 3.4333333333333336% similarity, with 309 matched token, and 8691 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9100 tokens : 3.4505494505494507% similarity, with 314 matched token, and 8786 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9200 tokens : 3.4565217391304346% similarity, with 318 matched token, and 8882 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9300 tokens : 3.4301075268817205% similarity, with 319 matched token, and 8981 token mismatch\r\n" ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "## Model validation for 9400 tokens : 3.404255319148936% similarity, with 320 matched token, and 9080 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9500 tokens : 3.431578947368421% similarity, with 326 matched token, and 9174 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9600 tokens : 3.4166666666666665% similarity, with 328 matched token, and 9272 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9700 tokens : 3.4123711340206184% similarity, with 331 matched token, and 9369 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9800 tokens : 3.387755102040816% similarity, with 332 matched token, and 9468 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9900 tokens : 3.424242424242424% similarity, with 339 matched token, and 9561 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10000 tokens : 3.45% similarity, with 345 matched token, and 9655 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10100 tokens : 3.455445544554456% similarity, with 349 matched token, and 9751 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10200 tokens : 3.4509803921568625% similarity, with 352 matched token, and 9848 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10300 tokens : 3.4368932038834954% similarity, with 354 matched token, and 9946 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10400 tokens : 3.4423076923076925% similarity, with 358 matched token, and 10042 token mismatch\r\n" ] }, { 
"name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10500 tokens : 3.4666666666666663% similarity, with 364 matched token, and 10136 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10600 tokens : 3.4528301886792456% similarity, with 366 matched token, and 10234 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10700 tokens : 3.4766355140186915% similarity, with 372 matched token, and 10328 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10800 tokens : 3.490740740740741% similarity, with 377 matched token, and 10423 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10900 tokens : 3.4770642201834865% similarity, with 379 matched token, and 10521 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11000 tokens : 3.5000000000000004% similarity, with 385 matched token, and 10615 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11100 tokens : 3.4954954954954953% similarity, with 388 matched token, and 10712 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11200 tokens : 3.482142857142857% similarity, with 390 matched token, and 10810 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11300 tokens : 3.4955752212389384% similarity, with 395 matched token, and 10905 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11400 tokens : 3.543859649122807% similarity, with 404 matched token, and 10996 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11500 tokens : 3.5391304347826087% similarity, with 407 matched 
token, and 11093 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11600 tokens : 3.5603448275862073% similarity, with 413 matched token, and 11187 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11700 tokens : 3.547008547008547% similarity, with 415 matched token, and 11285 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11800 tokens : 3.5593220338983054% similarity, with 420 matched token, and 11380 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11900 tokens : 3.563025210084034% similarity, with 424 matched token, and 11476 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12000 tokens : 3.5833333333333335% similarity, with 430 matched token, and 11570 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12100 tokens : 3.5867768595041323% similarity, with 434 matched token, and 11666 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12200 tokens : 3.5655737704918034% similarity, with 435 matched token, and 11765 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12300 tokens : 3.585365853658536% similarity, with 441 matched token, and 11859 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12400 tokens : 3.588709677419355% similarity, with 445 matched token, and 11955 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12500 tokens : 3.5839999999999996% similarity, with 448 matched token, and 12052 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12600 tokens : 
3.5793650793650795% similarity, with 451 matched token, and 12149 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12700 tokens : 3.5905511811023625% similarity, with 456 matched token, and 12244 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12800 tokens : 3.578125% similarity, with 458 matched token, and 12342 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12900 tokens : 3.573643410852713% similarity, with 461 matched token, and 12439 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13000 tokens : 3.5923076923076924% similarity, with 467 matched token, and 12533 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13100 tokens : 3.572519083969466% similarity, with 468 matched token, and 12632 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13200 tokens : 3.5833333333333335% similarity, with 473 matched token, and 12727 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13300 tokens : 3.56390977443609% similarity, with 474 matched token, and 12826 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13400 tokens : 3.58955223880597% similarity, with 481 matched token, and 12919 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13500 tokens : 3.5777777777777775% similarity, with 483 matched token, and 13017 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13600 tokens : 3.5882352941176467% similarity, with 488 matched token, and 13112 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model 
validation for 13700 tokens : 3.576642335766423% similarity, with 490 matched token, and 13210 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13800 tokens : 3.5797101449275366% similarity, with 494 matched token, and 13306 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13900 tokens : 3.5899280575539567% similarity, with 499 matched token, and 13401 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14000 tokens : 3.6142857142857143% similarity, with 506 matched token, and 13494 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14100 tokens : 3.6099290780141846% similarity, with 509 matched token, and 13591 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14200 tokens : 3.5985915492957745% similarity, with 511 matched token, and 13689 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14300 tokens : 3.5944055944055946% similarity, with 514 matched token, and 13786 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14400 tokens : 3.6111111111111107% similarity, with 520 matched token, and 13880 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14500 tokens : 3.5999999999999996% similarity, with 522 matched token, and 13978 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14600 tokens : 3.5890410958904106% similarity, with 524 matched token, and 14076 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14700 tokens : 3.619047619047619% similarity, with 532 matched token, and 14168 token mismatch\r\n" ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "## Model validation for 14800 tokens : 3.614864864864865% similarity, with 535 matched token, and 14265 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14900 tokens : 3.610738255033557% similarity, with 538 matched token, and 14362 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15000 tokens : 3.5999999999999996% similarity, with 540 matched token, and 14460 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15100 tokens : 3.596026490066225% similarity, with 543 matched token, and 14557 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15200 tokens : 3.592105263157895% similarity, with 546 matched token, and 14654 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15300 tokens : 3.594771241830065% similarity, with 550 matched token, and 14750 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15400 tokens : 3.5909090909090913% similarity, with 553 matched token, and 14847 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15500 tokens : 3.587096774193548% similarity, with 556 matched token, and 14944 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15600 tokens : 3.5897435897435894% similarity, with 560 matched token, and 15040 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15700 tokens : 3.5923566878980893% similarity, with 564 matched token, and 15136 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15800 tokens : 3.5822784810126582% similarity, with 566 matched token, and 15234 
token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15900 tokens : 3.578616352201258% similarity, with 569 matched token, and 15331 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 16000 tokens : 3.5687499999999996% similarity, with 571 matched token, and 15429 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation end ###\r\n", "###\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/v5-L6-D2048-E0_1-mem-ctx-8k.pth\" \"./logs/v5-L6-D2048-E0_1-16k.csv\" 4100 16000" ] }, { "cell_type": "markdown", "id": "b398575a", "metadata": { "papermill": { "duration": 0.123548, "end_time": "2023-09-05T23:20:17.753184", "exception": false, "start_time": "2023-09-05T23:20:17.629636", "status": "completed" }, "tags": [] }, "source": [ "# v5-L6-D4096-E0_1-mem-ctx-8k.pth" ] }, { "cell_type": "code", "execution_count": 16, "id": "b3229188", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T23:20:18.000562Z", "iopub.status.busy": "2023-09-05T23:20:18.000185Z", "iopub.status.idle": "2023-09-05T23:21:27.371500Z", "shell.execute_reply": "2023-09-05T23:21:27.370336Z" }, "papermill": { "duration": 69.497703, "end_time": "2023-09-05T23:21:27.373916", "exception": false, "start_time": "2023-09-05T23:20:17.876213", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 23:20:22,562] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation start ###\r\n", "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model 
validation for 5 tokens : 100.0% similarity, with 5 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10 tokens : 100.0% similarity, with 10 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15 tokens : 100.0% similarity, with 15 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 20 tokens : 100.0% similarity, with 20 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 25 tokens : 100.0% similarity, with 25 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 30 tokens : 100.0% similarity, with 30 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 35 tokens : 100.0% similarity, with 35 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 40 tokens : 100.0% similarity, with 40 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 45 tokens : 100.0% similarity, with 45 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 50 tokens : 100.0% similarity, with 50 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 55 tokens : 100.0% similarity, with 55 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 60 tokens : 100.0% similarity, with 60 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 65 
tokens : 100.0% similarity, with 65 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 70 tokens : 100.0% similarity, with 70 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 75 tokens : 100.0% similarity, with 75 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 80 tokens : 100.0% similarity, with 80 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 85 tokens : 100.0% similarity, with 85 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 90 tokens : 100.0% similarity, with 90 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 95 tokens : 100.0% similarity, with 95 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 100 tokens : 100.0% similarity, with 100 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 105 tokens : 100.0% similarity, with 105 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 110 tokens : 100.0% similarity, with 110 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 115 tokens : 100.0% similarity, with 115 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 120 tokens : 100.0% similarity, with 120 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 125 tokens : 
100.0% similarity, with 125 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 130 tokens : 100.0% similarity, with 130 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 135 tokens : 100.0% similarity, with 135 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 140 tokens : 100.0% similarity, with 140 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 145 tokens : 100.0% similarity, with 145 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 150 tokens : 99.33333333333333% similarity, with 149 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 160 tokens : 99.375% similarity, with 159 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 170 tokens : 98.82352941176471% similarity, with 168 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 180 tokens : 98.88888888888889% similarity, with 178 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 190 tokens : 98.94736842105263% similarity, with 188 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 200 tokens : 99.0% similarity, with 198 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 210 tokens : 99.04761904761905% similarity, with 208 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "## Model validation for 220 tokens : 99.0909090909091% similarity, with 218 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 230 tokens : 99.1304347826087% similarity, with 228 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 240 tokens : 99.58333333333333% similarity, with 239 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 250 tokens : 99.2% similarity, with 248 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 260 tokens : 99.23076923076923% similarity, with 258 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 270 tokens : 98.51851851851852% similarity, with 266 matched token, and 4 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 280 tokens : 98.57142857142858% similarity, with 276 matched token, and 4 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 290 tokens : 98.62068965517241% similarity, with 286 matched token, and 4 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 300 tokens : 98.0% similarity, with 294 matched token, and 6 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 325 tokens : 98.46153846153847% similarity, with 320 matched token, and 5 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 350 tokens : 97.71428571428571% similarity, with 342 matched token, and 8 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation 
for 375 tokens : 96.53333333333333% similarity, with 362 matched token, and 13 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 400 tokens : 96.75% similarity, with 387 matched token, and 13 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 425 tokens : 96.47058823529412% similarity, with 410 matched token, and 15 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 450 tokens : 96.0% similarity, with 432 matched token, and 18 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 475 tokens : 95.36842105263158% similarity, with 453 matched token, and 22 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 500 tokens : 93.8% similarity, with 469 matched token, and 31 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 525 tokens : 93.9047619047619% similarity, with 493 matched token, and 32 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 550 tokens : 93.81818181818183% similarity, with 516 matched token, and 34 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 575 tokens : 92.8695652173913% similarity, with 534 matched token, and 41 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 600 tokens : 92.66666666666666% similarity, with 556 matched token, and 44 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 625 tokens : 92.0% similarity, with 575 matched token, and 50 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 650 tokens : 90.46153846153845% similarity, with 588 matched token, 
and 62 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 675 tokens : 90.96296296296296% similarity, with 614 matched token, and 61 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 700 tokens : 91.0% similarity, with 637 matched token, and 63 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 750 tokens : 89.2% similarity, with 669 matched token, and 81 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 800 tokens : 88.0% similarity, with 704 matched token, and 96 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 850 tokens : 87.52941176470588% similarity, with 744 matched token, and 106 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 900 tokens : 87.66666666666667% similarity, with 789 matched token, and 111 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 950 tokens : 85.78947368421052% similarity, with 815 matched token, and 135 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1000 tokens : 83.6% similarity, with 836 matched token, and 164 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Finished baseline model to eval output predictive matching (aka 0 memory?), for 1000 tokens\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation end ###\r\n", "###\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/v5-L6-D4096-E0_1-mem-ctx-8k.pth\" \"./logs/v5-L6-D4096-E0_1-1k.csv\"" ] }, { "cell_type": "code", "execution_count": 17, "id": "33e254f7", "metadata": { "execution": { "iopub.execute_input": 
"2023-09-05T23:21:27.628949Z", "iopub.status.busy": "2023-09-05T23:21:27.628479Z", "iopub.status.idle": "2023-09-05T23:25:51.884822Z", "shell.execute_reply": "2023-09-05T23:25:51.883772Z" }, "papermill": { "duration": 264.386818, "end_time": "2023-09-05T23:25:51.887041", "exception": false, "start_time": "2023-09-05T23:21:27.500223", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 23:21:32,282] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation start ###\r\n", "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1100 tokens : 80.0909090909091% similarity, with 881 matched token, and 219 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1150 tokens : 78.34782608695652% similarity, with 901 matched token, and 249 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1200 tokens : 77.16666666666666% similarity, with 926 matched token, and 274 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1250 tokens : 74.56% similarity, with 932 matched token, and 318 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1300 tokens : 73.0% similarity, with 949 matched token, and 351 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1350 tokens : 72.5925925925926% similarity, with 980 matched token, and 370 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1400 tokens : 
70.71428571428572% similarity, with 990 matched token, and 410 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1450 tokens : 68.13793103448276% similarity, with 988 matched token, and 462 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1500 tokens : 66.0% similarity, with 990 matched token, and 510 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1550 tokens : 65.48387096774194% similarity, with 1015 matched token, and 535 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1600 tokens : 63.375% similarity, with 1014 matched token, and 586 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1650 tokens : 62.24242424242424% similarity, with 1027 matched token, and 623 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1700 tokens : 60.411764705882355% similarity, with 1027 matched token, and 673 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1750 tokens : 59.08571428571429% similarity, with 1034 matched token, and 716 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1800 tokens : 56.388888888888886% similarity, with 1015 matched token, and 785 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1850 tokens : 56.00000000000001% similarity, with 1036 matched token, and 814 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1900 tokens : 54.89473684210526% similarity, with 1043 matched token, and 857 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 1950 tokens : 
53.17948717948718% similarity, with 1037 matched token, and 913 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2000 tokens : 52.75% similarity, with 1055 matched token, and 945 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2050 tokens : 50.8780487804878% similarity, with 1043 matched token, and 1007 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2100 tokens : 49.57142857142857% similarity, with 1041 matched token, and 1059 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2150 tokens : 47.72093023255814% similarity, with 1026 matched token, and 1124 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2200 tokens : 46.409090909090914% similarity, with 1021 matched token, and 1179 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2250 tokens : 45.33333333333333% similarity, with 1020 matched token, and 1230 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2300 tokens : 43.21739130434782% similarity, with 994 matched token, and 1306 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2350 tokens : 41.61702127659574% similarity, with 978 matched token, and 1372 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2400 tokens : 40.875% similarity, with 981 matched token, and 1419 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2450 tokens : 38.9795918367347% similarity, with 955 matched token, and 1495 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2500 tokens : 
37.92% similarity, with 948 matched token, and 1552 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2550 tokens : 36.431372549019606% similarity, with 929 matched token, and 1621 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2600 tokens : 35.53846153846154% similarity, with 924 matched token, and 1676 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2650 tokens : 34.60377358490566% similarity, with 917 matched token, and 1733 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2700 tokens : 33.925925925925924% similarity, with 916 matched token, and 1784 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2750 tokens : 32.690909090909095% similarity, with 899 matched token, and 1851 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2800 tokens : 31.607142857142854% similarity, with 885 matched token, and 1915 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2850 tokens : 31.017543859649123% similarity, with 884 matched token, and 1966 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2900 tokens : 30.06896551724138% similarity, with 872 matched token, and 2028 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 2950 tokens : 29.322033898305083% similarity, with 865 matched token, and 2085 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3000 tokens : 28.7% similarity, with 861 matched token, and 2139 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3050 tokens : 
27.77049180327869% similarity, with 847 matched token, and 2203 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3100 tokens : 27.387096774193548% similarity, with 849 matched token, and 2251 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3150 tokens : 26.88888888888889% similarity, with 847 matched token, and 2303 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3200 tokens : 26.34375% similarity, with 843 matched token, and 2357 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3250 tokens : 25.784615384615385% similarity, with 838 matched token, and 2412 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3300 tokens : 25.151515151515152% similarity, with 830 matched token, and 2470 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3350 tokens : 24.507462686567163% similarity, with 821 matched token, and 2529 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3400 tokens : 24.058823529411764% similarity, with 818 matched token, and 2582 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3450 tokens : 23.391304347826086% similarity, with 807 matched token, and 2643 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3500 tokens : 23.0% similarity, with 805 matched token, and 2695 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3550 tokens : 22.7887323943662% similarity, with 809 matched token, and 2741 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3600 tokens : 
22.47222222222222% similarity, with 809 matched token, and 2791 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3650 tokens : 22.054794520547947% similarity, with 805 matched token, and 2845 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3700 tokens : 21.756756756756758% similarity, with 805 matched token, and 2895 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3750 tokens : 21.493333333333332% similarity, with 806 matched token, and 2944 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3800 tokens : 21.342105263157897% similarity, with 811 matched token, and 2989 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3850 tokens : 21.038961038961038% similarity, with 810 matched token, and 3040 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3900 tokens : 20.692307692307693% similarity, with 807 matched token, and 3093 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 3950 tokens : 20.32911392405063% similarity, with 803 matched token, and 3147 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4000 tokens : 20.05% similarity, with 802 matched token, and 3198 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation end ###\r\n", "###\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/v5-L6-D4096-E0_1-mem-ctx-8k.pth\" \"./logs/v5-L6-D4096-E0_1-4k.csv\" 1100 4000" ] }, { "cell_type": "code", "execution_count": 18, "id": "5d33ffaa", "metadata": { "execution": { "iopub.execute_input": "2023-09-05T23:25:52.152096Z", "iopub.status.busy": 
"2023-09-05T23:25:52.151535Z", "iopub.status.idle": "2023-09-06T00:28:45.815950Z", "shell.execute_reply": "2023-09-06T00:28:45.814816Z" }, "papermill": { "duration": 3773.798194, "end_time": "2023-09-06T00:28:45.818553", "exception": false, "start_time": "2023-09-05T23:25:52.020359", "status": "completed" }, "tags": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[2023-09-05 23:25:56,732] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation start ###\r\n", "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4100 tokens : 19.390243902439025% similarity, with 795 matched token, and 3305 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4200 tokens : 18.452380952380953% similarity, with 775 matched token, and 3425 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4300 tokens : 17.883720930232556% similarity, with 769 matched token, and 3531 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4400 tokens : 17.09090909090909% similarity, with 752 matched token, and 3648 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4500 tokens : 16.400000000000002% similarity, with 738 matched token, and 3762 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4600 tokens : 15.65217391304348% similarity, with 720 matched token, and 3880 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4700 tokens : 14.829787234042552% 
similarity, with 697 matched token, and 4003 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4800 tokens : 14.145833333333332% similarity, with 679 matched token, and 4121 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 4900 tokens : 13.204081632653061% similarity, with 647 matched token, and 4253 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5000 tokens : 12.46% similarity, with 623 matched token, and 4377 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5100 tokens : 11.490196078431373% similarity, with 586 matched token, and 4514 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5200 tokens : 10.596153846153847% similarity, with 551 matched token, and 4649 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5300 tokens : 9.773584905660378% similarity, with 518 matched token, and 4782 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5400 tokens : 8.685185185185185% similarity, with 469 matched token, and 4931 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5500 tokens : 7.8909090909090915% similarity, with 434 matched token, and 5066 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5600 tokens : 7.214285714285714% similarity, with 404 matched token, and 5196 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5700 tokens : 6.561403508771931% similarity, with 374 matched token, and 5326 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5800 tokens : 
5.931034482758621% similarity, with 344 matched token, and 5456 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 5900 tokens : 5.6440677966101696% similarity, with 333 matched token, and 5567 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6000 tokens : 5.166666666666667% similarity, with 310 matched token, and 5690 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6100 tokens : 4.836065573770492% similarity, with 295 matched token, and 5805 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6200 tokens : 4.370967741935484% similarity, with 271 matched token, and 5929 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6300 tokens : 4.222222222222222% similarity, with 266 matched token, and 6034 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6400 tokens : 3.9843749999999996% similarity, with 255 matched token, and 6145 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6500 tokens : 3.8615384615384616% similarity, with 251 matched token, and 6249 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6600 tokens : 3.7575757575757573% similarity, with 248 matched token, and 6352 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6700 tokens : 3.805970149253731% similarity, with 255 matched token, and 6445 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 6800 tokens : 3.691176470588235% similarity, with 251 matched token, and 6549 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation 
for 6900 tokens : 3.6231884057971016% similarity, with 250 matched token, and 6650 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7000 tokens : 3.571428571428571% similarity, with 250 matched token, and 6750 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7100 tokens : 3.492957746478873% similarity, with 248 matched token, and 6852 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7200 tokens : 3.486111111111111% similarity, with 251 matched token, and 6949 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7300 tokens : 3.493150684931507% similarity, with 255 matched token, and 7045 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7400 tokens : 3.5000000000000004% similarity, with 259 matched token, and 7141 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7500 tokens : 3.4266666666666667% similarity, with 257 matched token, and 7243 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7600 tokens : 3.4342105263157894% similarity, with 261 matched token, and 7339 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7700 tokens : 3.428571428571429% similarity, with 264 matched token, and 7436 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7800 tokens : 3.4230769230769234% similarity, with 267 matched token, and 7533 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 7900 tokens : 3.4050632911392404% similarity, with 269 matched token, and 7631 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ 
"## Model validation for 8000 tokens : 3.4000000000000004% similarity, with 272 matched token, and 7728 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8100 tokens : 3.4444444444444446% similarity, with 279 matched token, and 7821 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8200 tokens : 3.4268292682926833% similarity, with 281 matched token, and 7919 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8300 tokens : 3.4096385542168677% similarity, with 283 matched token, and 8017 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8400 tokens : 3.392857142857143% similarity, with 285 matched token, and 8115 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8500 tokens : 3.4235294117647057% similarity, with 291 matched token, and 8209 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8600 tokens : 3.4186046511627906% similarity, with 294 matched token, and 8306 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8700 tokens : 3.425287356321839% similarity, with 298 matched token, and 8402 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8800 tokens : 3.4090909090909087% similarity, with 300 matched token, and 8500 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 8900 tokens : 3.4269662921348316% similarity, with 305 matched token, and 8595 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9000 tokens : 3.4111111111111114% similarity, with 307 matched token, and 8693 token mismatch\r\n" ] }, { "name": "stdout", 
"output_type": "stream", "text": [ "## Model validation for 9100 tokens : 3.428571428571429% similarity, with 312 matched token, and 8788 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9200 tokens : 3.4239130434782608% similarity, with 315 matched token, and 8885 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9300 tokens : 3.4086021505376345% similarity, with 317 matched token, and 8983 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9400 tokens : 3.393617021276596% similarity, with 319 matched token, and 9081 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9500 tokens : 3.4105263157894736% similarity, with 324 matched token, and 9176 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9600 tokens : 3.4166666666666665% similarity, with 328 matched token, and 9272 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9700 tokens : 3.4123711340206184% similarity, with 331 matched token, and 9369 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9800 tokens : 3.4081632653061225% similarity, with 334 matched token, and 9466 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 9900 tokens : 3.424242424242424% similarity, with 339 matched token, and 9561 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10000 tokens : 3.45% similarity, with 345 matched token, and 9655 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10100 tokens : 3.4653465346534658% similarity, with 350 matched token, and 9750 token mismatch\r\n" ] }, { "name": 
"stdout", "output_type": "stream", "text": [ "## Model validation for 10200 tokens : 3.4509803921568625% similarity, with 352 matched token, and 9848 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10300 tokens : 3.4368932038834954% similarity, with 354 matched token, and 9946 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10400 tokens : 3.4423076923076925% similarity, with 358 matched token, and 10042 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10500 tokens : 3.4476190476190474% similarity, with 362 matched token, and 10138 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10600 tokens : 3.443396226415094% similarity, with 365 matched token, and 10235 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10700 tokens : 3.467289719626168% similarity, with 371 matched token, and 10329 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10800 tokens : 3.4722222222222223% similarity, with 375 matched token, and 10425 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 10900 tokens : 3.458715596330275% similarity, with 377 matched token, and 10523 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11000 tokens : 3.481818181818182% similarity, with 383 matched token, and 10617 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11100 tokens : 3.4774774774774775% similarity, with 386 matched token, and 10714 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11200 tokens : 3.455357142857143% similarity, with 387 matched token, and 
10813 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11300 tokens : 3.4690265486725664% similarity, with 392 matched token, and 10908 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11400 tokens : 3.5000000000000004% similarity, with 399 matched token, and 11001 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11500 tokens : 3.5043478260869563% similarity, with 403 matched token, and 11097 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11600 tokens : 3.517241379310345% similarity, with 408 matched token, and 11192 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11700 tokens : 3.5042735042735043% similarity, with 410 matched token, and 11290 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11800 tokens : 3.516949152542373% similarity, with 415 matched token, and 11385 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 11900 tokens : 3.521008403361345% similarity, with 419 matched token, and 11481 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12000 tokens : 3.5333333333333337% similarity, with 424 matched token, and 11576 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12100 tokens : 3.5454545454545454% similarity, with 429 matched token, and 11671 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12200 tokens : 3.5327868852459017% similarity, with 431 matched token, and 11769 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12300 tokens : 
3.5447154471544713% similarity, with 436 matched token, and 11864 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12400 tokens : 3.540322580645161% similarity, with 439 matched token, and 11961 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12500 tokens : 3.5360000000000005% similarity, with 442 matched token, and 12058 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12600 tokens : 3.5317460317460316% similarity, with 445 matched token, and 12155 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12700 tokens : 3.543307086614173% similarity, with 450 matched token, and 12250 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12800 tokens : 3.5312499999999996% similarity, with 452 matched token, and 12348 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 12900 tokens : 3.5348837209302326% similarity, with 456 matched token, and 12444 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13000 tokens : 3.553846153846154% similarity, with 462 matched token, and 12538 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13100 tokens : 3.5343511450381677% similarity, with 463 matched token, and 12637 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13200 tokens : 3.5378787878787876% similarity, with 467 matched token, and 12733 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13300 tokens : 3.5263157894736845% similarity, with 469 matched token, and 12831 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", 
"text": [ "## Model validation for 13400 tokens : 3.544776119402985% similarity, with 475 matched token, and 12925 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13500 tokens : 3.5333333333333337% similarity, with 477 matched token, and 13023 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13600 tokens : 3.5441176470588234% similarity, with 482 matched token, and 13118 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13700 tokens : 3.5328467153284673% similarity, with 484 matched token, and 13216 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13800 tokens : 3.5362318840579707% similarity, with 488 matched token, and 13312 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 13900 tokens : 3.5467625899280577% similarity, with 493 matched token, and 13407 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14000 tokens : 3.564285714285714% similarity, with 499 matched token, and 13501 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14100 tokens : 3.5602836879432624% similarity, with 502 matched token, and 13598 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14200 tokens : 3.549295774647887% similarity, with 504 matched token, and 13696 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14300 tokens : 3.5454545454545454% similarity, with 507 matched token, and 13793 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14400 tokens : 3.5555555555555554% similarity, with 512 matched token, and 13888 token mismatch\r\n" ] }, { 
"name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14500 tokens : 3.5448275862068965% similarity, with 514 matched token, and 13986 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14600 tokens : 3.534246575342466% similarity, with 516 matched token, and 14084 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14700 tokens : 3.5646258503401365% similarity, with 524 matched token, and 14176 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14800 tokens : 3.5608108108108105% similarity, with 527 matched token, and 14273 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 14900 tokens : 3.557046979865772% similarity, with 530 matched token, and 14370 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15000 tokens : 3.56% similarity, with 534 matched token, and 14466 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15100 tokens : 3.556291390728477% similarity, with 537 matched token, and 14563 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15200 tokens : 3.546052631578948% similarity, with 539 matched token, and 14661 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15300 tokens : 3.5490196078431375% similarity, with 543 matched token, and 14757 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15400 tokens : 3.538961038961039% similarity, with 545 matched token, and 14855 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15500 tokens : 3.535483870967742% similarity, with 548 matched token, and 14952 
token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15600 tokens : 3.5384615384615383% similarity, with 552 matched token, and 15048 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15700 tokens : 3.54140127388535% similarity, with 556 matched token, and 15144 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15800 tokens : 3.531645569620253% similarity, with 558 matched token, and 15242 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 15900 tokens : 3.534591194968553% similarity, with 562 matched token, and 15338 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "## Model validation for 16000 tokens : 3.5249999999999995% similarity, with 564 matched token, and 15436 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "###\r\n", "### Model validation end ###\r\n", "###\r\n" ] } ], "source": [ "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/v5-L6-D4096-E0_1-mem-ctx-8k.pth\" \"./logs/v5-L6-D4096-E0_1-16k.csv\" 4100 16000" ] } ], "metadata": { "kernelspec": { "display_name": "rwkv-infctx", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.10.12" }, "papermill": { "default_parameters": {}, "duration": 16222.341869, "end_time": "2023-09-06T00:28:46.417740", "environment_variables": {}, "exception": null, "input_path": "/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/Benchmark-V5.ipynb", "output_path": "/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/Benchmark-V5.ipynb", 
"parameters": {}, "start_time": "2023-09-05T19:58:24.075871", "version": "2.4.0" } }, "nbformat": 4, "nbformat_minor": 5 }