diff --git "a/experiment/memory-bench/Benchmark-V5.ipynb" "b/experiment/memory-bench/Benchmark-V5.ipynb" --- "a/experiment/memory-bench/Benchmark-V5.ipynb" +++ "b/experiment/memory-bench/Benchmark-V5.ipynb" @@ -2,13 +2,13 @@ "cells": [ { "cell_type": "markdown", - "id": "cf73c4cf", + "id": "541b2d35", "metadata": { "papermill": { - "duration": 0.004145, - "end_time": "2023-09-05T19:58:25.321223", + "duration": 0.00391, + "end_time": "2023-08-26T13:27:22.704411", "exception": false, - "start_time": "2023-09-05T19:58:25.317078", + "start_time": "2023-08-26T13:27:22.700501", "status": "completed" }, "tags": [] @@ -22,19 +22,19 @@ { "cell_type": "code", "execution_count": 1, - "id": "aaec4faf", + "id": "13ce0b66", "metadata": { "execution": { - "iopub.execute_input": "2023-09-05T19:58:25.330738Z", - "iopub.status.busy": "2023-09-05T19:58:25.330236Z", - "iopub.status.idle": "2023-09-05T20:04:41.032031Z", - "shell.execute_reply": "2023-09-05T20:04:41.030878Z" + "iopub.execute_input": "2023-08-26T13:27:22.713673Z", + "iopub.status.busy": "2023-08-26T13:27:22.712927Z", + "iopub.status.idle": "2023-08-26T13:30:39.555655Z", + "shell.execute_reply": "2023-08-26T13:30:39.554517Z" }, "papermill": { - "duration": 375.709392, - "end_time": "2023-09-05T20:04:41.034546", + "duration": 196.850037, + "end_time": "2023-08-26T13:30:39.558120", "exception": false, - "start_time": "2023-09-05T19:58:25.325154", + "start_time": "2023-08-26T13:27:22.708083", "status": "completed" }, "tags": [] @@ -44,28 +44,22 @@ "name": "stdout", "output_type": "stream", "text": [ - "--2023-09-05 19:58:25-- https://huggingface.co/picocreator/memory-size-experiment-for-rwkv/resolve/main/RWKV-v5-baseline/BaseV5-C-Tune5.pth\r\n", - "Resolving huggingface.co (huggingface.co)... 18.154.227.7, 18.154.227.67, 18.154.227.69, ...\r\n", + "--2023-08-26 13:27:23-- https://huggingface.co/picocreator/memory-size-experiment-for-rwkv/resolve/main/RWKV-v5-baseline/BaseV5-C-Tune5.pth\r\n", + "Resolving huggingface.co (huggingface.co)... 18.154.227.7, 18.154.227.69, 18.154.227.87, ...\r\n", "Connecting to huggingface.co (huggingface.co)|18.154.227.7|:443... connected.\r\n", "HTTP request sent, awaiting response... 302 Found\r\n", - "Location: https://cdn-lfs.huggingface.co/repos/cb/ef/cbef09abb2634a3375b28868bffa285226dfeabedec89b28c2fb302221164d66/c1f89b4d653a240f6f165d25988b51f6db36bf8a2388707e3e3242af751575eb?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27BaseV5-C-Tune5.pth%3B+filename%3D%22BaseV5-C-Tune5.pth%22%3B&Expires=1694203105&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzEwNX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy9jYi9lZi9jYmVmMDlhYmIyNjM0YTMzNzViMjg4NjhiZmZhMjg1MjI2ZGZlYWJlZGVjODliMjhjMmZiMzAyMjIxMTY0ZDY2L2MxZjg5YjRkNjUzYTI0MGY2ZjE2NWQyNTk4OGI1MWY2ZGIzNmJmOGEyMzg4NzA3ZTNlMzI0MmFmNzUxNTc1ZWI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=ykou8uLrNIvdiZlMOBKSa-TxcLOCLvMDjj9o4SZ5Vj1ovca53yzWCgEu7VINUQKO2GvnX4ivd153xcBlbnlzlCtGT96pIKOf6AT1KwcIthqxPj4SnMm7LaZOfOQPQ2HcRQjLRp9S-ThMRXwrniPe4iB4USdcqbP%7E3YnQRQ7YCnrqrEzF2A7SX8ubT-oNXDevc3Cj21BKYo6qlYuTK%7EMCChwgmcq7EX%7EeP%7E9I3A02TvxkM302k1m-Ex%7ERjA7k0Px9xUp0otVtDIir65Y0mMafarGbJIgtI3T-mQQRYyxn6pymYMLV5td%7EXExISwcje1-Gwsc4cLPgh8rrj7Kr9J2WZg__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", - "--2023-09-05 19:58:25-- https://cdn-lfs.huggingface.co/repos/cb/ef/cbef09abb2634a3375b28868bffa285226dfeabedec89b28c2fb302221164d66/c1f89b4d653a240f6f165d25988b51f6db36bf8a2388707e3e3242af751575eb?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27BaseV5-C-Tune5.pth%3B+filename%3D%22BaseV5-C-Tune5.pth%22%3B&Expires=1694203105&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzEwNX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy9jYi9lZi9jYmVmMDlhYmIyNjM0YTMzNzViMjg4NjhiZmZhMjg1MjI2ZGZlYWJlZGVjODliMjhjMmZiMzAyMjIxMTY0ZDY2L2MxZjg5YjRkNjUzYTI0MGY2ZjE2NWQyNTk4OGI1MWY2ZGIzNmJmOGEyMzg4NzA3ZTNlMzI0MmFmNzUxNTc1ZWI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=ykou8uLrNIvdiZlMOBKSa-TxcLOCLvMDjj9o4SZ5Vj1ovca53yzWCgEu7VINUQKO2GvnX4ivd153xcBlbnlzlCtGT96pIKOf6AT1KwcIthqxPj4SnMm7LaZOfOQPQ2HcRQjLRp9S-ThMRXwrniPe4iB4USdcqbP%7E3YnQRQ7YCnrqrEzF2A7SX8ubT-oNXDevc3Cj21BKYo6qlYuTK%7EMCChwgmcq7EX%7EeP%7E9I3A02TvxkM302k1m-Ex%7ERjA7k0Px9xUp0otVtDIir65Y0mMafarGbJIgtI3T-mQQRYyxn6pymYMLV5td%7EXExISwcje1-Gwsc4cLPgh8rrj7Kr9J2WZg__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", - "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.49, 108.138.64.111, 108.138.64.36, ...\r\n", - "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.49|:443... connected.\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "HTTP request sent, awaiting response... " + "Location: https://cdn-lfs.huggingface.co/repos/cb/ef/cbef09abb2634a3375b28868bffa285226dfeabedec89b28c2fb302221164d66/c1f89b4d653a240f6f165d25988b51f6db36bf8a2388707e3e3242af751575eb?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27BaseV5-C-Tune5.pth%3B+filename%3D%22BaseV5-C-Tune5.pth%22%3B&Expires=1693315643&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5MzMxNTY0M319LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy9jYi9lZi9jYmVmMDlhYmIyNjM0YTMzNzViMjg4NjhiZmZhMjg1MjI2ZGZlYWJlZGVjODliMjhjMmZiMzAyMjIxMTY0ZDY2L2MxZjg5YjRkNjUzYTI0MGY2ZjE2NWQyNTk4OGI1MWY2ZGIzNmJmOGEyMzg4NzA3ZTNlMzI0MmFmNzUxNTc1ZWI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=ziMFzO433qYsnTGI0xEqJgoCCxYDBIDL6BiUB8nY%7EUwhf8whZoVy%7E6kXBMldTd5DrWF1FBW-m%7EZ30YvJkMpWb282unhX6%7EInXiMnuT8KzIY8RmId7ttH21PN4yhomq6PQH5iM8hZq4rzmapJEyeRmDyBMJuHcDbXjYa%7EZonvxseG5TJACA3CIe8775U1sGNl2K8awoALSDKvpUJVIq86twhIdH38kCdQUrfRB52a6sX-xLHsGYpHUelYXtE9YcfajwTeg358Ds-ut4XP-we7vBLIusdR02y0MjvvyuWOIMLTI%7Ewq3OVRkY92Ks7HG7sk52iHWhH0x%7E12mvhQqM0Vzw__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", + "--2023-08-26 13:27:23-- https://cdn-lfs.huggingface.co/repos/cb/ef/cbef09abb2634a3375b28868bffa285226dfeabedec89b28c2fb302221164d66/c1f89b4d653a240f6f165d25988b51f6db36bf8a2388707e3e3242af751575eb?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27BaseV5-C-Tune5.pth%3B+filename%3D%22BaseV5-C-Tune5.pth%22%3B&Expires=1693315643&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5MzMxNTY0M319LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy9jYi9lZi9jYmVmMDlhYmIyNjM0YTMzNzViMjg4NjhiZmZhMjg1MjI2ZGZlYWJlZGVjODliMjhjMmZiMzAyMjIxMTY0ZDY2L2MxZjg5YjRkNjUzYTI0MGY2ZjE2NWQyNTk4OGI1MWY2ZGIzNmJmOGEyMzg4NzA3ZTNlMzI0MmFmNzUxNTc1ZWI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=ziMFzO433qYsnTGI0xEqJgoCCxYDBIDL6BiUB8nY%7EUwhf8whZoVy%7E6kXBMldTd5DrWF1FBW-m%7EZ30YvJkMpWb282unhX6%7EInXiMnuT8KzIY8RmId7ttH21PN4yhomq6PQH5iM8hZq4rzmapJEyeRmDyBMJuHcDbXjYa%7EZonvxseG5TJACA3CIe8775U1sGNl2K8awoALSDKvpUJVIq86twhIdH38kCdQUrfRB52a6sX-xLHsGYpHUelYXtE9YcfajwTeg358Ds-ut4XP-we7vBLIusdR02y0MjvvyuWOIMLTI%7Ewq3OVRkY92Ks7HG7sk52iHWhH0x%7E12mvhQqM0Vzw__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", + "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... " ] }, { "name": "stdout", "output_type": "stream", "text": [ - "200 OK\r\n", + "108.138.64.121, 108.138.64.111, 108.138.64.36, ...\r\n", + "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.121|:443... connected.\r\n", + "HTTP request sent, awaiting response... 200 OK\r\n", "Length: 6060483063 (5.6G) [binary/octet-stream]\r\n", "Saving to: ‘BaseV5-C-Tune5.pth’\r\n", "\r\n", @@ -78,7 +72,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 0%[ ] 15.26M 61.3MB/s " + "BaseV5-C-Tune5.pth 1%[ ] 73.21M 366MB/s " ] }, { @@ -86,7 +80,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 0%[ ] 30.52M 67.6MB/s " + "BaseV5-C-Tune5.pth 2%[ ] 146.94M 367MB/s " ] }, { @@ -94,7 +88,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 0%[ ] 45.78M 61.0MB/s " + "BaseV5-C-Tune5.pth 3%[ ] 220.93M 368MB/s " ] }, { @@ -102,7 +96,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 1%[ ] 60.52M 61.9MB/s " + "BaseV5-C-Tune5.pth 5%[> ] 295.39M 369MB/s " ] }, { @@ -110,7 +104,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 1%[ ] 61.03M 50.8MB/s " + "BaseV5-C-Tune5.pth 6%[> ] 369.07M 369MB/s " ] }, { @@ -118,7 +112,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 1%[ ] 76.41M 51.9MB/s " + "BaseV5-C-Tune5.pth 7%[> ] 442.84M 369MB/s " ] }, { @@ -126,7 +120,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 1%[ ] 91.55M 54.7MB/s " + "BaseV5-C-Tune5.pth 8%[> ] 515.57M 368MB/s " ] }, { @@ -134,7 +128,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 1%[ ] 106.29M 56.5MB/s " + "BaseV5-C-Tune5.pth 10%[=> ] 589.96M 369MB/s " ] }, { @@ -142,7 +136,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 1%[ ] 106.81M 51.3MB/s " + "BaseV5-C-Tune5.pth 11%[=> ] 665.46M 370MB/s " ] }, { @@ -150,7 +144,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 2%[ ] 122.07M 53.3MB/s " + "BaseV5-C-Tune5.pth 12%[=> ] 741.08M 371MB/s " ] }, { @@ -158,7 +152,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 2%[ ] 137.33M 51.5MB/s " + "BaseV5-C-Tune5.pth 14%[=> ] 816.99M 371MB/s " ] }, { @@ -166,7 +160,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 2%[ ] 152.59M 50.9MB/s eta 1m 51s " + "BaseV5-C-Tune5.pth 15%[==> ] 892.84M 372MB/s " ] }, { @@ -174,7 +168,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 2%[ ] 162.26M 50.7MB/s eta 1m 51s " + "BaseV5-C-Tune5.pth 16%[==> ] 969.40M 373MB/s " ] }, { @@ -182,7 +176,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 2%[ ] 167.85M 48.0MB/s eta 1m 51s " + "BaseV5-C-Tune5.pth 18%[==> ] 1.02G 373MB/s " ] }, { @@ -190,7 +184,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 3%[ ] 182.59M 48.0MB/s eta 1m 51s " + "BaseV5-C-Tune5.pth 19%[==> ] 1.09G 374MB/s eta 12s " ] }, { @@ -198,7 +192,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 3%[ ] 189.42M 47.3MB/s eta 1m 58s " + "BaseV5-C-Tune5.pth 20%[===> ] 1.17G 375MB/s eta 12s " ] }, { @@ -206,7 +200,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 3%[ ] 198.36M 46.6MB/s eta 1m 58s " + "BaseV5-C-Tune5.pth 22%[===> ] 1.24G 375MB/s eta 12s " ] }, { @@ -214,7 +208,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 3%[ ] 206.18M 45.3MB/s eta 1m 58s " + "BaseV5-C-Tune5.pth 23%[===> ] 1.32G 376MB/s eta 12s " ] }, { @@ -222,7 +216,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 3%[ ] 213.74M 43.4MB/s eta 1m 58s " + "BaseV5-C-Tune5.pth 24%[===> ] 1.39G 378MB/s eta 12s " ] }, { @@ -230,7 +224,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 3%[ ] 228.87M 43.3MB/s eta 1m 58s " + "BaseV5-C-Tune5.pth 26%[====> ] 1.47G 379MB/s eta 11s " ] }, { @@ -238,7 +232,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 4%[ ] 244.13M 43.2MB/s eta 1m 59s " + "BaseV5-C-Tune5.pth 27%[====> ] 1.55G 380MB/s eta 11s " ] }, { @@ -246,7 +240,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 4%[ ] 252.57M 42.5MB/s eta 1m 59s " + "BaseV5-C-Tune5.pth 28%[====> ] 1.63G 383MB/s eta 11s " ] }, { @@ -254,7 +248,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 4%[ ] 259.40M 42.0MB/s eta 1m 59s " + "BaseV5-C-Tune5.pth 30%[=====> ] 1.70G 384MB/s eta 11s " ] }, { @@ -262,7 +256,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 4%[ ] 282.07M 44.6MB/s eta 1m 59s " + "BaseV5-C-Tune5.pth 31%[=====> ] 1.78G 385MB/s eta 11s " ] }, { @@ -270,7 +264,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 5%[> ] 289.92M 43.5MB/s eta 1m 59s " + "BaseV5-C-Tune5.pth 32%[=====> ] 1.86G 386MB/s eta 10s " ] }, { @@ -278,7 +272,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 5%[> ] 305.18M 43.5MB/s eta 1m 59s " + "BaseV5-C-Tune5.pth 34%[=====> ] 1.93G 387MB/s eta 10s " ] }, { @@ -286,7 +280,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 5%[> ] 320.43M 42.4MB/s eta 1m 59s " + "BaseV5-C-Tune5.pth 35%[======> ] 2.01G 388MB/s eta 10s " ] }, { @@ -294,7 +288,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 5%[> ] 340.13M 45.8MB/s eta 1m 59s " + "BaseV5-C-Tune5.pth 36%[======> ] 2.07G 382MB/s eta 10s " ] }, { @@ -302,7 +296,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 6%[> ] 350.39M 46.0MB/s eta 1m 53s " + "BaseV5-C-Tune5.pth 37%[======> ] 2.14G 381MB/s eta 10s " ] }, { @@ -310,7 +304,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 6%[> ] 358.96M 46.4MB/s eta 1m 53s " + "BaseV5-C-Tune5.pth 39%[======> ] 2.21G 381MB/s eta 9s " ] }, { @@ -318,7 +312,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 6%[> ] 381.47M 50.1MB/s eta 1m 53s " + "BaseV5-C-Tune5.pth 40%[=======> ] 2.29G 381MB/s eta 9s " ] }, { @@ -326,7 +320,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 6%[> ] 396.73M 50.6MB/s eta 1m 53s " + "BaseV5-C-Tune5.pth 41%[=======> ] 2.36G 382MB/s eta 9s " ] }, { @@ -334,7 +328,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 7%[> ] 411.47M 53.5MB/s eta 1m 53s " + "BaseV5-C-Tune5.pth 43%[=======> ] 2.44G 383MB/s eta 9s " ] }, { @@ -342,7 +336,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 7%[> ] 416.17M 52.6MB/s eta 1m 49s " + "BaseV5-C-Tune5.pth 44%[=======> ] 2.51G 382MB/s eta 9s " ] }, { @@ -350,7 +344,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 7%[> ] 427.25M 52.3MB/s eta 1m 49s " + "BaseV5-C-Tune5.pth 45%[========> ] 2.59G 382MB/s eta 8s " ] }, { @@ -358,7 +352,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 7%[> ] 442.51M 51.7MB/s eta 1m 49s " + "BaseV5-C-Tune5.pth 47%[========> ] 2.67G 382MB/s eta 8s " ] }, { @@ -366,7 +360,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 7%[> ] 455.18M 53.4MB/s eta 1m 49s " + "BaseV5-C-Tune5.pth 48%[========> ] 2.74G 381MB/s eta 8s " ] }, { @@ -374,7 +368,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 7%[> ] 457.76M 51.2MB/s eta 1m 50s " + "BaseV5-C-Tune5.pth 49%[========> ] 2.82G 381MB/s eta 8s " ] }, { @@ -382,7 +376,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 8%[> ] 472.50M 54.1MB/s eta 1m 50s " + "BaseV5-C-Tune5.pth 51%[=========> ] 2.89G 381MB/s eta 8s " ] }, { @@ -390,7 +384,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 8%[> ] 476.21M 50.8MB/s eta 1m 50s " + "BaseV5-C-Tune5.pth 52%[=========> ] 2.97G 380MB/s eta 7s " ] }, { @@ -398,7 +392,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 8%[> ] 488.28M 50.2MB/s eta 1m 50s " + "BaseV5-C-Tune5.pth 53%[=========> ] 3.04G 380MB/s eta 7s " ] }, { @@ -406,7 +400,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 8%[> ] 502.28M 50.0MB/s eta 1m 50s " + "BaseV5-C-Tune5.pth 55%[==========> ] 3.12G 380MB/s eta 7s " ] }, { @@ -414,7 +408,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 9%[> ] 532.23M 54.6MB/s eta 1m 45s " + "BaseV5-C-Tune5.pth 56%[==========> ] 3.20G 385MB/s eta 7s " ] }, { @@ -422,7 +416,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 9%[> ] 540.75M 52.4MB/s eta 1m 45s " + "BaseV5-C-Tune5.pth 57%[==========> ] 3.27G 385MB/s eta 7s " ] }, { @@ -430,7 +424,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 9%[> ] 549.31M 54.1MB/s eta 1m 45s " + "BaseV5-C-Tune5.pth 59%[==========> ] 3.35G 388MB/s eta 6s " ] }, { @@ -438,7 +432,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 9%[> ] 564.58M 50.6MB/s eta 1m 45s " + "BaseV5-C-Tune5.pth 60%[===========> ] 3.42G 388MB/s eta 6s " ] }, { @@ -446,7 +440,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 10%[=> ] 579.31M 51.0MB/s eta 1m 45s " + "BaseV5-C-Tune5.pth 61%[===========> ] 3.50G 387MB/s eta 6s " ] }, { @@ -454,7 +448,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 10%[=> ] 593.27M 49.9MB/s eta 1m 44s " + "BaseV5-C-Tune5.pth 63%[===========> ] 3.57G 387MB/s eta 6s " ] }, { @@ -462,7 +456,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 10%[=> ] 610.35M 50.6MB/s eta 1m 44s " + "BaseV5-C-Tune5.pth 64%[===========> ] 3.65G 387MB/s eta 6s " ] }, { @@ -470,7 +464,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 10%[=> ] 625.61M 53.3MB/s eta 1m 44s " + "BaseV5-C-Tune5.pth 65%[============> ] 3.72G 387MB/s eta 5s " ] }, { @@ -478,7 +472,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 10%[=> ] 635.17M 53.9MB/s eta 1m 44s " + "BaseV5-C-Tune5.pth 67%[============> ] 3.80G 387MB/s eta 5s " ] }, { @@ -486,7 +480,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 11%[=> ] 640.87M 50.4MB/s eta 1m 44s " + "BaseV5-C-Tune5.pth 68%[============> ] 3.88G 387MB/s eta 5s " ] }, { @@ -494,7 +488,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 11%[=> ] 656.13M 51.3MB/s eta 1m 44s " + "BaseV5-C-Tune5.pth 70%[=============> ] 3.95G 387MB/s eta 5s " ] }, { @@ -502,7 +496,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 11%[=> ] 670.87M 50.0MB/s eta 1m 44s " + "BaseV5-C-Tune5.pth 71%[=============> ] 4.03G 387MB/s eta 5s " ] }, { @@ -510,7 +504,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 11%[=> ] 684.82M 53.1MB/s eta 1m 44s " + "BaseV5-C-Tune5.pth 72%[=============> ] 4.08G 379MB/s eta 4s " ] }, { @@ -518,7 +512,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 11%[=> ] 686.64M 49.2MB/s eta 1m 45s " + "BaseV5-C-Tune5.pth 72%[=============> ] 4.10G 362MB/s eta 4s " ] }, { @@ -526,7 +520,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 12%[=> ] 701.39M 51.6MB/s eta 1m 45s " + "BaseV5-C-Tune5.pth 74%[=============> ] 4.18G 362MB/s eta 4s " ] }, { @@ -534,7 +528,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 12%[=> ] 717.16M 48.9MB/s eta 1m 45s " + "BaseV5-C-Tune5.pth 75%[==============> ] 4.25G 362MB/s eta 4s " ] }, { @@ -542,7 +536,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 12%[=> ] 732.42M 47.2MB/s eta 1m 45s " + "BaseV5-C-Tune5.pth 76%[==============> ] 4.33G 362MB/s eta 4s " ] }, { @@ -550,7 +544,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 12%[=> ] 747.69M 46.6MB/s eta 1m 43s " + "BaseV5-C-Tune5.pth 78%[==============> ] 4.41G 363MB/s eta 3s " ] }, { @@ -558,7 +552,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 13%[=> ] 762.94M 47.2MB/s eta 1m 43s " + "BaseV5-C-Tune5.pth 79%[==============> ] 4.48G 363MB/s eta 3s " ] }, { @@ -566,7 +560,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 13%[=> ] 767.13M 44.7MB/s eta 1m 43s " + "BaseV5-C-Tune5.pth 80%[===============> ] 4.55G 361MB/s eta 3s " ] }, { @@ -574,7 +568,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 13%[=> ] 778.20M 45.5MB/s eta 1m 43s " + "BaseV5-C-Tune5.pth 81%[===============> ] 4.60G 352MB/s eta 3s " ] }, { @@ -582,7 +576,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 13%[=> ] 791.63M 46.0MB/s eta 1m 43s " + "BaseV5-C-Tune5.pth 82%[===============> ] 4.67G 351MB/s eta 3s " ] }, { @@ -590,7 +584,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 13%[=> ] 793.46M 42.8MB/s eta 1m 43s " + "BaseV5-C-Tune5.pth 84%[===============> ] 4.75G 351MB/s eta 2s " ] }, { @@ -598,7 +592,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 13%[=> ] 808.71M 41.9MB/s eta 1m 43s " + "BaseV5-C-Tune5.pth 85%[================> ] 4.83G 352MB/s eta 2s " ] }, { @@ -606,7 +600,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 14%[=> ] 823.97M 42.7MB/s eta 1m 43s " + "BaseV5-C-Tune5.pth 86%[================> ] 4.90G 351MB/s eta 2s " ] }, { @@ -614,7 +608,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 14%[=> ] 839.23M 43.7MB/s eta 1m 43s " + "BaseV5-C-Tune5.pth 88%[================> ] 4.98G 352MB/s eta 2s " ] }, { @@ -622,7 +616,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 14%[=> ] 853.98M 44.2MB/s eta 1m 42s " + "BaseV5-C-Tune5.pth 89%[================> ] 5.05G 352MB/s eta 2s " ] }, { @@ -630,7 +624,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 15%[==> ] 869.24M 45.9MB/s eta 1m 42s " + "BaseV5-C-Tune5.pth 90%[=================> ] 5.13G 353MB/s eta 1s " ] }, { @@ -638,7 +632,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 15%[==> ] 882.01M 45.5MB/s eta 1m 42s " + "BaseV5-C-Tune5.pth 92%[=================> ] 5.21G 372MB/s eta 1s " ] }, { @@ -646,7 +640,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 15%[==> ] 885.01M 46.0MB/s eta 1m 42s " + "BaseV5-C-Tune5.pth 93%[=================> ] 5.28G 377MB/s eta 1s " ] }, { @@ -654,7 +648,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 15%[==> ] 899.75M 46.5MB/s eta 1m 42s " + "BaseV5-C-Tune5.pth 94%[=================> ] 5.36G 377MB/s eta 1s " ] }, { @@ -662,7 +656,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 15%[==> ] 915.01M 44.4MB/s eta 1m 41s " + "BaseV5-C-Tune5.pth 96%[==================> ] 5.44G 378MB/s eta 1s " ] }, { @@ -670,7 +664,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 16%[==> ] 930.27M 46.6MB/s eta 1m 41s " + "BaseV5-C-Tune5.pth 97%[==================> ] 5.51G 378MB/s eta 0s " ] }, { @@ -678,7 +672,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 16%[==> ] 939.22M 45.3MB/s eta 1m 41s " + "BaseV5-C-Tune5.pth 99%[==================> ] 5.59G 377MB/s eta 0s " ] }, { @@ -686,31 +680,43 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 16%[==> ] 946.04M 44.1MB/s eta 1m 41s " + "BaseV5-C-Tune5.pth 100%[===================>] 5.64G 377MB/s in 15s \r\n", + "\r\n", + "2023-08-26 13:27:38 (377 MB/s) - ‘BaseV5-C-Tune5.pth’ saved [6060483063/6060483063]\r\n", + "\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "BaseV5-C-Tune5.pth 16%[==> ] 961.30M 44.8MB/s eta 1m 41s " + "--2023-08-26 13:27:38-- https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/EWR-1B5-E0_1-mem-ctx-8k.pth\r\n", + "Resolving huggingface.co (huggingface.co)... 18.154.227.7, 18.154.227.87, 18.154.227.69, ...\r\n", + "Connecting to huggingface.co (huggingface.co)|18.154.227.7|:443... connected.\r\n", + "HTTP request sent, awaiting response... 302 Found\r\n", + "Location: https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/e886ffafd5148b502a00b1c10c847ca918cec61c4c956956a2fe9811c210029b?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27EWR-1B5-E0_1-mem-ctx-8k.pth%3B+filename%3D%22EWR-1B5-E0_1-mem-ctx-8k.pth%22%3B&Expires=1693315658&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5MzMxNTY1OH19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwL2U4ODZmZmFmZDUxNDhiNTAyYTAwYjFjMTBjODQ3Y2E5MThjZWM2MWM0Yzk1Njk1NmEyZmU5ODExYzIxMDAyOWI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=uku0uUHXaL19jduBgCuGdQVstpytTc2QSL0CxF3ZbE%7E3KoqpZgFWx1DJLuTk7pRnrXBNW-0cOp2MV-WONmJU7VmZvSwnbX6o3FCRpQ6xTneRWKmWXa1%7E73xUgwvg7tzs32tkYbOPkHjJXsHTZD1Pbceks1qp-brKKR58sOX%7EaB2aUPZwBgM15qjmy5fgPzyK8UgDTQ27%7EJAXtzIP8tS73n0hIaaePD1aItyVcNGs2nu4Cq6fEIfGJgvcitTm9rsLy8kUO6J6JwHrWon3PR-H5yIol5F2rVjtbmv-V9lJHq-5i1a2f%7E4AV3GlSzQ2TlOqPpExnfoeteDBPlFtzNj5%7EA__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", + "--2023-08-26 13:27:38-- https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/e886ffafd5148b502a00b1c10c847ca918cec61c4c956956a2fe9811c210029b?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27EWR-1B5-E0_1-mem-ctx-8k.pth%3B+filename%3D%22EWR-1B5-E0_1-mem-ctx-8k.pth%22%3B&Expires=1693315658&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5MzMxNTY1OH19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwL2U4ODZmZmFmZDUxNDhiNTAyYTAwYjFjMTBjODQ3Y2E5MThjZWM2MWM0Yzk1Njk1NmEyZmU5ODExYzIxMDAyOWI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=uku0uUHXaL19jduBgCuGdQVstpytTc2QSL0CxF3ZbE%7E3KoqpZgFWx1DJLuTk7pRnrXBNW-0cOp2MV-WONmJU7VmZvSwnbX6o3FCRpQ6xTneRWKmWXa1%7E73xUgwvg7tzs32tkYbOPkHjJXsHTZD1Pbceks1qp-brKKR58sOX%7EaB2aUPZwBgM15qjmy5fgPzyK8UgDTQ27%7EJAXtzIP8tS73n0hIaaePD1aItyVcNGs2nu4Cq6fEIfGJgvcitTm9rsLy8kUO6J6JwHrWon3PR-H5yIol5F2rVjtbmv-V9lJHq-5i1a2f%7E4AV3GlSzQ2TlOqPpExnfoeteDBPlFtzNj5%7EA__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", + "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.49, 108.138.64.36, 108.138.64.111, ...\r\n", + "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.49|:443... connected.\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "BaseV5-C-Tune5.pth 16%[==> ] 976.55M 46.2MB/s eta 1m 41s " + "HTTP request sent, awaiting response... " ] }, { "name": "stdout", "output_type": "stream", "text": [ + "200 OK\r\n", + "Length: 6060483163 (5.6G) [binary/octet-stream]\r\n", + "Saving to: ‘EWR-1B5-E0_1-mem-ctx-8k.pth’\r\n", + "\r\n", "\r", - "BaseV5-C-Tune5.pth 17%[==> ] 991.82M 46.6MB/s eta 1m 41s " + " EWR-1B5-E 0%[ ] 0 --.-KB/s " ] }, { @@ -718,7 +724,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 17%[==> ] 1007M 46.9MB/s eta 1m 41s " + " EWR-1B5-E0 0%[ ] 15.26M 48.0MB/s " ] }, { @@ -726,7 +732,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 17%[==> ] 1007M 46.0MB/s eta 1m 40s " + " EWR-1B5-E0_ 0%[ ] 30.52M 47.4MB/s " ] }, { @@ -734,7 +740,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 17%[==> ] 1022M 46.5MB/s eta 1m 40s " + " EWR-1B5-E0_1 0%[ ] 45.78M 52.5MB/s " ] }, { @@ -742,7 +748,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 17%[==> ] 1.01G 46.2MB/s eta 1m 40s " + " EWR-1B5-E0_1- 1%[ ] 61.03M 53.0MB/s " ] }, { @@ -750,7 +756,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 18%[==> ] 1.03G 45.1MB/s eta 1m 40s " + " EWR-1B5-E0_1-m 1%[ ] 76.29M 54.5MB/s " ] }, { @@ -758,7 +764,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 18%[==> ] 1.04G 47.6MB/s eta 98s " + " EWR-1B5-E0_1-me 1%[ ] 91.55M 54.1MB/s " ] }, { @@ -766,7 +772,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 18%[==> ] 1.04G 45.0MB/s eta 98s " + " EWR-1B5-E0_1-mem 1%[ ] 106.29M 55.8MB/s " ] }, { @@ -774,7 +780,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 18%[==> ] 1.06G 45.5MB/s eta 98s " + " EWR-1B5-E0_1-mem- 2%[ ] 119.78M 56.9MB/s " ] }, { @@ -782,7 +788,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 18%[==> ] 1.06G 43.5MB/s eta 98s " + " EWR-1B5-E0_1-mem-c 2%[ ] 136.81M 58.2MB/s " ] }, { @@ -790,7 +796,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 19%[==> ] 1.07G 43.7MB/s eta 99s " + "EWR-1B5-E0_1-mem-ct 2%[ ] 152.59M 58.4MB/s " ] }, { @@ -798,7 +804,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 19%[==> ] 1.09G 43.7MB/s eta 99s " + "WR-1B5-E0_1-mem-ctx 2%[ ] 167.85M 58.2MB/s " ] }, { @@ -806,7 +812,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 19%[==> ] 1.09G 42.9MB/s eta 99s " + "R-1B5-E0_1-mem-ctx- 3%[ ] 188.29M 61.0MB/s eta 92s " ] }, { @@ -814,7 +820,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 19%[==> ] 1.10G 41.8MB/s eta 99s " + "-1B5-E0_1-mem-ctx-8 3%[ ] 197.85M 59.8MB/s eta 92s " ] }, { @@ -822,7 +828,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 19%[==> ] 1.12G 43.0MB/s eta 99s " + "1B5-E0_1-mem-ctx-8k 3%[ ] 198.49M 55.4MB/s eta 92s " ] }, { @@ -830,7 +836,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 19%[==> ] 1.12G 39.4MB/s eta 99s " + "B5-E0_1-mem-ctx-8k. 3%[ ] 213.62M 55.5MB/s eta 92s " ] }, { @@ -838,7 +844,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 20%[===> ] 1.13G 41.5MB/s eta 99s " + "5-E0_1-mem-ctx-8k.p 4%[ ] 243.63M 59.3MB/s eta 93s " ] }, { @@ -846,7 +852,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 20%[===> ] 1.15G 40.3MB/s eta 99s " + "-E0_1-mem-ctx-8k.pt 4%[ ] 256.89M 58.3MB/s eta 93s " ] }, { @@ -854,7 +860,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 20%[===> ] 1.16G 39.5MB/s eta 99s " + "E0_1-mem-ctx-8k.pth 4%[ ] 259.40M 56.3MB/s eta 93s " ] }, { @@ -862,7 +868,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 20%[===> ] 1.17G 38.3MB/s eta 99s " + "0_1-mem-ctx-8k.pth 4%[ ] 274.52M 58.9MB/s eta 93s " ] }, { @@ -870,7 +876,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 20%[===> ] 1.18G 40.2MB/s eta 99s " + "_1-mem-ctx-8k.pth 5%[> ] 289.40M 58.6MB/s eta 93s " ] }, { @@ -878,7 +884,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 21%[===> ] 1.19G 40.4MB/s eta 99s " + "1-mem-ctx-8k.pth 5%[> ] 304.66M 59.7MB/s eta 94s " ] }, { @@ -886,7 +892,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 21%[===> ] 1.21G 39.5MB/s eta 98s " + "-mem-ctx-8k.pth 5%[> ] 320.43M 59.6MB/s eta 94s " ] }, { @@ -894,7 +900,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 21%[===> ] 1.22G 41.4MB/s eta 98s " + "mem-ctx-8k.pth 5%[> ] 328.90M 58.2MB/s eta 94s " ] }, { @@ -902,7 +908,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 21%[===> ] 1.24G 41.9MB/s eta 98s " + "em-ctx-8k.pth 6%[> ] 350.44M 62.2MB/s eta 94s " ] }, { @@ -910,7 +916,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 22%[===> ] 1.25G 42.6MB/s eta 98s " + "m-ctx-8k.pth 6%[> ] 365.70M 60.4MB/s eta 92s " ] }, { @@ -918,7 +924,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 22%[===> ] 1.27G 44.5MB/s eta 96s " + "-ctx-8k.pth 6%[> ] 378.57M 59.1MB/s eta 92s " ] }, { @@ -926,7 +932,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 22%[===> ] 1.28G 43.6MB/s eta 96s " + "ctx-8k.pth 6%[> ] 381.47M 56.2MB/s eta 92s " ] }, { @@ -934,7 +940,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 22%[===> ] 1.29G 46.3MB/s eta 96s " + "tx-8k.pth 6%[> ] 396.73M 54.2MB/s eta 92s " ] }, { @@ -942,7 +948,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 23%[===> ] 1.30G 45.9MB/s eta 96s " + "x-8k.pth 7%[> ] 412.11M 57.5MB/s eta 92s " ] }, { @@ -950,7 +956,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 23%[===> ] 1.30G 44.5MB/s eta 96s " + "-8k.pth 7%[> ] 429.56M 60.0MB/s eta 92s " ] }, { @@ -958,7 +964,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 23%[===> ] 1.31G 44.9MB/s eta 96s " + "8k.pth 7%[> ] 442.51M 60.2MB/s eta 92s " ] }, { @@ -966,7 +972,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 23%[===> ] 1.31G 39.0MB/s eta 96s " + "k.pth 7%[> ] 455.93M 58.7MB/s eta 92s " ] }, { @@ -974,7 +980,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 23%[===> ] 1.31G 38.1MB/s eta 96s " + ".pth 7%[> ] 459.83M 55.8MB/s eta 92s " ] }, { @@ -982,7 +988,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 23%[===> ] 1.33G 38.3MB/s eta 98s " + "pth 8%[> ] 473.02M 53.8MB/s eta 92s " ] }, { @@ -990,7 +996,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 23%[===> ] 1.34G 38.9MB/s eta 98s " + "th 8%[> ] 488.28M 56.0MB/s eta 94s " ] }, { @@ -998,7 +1004,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 24%[===> ] 1.37G 41.1MB/s eta 98s " + "h 8%[> ] 503.54M 55.2MB/s eta 94s " ] }, { @@ -1006,7 +1012,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 24%[===> ] 1.37G 39.7MB/s eta 98s " + " 9%[> ] 524.76M 56.2MB/s eta 94s " ] }, { @@ -1014,7 +1020,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 24%[===> ] 1.39G 39.7MB/s eta 96s " + " E 9%[> ] 548.80M 61.4MB/s eta 94s " ] }, { @@ -1022,7 +1028,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 24%[===> ] 1.40G 38.1MB/s eta 96s " + " EW 9%[> ] 557.00M 58.1MB/s eta 94s " ] }, { @@ -1030,7 +1036,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 25%[====> ] 1.42G 37.7MB/s eta 96s " + " EWR 9%[> ] 564.84M 58.3MB/s eta 90s " ] }, { @@ -1038,7 +1044,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 25%[====> ] 1.43G 36.2MB/s eta 95s " + " EWR- 10%[=> ] 580.87M 58.5MB/s eta 90s " ] }, { @@ -1046,7 +1052,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 25%[====> ] 1.44G 38.6MB/s eta 95s " + " EWR-1 10%[=> ] 595.69M 57.2MB/s eta 90s " ] }, { @@ -1054,7 +1060,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 25%[====> ] 1.45G 35.3MB/s eta 95s " + " EWR-1B 10%[=> ] 608.90M 59.8MB/s eta 90s " ] }, { @@ -1062,7 +1068,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 25%[====> ] 1.46G 37.0MB/s eta 95s " + " EWR-1B5 10%[=> ] 621.86M 58.7MB/s eta 90s " ] }, { @@ -1070,7 +1076,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 26%[====> ] 1.47G 39.6MB/s eta 94s " + " EWR-1B5- 11%[=> ] 640.87M 62.3MB/s eta 87s " ] }, { @@ -1078,7 +1084,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 26%[====> ] 1.48G 40.5MB/s eta 94s " + " EWR-1B5-E 11%[=> ] 656.13M 61.3MB/s eta 87s " ] }, { @@ -1086,7 +1092,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 26%[====> ] 1.49G 41.8MB/s eta 94s " + " EWR-1B5-E0 11%[=> ] 671.38M 61.1MB/s eta 87s " ] }, { @@ -1094,7 +1100,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 26%[====> ] 1.50G 44.1MB/s eta 94s " + " EWR-1B5-E0_ 11%[=> ] 686.13M 61.7MB/s eta 87s " ] }, { @@ -1102,7 +1108,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 26%[====> ] 1.51G 45.6MB/s eta 94s " + " EWR-1B5-E0_1 12%[=> ] 700.08M 62.2MB/s eta 87s " ] }, { @@ -1110,7 +1116,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 26%[====> ] 1.52G 45.4MB/s eta 93s " + " EWR-1B5-E0_1- 12%[=> ] 716.64M 61.7MB/s eta 87s " ] }, { @@ -1118,7 +1124,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 27%[====> ] 1.53G 44.7MB/s eta 93s " + " EWR-1B5-E0_1-m 12%[=> ] 732.42M 63.1MB/s eta 87s " ] }, { @@ -1126,7 +1132,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 27%[====> ] 1.54G 41.4MB/s eta 93s " + " EWR-1B5-E0_1-me 12%[=> ] 748.05M 62.9MB/s eta 87s " ] }, { @@ -1134,7 +1140,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 27%[====> ] 1.55G 40.4MB/s eta 93s " + " EWR-1B5-E0_1-mem 13%[=> ] 762.94M 62.3MB/s eta 87s " ] }, { @@ -1142,7 +1148,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 27%[====> ] 1.56G 40.5MB/s eta 93s " + " EWR-1B5-E0_1-mem- 13%[=> ] 778.20M 61.8MB/s eta 85s " ] }, { @@ -1150,7 +1156,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 28%[====> ] 1.59G 44.7MB/s eta 91s " + " EWR-1B5-E0_1-mem-c 13%[=> ] 805.10M 65.5MB/s eta 85s " ] }, { @@ -1158,7 +1164,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 28%[====> ] 1.59G 44.2MB/s eta 91s " + "EWR-1B5-E0_1-mem-ct 13%[=> ] 808.71M 63.9MB/s eta 85s " ] }, { @@ -1166,7 +1172,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 28%[====> ] 1.60G 43.1MB/s eta 91s " + "WR-1B5-E0_1-mem-ctx 14%[=> ] 823.46M 63.6MB/s eta 85s " ] }, { @@ -1174,7 +1180,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 28%[====> ] 1.61G 43.4MB/s eta 91s " + "R-1B5-E0_1-mem-ctx- 14%[=> ] 838.71M 62.6MB/s eta 85s " ] }, { @@ -1182,7 +1188,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 28%[====> ] 1.62G 45.2MB/s eta 91s " + "-1B5-E0_1-mem-ctx-8 14%[=> ] 854.49M 63.7MB/s eta 83s " ] }, { @@ -1190,7 +1196,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 29%[====> ] 1.64G 46.1MB/s eta 90s " + "1B5-E0_1-mem-ctx-8k 14%[=> ] 863.43M 58.8MB/s eta 83s " ] }, { @@ -1198,7 +1204,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 29%[====> ] 1.65G 45.3MB/s eta 90s " + "B5-E0_1-mem-ctx-8k. 15%[==> ] 869.75M 59.2MB/s eta 83s " ] }, { @@ -1206,7 +1212,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 29%[====> ] 1.65G 42.5MB/s eta 90s " + "5-E0_1-mem-ctx-8k.p 15%[==> ] 895.53M 61.7MB/s eta 83s " ] }, { @@ -1214,7 +1220,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 29%[====> ] 1.66G 41.6MB/s eta 90s " + "-E0_1-mem-ctx-8k.pt 15%[==> ] 912.72M 63.1MB/s eta 83s " ] }, { @@ -1222,7 +1228,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 29%[====> ] 1.67G 40.0MB/s eta 90s " + "E0_1-mem-ctx-8k.pth 16%[==> ] 930.27M 64.0MB/s eta 80s " ] }, { @@ -1230,7 +1236,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 29%[====> ] 1.68G 43.1MB/s eta 90s " + "0_1-mem-ctx-8k.pth 16%[==> ] 946.04M 65.8MB/s eta 80s " ] }, { @@ -1238,7 +1244,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 30%[=====> ] 1.70G 42.7MB/s eta 90s " + "_1-mem-ctx-8k.pth 16%[==> ] 976.55M 70.6MB/s eta 80s " ] }, { @@ -1246,7 +1252,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 30%[=====> ] 1.71G 45.1MB/s eta 90s " + "1-mem-ctx-8k.pth 17%[==> ] 991.82M 70.7MB/s eta 80s " ] }, { @@ -1254,7 +1260,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 30%[=====> ] 1.72G 44.8MB/s eta 90s " + "-mem-ctx-8k.pth 17%[==> ] 1007M 69.5MB/s eta 78s " ] }, { @@ -1262,7 +1268,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 30%[=====> ] 1.73G 46.3MB/s eta 89s " + "mem-ctx-8k.pth 17%[==> ] 1013M 67.1MB/s eta 78s " ] }, { @@ -1270,7 +1276,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 30%[=====> ] 1.74G 47.4MB/s eta 89s " + "em-ctx-8k.pth 17%[==> ] 1022M 65.3MB/s eta 78s " ] }, { @@ -1278,7 +1284,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 31%[=====> ] 1.76G 47.1MB/s eta 89s " + "m-ctx-8k.pth 18%[==> ] 1.02G 67.6MB/s eta 78s " ] }, { @@ -1286,7 +1292,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 31%[=====> ] 1.77G 44.3MB/s eta 89s " + "-ctx-8k.pth 18%[==> ] 1.03G 62.7MB/s eta 78s " ] }, { @@ -1294,7 +1300,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 31%[=====> ] 1.79G 46.4MB/s eta 87s " + "ctx-8k.pth 18%[==> ] 1.05G 64.9MB/s eta 77s " ] }, { @@ -1302,7 +1308,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 31%[=====> ] 1.79G 45.9MB/s eta 87s " + "tx-8k.pth 18%[==> ] 1.06G 66.9MB/s eta 77s " ] }, { @@ -1310,7 +1316,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 31%[=====> ] 1.80G 45.3MB/s eta 87s " + "x-8k.pth 18%[==> ] 1.07G 67.2MB/s eta 77s " ] }, { @@ -1318,7 +1324,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 32%[=====> ] 1.82G 44.6MB/s eta 87s " + "-8k.pth 19%[==> ] 1.08G 63.0MB/s eta 77s " ] }, { @@ -1326,7 +1332,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 32%[=====> ] 1.82G 43.9MB/s eta 86s " + "8k.pth 19%[==> ] 1.09G 64.2MB/s eta 77s " ] }, { @@ -1334,7 +1340,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 32%[=====> ] 1.83G 43.5MB/s eta 86s " + "k.pth 19%[==> ] 1.10G 63.7MB/s eta 77s " ] }, { @@ -1342,7 +1348,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 32%[=====> ] 1.85G 42.9MB/s eta 86s " + ".pth 19%[==> ] 1.12G 62.6MB/s eta 77s " ] }, { @@ -1350,7 +1356,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 32%[=====> ] 1.86G 45.9MB/s eta 86s " + "pth 20%[===> ] 1.13G 61.6MB/s eta 77s " ] }, { @@ -1358,7 +1364,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 32%[=====> ] 1.86G 46.2MB/s eta 86s " + "th 20%[===> ] 1.15G 61.3MB/s eta 77s " ] }, { @@ -1366,7 +1372,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 33%[=====> ] 1.86G 45.2MB/s eta 86s " + "h 20%[===> ] 1.16G 60.6MB/s eta 77s " ] }, { @@ -1374,7 +1380,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 33%[=====> ] 1.88G 45.5MB/s eta 86s " + " 20%[===> ] 1.18G 58.5MB/s eta 76s " ] }, { @@ -1382,7 +1388,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 33%[=====> ] 1.89G 45.2MB/s eta 86s " + " E 21%[===> ] 1.19G 58.3MB/s eta 76s " ] }, { @@ -1390,7 +1396,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 33%[=====> ] 1.91G 47.1MB/s eta 86s " + " EW 21%[===> ] 1.21G 59.0MB/s eta 76s " ] }, { @@ -1398,7 +1404,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 34%[=====> ] 1.92G 46.0MB/s eta 84s " + " EWR 21%[===> ] 1.22G 58.0MB/s eta 76s " ] }, { @@ -1406,7 +1412,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 34%[=====> ] 1.94G 45.8MB/s eta 84s " + " EWR- 22%[===> ] 1.25G 62.4MB/s eta 76s " ] }, { @@ -1414,7 +1420,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 34%[=====> ] 1.95G 45.3MB/s eta 84s " + " EWR-1 22%[===> ] 1.25G 61.8MB/s eta 74s " ] }, { @@ -1422,7 +1428,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 34%[=====> ] 1.97G 45.7MB/s eta 84s " + " EWR-1B 22%[===> ] 1.27G 59.8MB/s eta 74s " ] }, { @@ -1430,7 +1436,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 35%[======> ] 1.98G 46.2MB/s eta 82s " + " EWR-1B5 22%[===> ] 1.27G 57.5MB/s eta 74s " ] }, { @@ -1438,7 +1444,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 35%[======> ] 1.98G 45.6MB/s eta 82s " + " EWR-1B5- 22%[===> ] 1.28G 58.3MB/s eta 74s " ] }, { @@ -1446,7 +1452,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 35%[======> ] 2.00G 43.6MB/s eta 82s " + " EWR-1B5-E 22%[===> ] 1.30G 58.0MB/s eta 74s " ] }, { @@ -1454,7 +1460,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 35%[======> ] 2.01G 44.9MB/s eta 82s " + " EWR-1B5-E0 23%[===> ] 1.31G 57.3MB/s eta 74s " ] }, { @@ -1462,7 +1468,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 35%[======> ] 2.02G 44.0MB/s eta 82s " + " EWR-1B5-E0_ 23%[===> ] 1.32G 57.0MB/s eta 74s " ] }, { @@ -1470,7 +1476,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 36%[======> ] 2.04G 46.1MB/s eta 82s " + " EWR-1B5-E0_1 23%[===> ] 1.33G 56.8MB/s eta 74s " ] }, { @@ -1478,7 +1484,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 36%[======> ] 2.04G 44.6MB/s eta 82s " + " EWR-1B5-E0_1- 23%[===> ] 1.34G 55.8MB/s eta 74s " ] }, { @@ -1486,7 +1492,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 36%[======> ] 2.06G 46.8MB/s eta 81s " + " EWR-1B5-E0_1-m 23%[===> ] 1.34G 55.4MB/s eta 74s " ] }, { @@ -1494,7 +1500,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 36%[======> ] 2.07G 47.3MB/s eta 81s " + " EWR-1B5-E0_1-me 24%[===> ] 1.36G 56.5MB/s eta 74s " ] }, { @@ -1502,7 +1508,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 36%[======> ] 2.08G 45.3MB/s eta 81s " + " EWR-1B5-E0_1-mem 24%[===> ] 1.37G 54.5MB/s eta 74s " ] }, { @@ -1510,7 +1516,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 37%[======> ] 2.10G 48.0MB/s eta 81s " + " EWR-1B5-E0_1-mem- 24%[===> ] 1.39G 53.5MB/s eta 74s " ] }, { @@ -1518,7 +1524,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 37%[======> ] 2.12G 45.6MB/s eta 80s " + " EWR-1B5-E0_1-mem-c 24%[===> ] 1.40G 52.8MB/s eta 74s " ] }, { @@ -1526,7 +1532,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 37%[======> ] 2.12G 42.9MB/s eta 80s " + "EWR-1B5-E0_1-mem-ct 24%[===> ] 1.40G 49.1MB/s eta 74s " ] }, { @@ -1534,7 +1540,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 37%[======> ] 2.13G 40.2MB/s eta 80s " + "WR-1B5-E0_1-mem-ctx 25%[====> ] 1.42G 49.6MB/s eta 74s " ] }, { @@ -1542,7 +1548,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 37%[======> ] 2.13G 39.4MB/s eta 80s " + "R-1B5-E0_1-mem-ctx- 25%[====> ] 1.43G 50.7MB/s eta 74s " ] }, { @@ -1550,7 +1556,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 38%[======> ] 2.15G 40.5MB/s eta 80s " + "-1B5-E0_1-mem-ctx-8 25%[====> ] 1.45G 51.7MB/s eta 74s " ] }, { @@ -1558,7 +1564,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 38%[======> ] 2.16G 39.9MB/s eta 80s " + "1B5-E0_1-mem-ctx-8k 25%[====> ] 1.47G 51.5MB/s eta 74s " ] }, { @@ -1566,7 +1572,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 38%[======> ] 2.17G 43.0MB/s eta 80s " + "B5-E0_1-mem-ctx-8k. 26%[====> ] 1.47G 52.0MB/s eta 72s " ] }, { @@ -1574,7 +1580,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 38%[======> ] 2.18G 40.1MB/s eta 80s " + "5-E0_1-mem-ctx-8k.p 26%[====> ] 1.49G 55.0MB/s eta 72s " ] }, { @@ -1582,7 +1588,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 38%[======> ] 2.19G 42.6MB/s eta 80s " + "-E0_1-mem-ctx-8k.pt 26%[====> ] 1.50G 53.3MB/s eta 72s " ] }, { @@ -1590,7 +1596,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 39%[======> ] 2.21G 44.4MB/s eta 78s " + "E0_1-mem-ctx-8k.pth 26%[====> ] 1.51G 50.7MB/s eta 72s " ] }, { @@ -1598,7 +1604,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 39%[======> ] 2.21G 42.6MB/s eta 78s " + "0_1-mem-ctx-8k.pth 27%[====> ] 1.53G 53.3MB/s eta 71s " ] }, { @@ -1606,7 +1612,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 39%[======> ] 2.22G 41.0MB/s eta 78s " + "_1-mem-ctx-8k.pth 27%[====> ] 1.54G 53.8MB/s eta 71s " ] }, { @@ -1614,7 +1620,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 39%[======> ] 2.23G 42.1MB/s eta 78s " + "1-mem-ctx-8k.pth 27%[====> ] 1.57G 56.2MB/s eta 71s " ] }, { @@ -1622,7 +1628,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 39%[======> ] 2.23G 39.8MB/s eta 78s " + "-mem-ctx-8k.pth 27%[====> ] 1.57G 56.5MB/s eta 71s " ] }, { @@ -1630,7 +1636,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 39%[======> ] 2.25G 41.5MB/s eta 77s " + "mem-ctx-8k.pth 28%[====> ] 1.59G 56.8MB/s eta 71s " ] }, { @@ -1638,7 +1644,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 39%[======> ] 2.25G 40.6MB/s eta 77s " + "em-ctx-8k.pth 28%[====> ] 1.60G 58.8MB/s eta 70s " ] }, { @@ -1646,7 +1652,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 40%[=======> ] 2.26G 39.0MB/s eta 77s " + "m-ctx-8k.pth 28%[====> ] 1.61G 55.0MB/s eta 70s " ] }, { @@ -1654,7 +1660,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 40%[=======> ] 2.29G 41.8MB/s eta 77s " + "-ctx-8k.pth 28%[====> ] 1.62G 60.7MB/s eta 70s " ] }, { @@ -1662,7 +1668,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 40%[=======> ] 2.31G 48.5MB/s eta 76s " + "ctx-8k.pth 28%[====> ] 1.63G 58.7MB/s eta 70s " ] }, { @@ -1670,7 +1676,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 40%[=======> ] 2.31G 44.5MB/s eta 76s " + "tx-8k.pth 29%[====> ] 1.65G 59.2MB/s eta 70s " ] }, { @@ -1678,7 +1684,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 40%[=======> ] 2.31G 43.3MB/s eta 76s " + "x-8k.pth 29%[====> ] 1.67G 58.5MB/s eta 69s " ] }, { @@ -1686,7 +1692,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 41%[=======> ] 2.32G 40.6MB/s eta 76s " + "-8k.pth 29%[====> ] 1.68G 56.9MB/s eta 69s " ] }, { @@ -1694,7 +1700,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 41%[=======> ] 2.34G 42.9MB/s eta 75s " + "8k.pth 30%[=====> ] 1.70G 59.8MB/s eta 69s " ] }, { @@ -1702,7 +1708,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 41%[=======> ] 2.35G 41.5MB/s eta 75s " + "k.pth 30%[=====> ] 1.71G 59.5MB/s eta 69s " ] }, { @@ -1710,7 +1716,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 41%[=======> ] 2.37G 43.3MB/s eta 75s " + ".pth 30%[=====> ] 1.73G 62.8MB/s eta 69s " ] }, { @@ -1718,7 +1724,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 42%[=======> ] 2.38G 44.3MB/s eta 75s " + "pth 30%[=====> ] 1.75G 64.8MB/s eta 67s " ] }, { @@ -1726,7 +1732,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 42%[=======> ] 2.39G 44.3MB/s eta 75s " + "th 31%[=====> ] 1.76G 62.1MB/s eta 67s " ] }, { @@ -1734,7 +1740,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 42%[=======> ] 2.40G 46.1MB/s eta 74s " + "h 31%[=====> ] 1.77G 62.7MB/s eta 67s " ] }, { @@ -1742,7 +1748,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 42%[=======> ] 2.41G 45.2MB/s eta 74s " + " 31%[=====> ] 1.79G 59.0MB/s eta 67s " ] }, { @@ -1750,7 +1756,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 43%[=======> ] 2.43G 46.5MB/s eta 74s " + " E 31%[=====> ] 1.79G 56.4MB/s eta 67s " ] }, { @@ -1758,7 +1764,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 43%[=======> ] 2.44G 49.4MB/s eta 74s " + " EW 31%[=====> ] 1.80G 59.3MB/s eta 67s " ] }, { @@ -1766,7 +1772,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 43%[=======> ] 2.45G 46.9MB/s eta 73s " + " EWR 32%[=====> ] 1.82G 59.8MB/s eta 67s " ] }, { @@ -1774,7 +1780,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 43%[=======> ] 2.46G 45.0MB/s eta 73s " + " EWR- 32%[=====> ] 1.83G 61.9MB/s eta 67s " ] }, { @@ -1782,7 +1788,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 43%[=======> ] 2.47G 43.5MB/s eta 73s " + " EWR-1 32%[=====> ] 1.85G 60.6MB/s eta 67s " ] }, { @@ -1790,7 +1796,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 44%[=======> ] 2.49G 43.9MB/s eta 72s " + " EWR-1B 33%[=====> ] 1.86G 60.1MB/s eta 66s " ] }, { @@ -1798,7 +1804,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 44%[=======> ] 2.50G 47.7MB/s eta 72s " + " EWR-1B5 33%[=====> ] 1.88G 61.6MB/s eta 66s " ] }, { @@ -1806,7 +1812,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 44%[=======> ] 2.51G 46.2MB/s eta 72s " + " EWR-1B5- 33%[=====> ] 1.88G 60.3MB/s eta 66s " ] }, { @@ -1814,7 +1820,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 44%[=======> ] 2.52G 46.1MB/s eta 72s " + " EWR-1B5-E 33%[=====> ] 1.90G 60.8MB/s eta 66s " ] }, { @@ -1822,7 +1828,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 44%[=======> ] 2.53G 45.3MB/s eta 71s " + " EWR-1B5-E0 33%[=====> ] 1.91G 59.2MB/s eta 66s " ] }, { @@ -1830,7 +1836,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 45%[========> ] 2.55G 45.5MB/s eta 71s " + " EWR-1B5-E0_ 34%[=====> ] 1.93G 59.0MB/s eta 64s " ] }, { @@ -1838,7 +1844,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 45%[========> ] 2.56G 46.1MB/s eta 71s " + " EWR-1B5-E0_1 34%[=====> ] 1.94G 61.9MB/s eta 64s " ] }, { @@ -1846,7 +1852,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 45%[========> ] 2.56G 44.2MB/s eta 71s " + " EWR-1B5-E0_1- 34%[=====> ] 1.97G 61.8MB/s eta 64s " ] }, { @@ -1854,7 +1860,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 45%[========> ] 2.58G 44.9MB/s eta 70s " + " EWR-1B5-E0_1-m 35%[======> ] 1.98G 59.1MB/s eta 64s " ] }, { @@ -1862,7 +1868,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 46%[========> ] 2.60G 47.1MB/s eta 70s " + " EWR-1B5-E0_1-me 35%[======> ] 2.00G 57.4MB/s eta 63s " ] }, { @@ -1870,7 +1876,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 46%[========> ] 2.61G 46.3MB/s eta 70s " + " EWR-1B5-E0_1-mem 35%[======> ] 2.01G 58.6MB/s eta 63s " ] }, { @@ -1878,7 +1884,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 46%[========> ] 2.62G 47.3MB/s eta 70s " + " EWR-1B5-E0_1-mem- 35%[======> ] 2.03G 60.6MB/s eta 63s " ] }, { @@ -1886,7 +1892,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 46%[========> ] 2.64G 48.2MB/s eta 70s " + " EWR-1B5-E0_1-mem-c 36%[======> ] 2.05G 62.3MB/s eta 63s " ] }, { @@ -1894,7 +1900,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 46%[========> ] 2.64G 46.1MB/s eta 68s " + "EWR-1B5-E0_1-mem-ct 36%[======> ] 2.06G 60.9MB/s eta 63s " ] }, { @@ -1902,7 +1908,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 46%[========> ] 2.65G 47.2MB/s eta 68s " + "WR-1B5-E0_1-mem-ctx 36%[======> ] 2.08G 63.2MB/s eta 61s " ] }, { @@ -1910,7 +1916,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 47%[========> ] 2.67G 46.0MB/s eta 68s " + "R-1B5-E0_1-mem-ctx- 36%[======> ] 2.09G 64.8MB/s eta 61s " ] }, { @@ -1918,7 +1924,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 47%[========> ] 2.68G 47.8MB/s eta 68s " + "-1B5-E0_1-mem-ctx-8 37%[======> ] 2.10G 63.8MB/s eta 61s " ] }, { @@ -1926,7 +1932,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 47%[========> ] 2.70G 50.3MB/s eta 67s " + "1B5-E0_1-mem-ctx-8k 37%[======> ] 2.12G 64.0MB/s eta 61s " ] }, { @@ -1934,7 +1940,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 48%[========> ] 2.71G 50.5MB/s eta 67s " + "B5-E0_1-mem-ctx-8k. 37%[======> ] 2.13G 64.6MB/s eta 60s " ] }, { @@ -1942,7 +1948,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 48%[========> ] 2.73G 50.5MB/s eta 67s " + "5-E0_1-mem-ctx-8k.p 38%[======> ] 2.15G 64.6MB/s eta 60s " ] }, { @@ -1950,7 +1956,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 48%[========> ] 2.74G 53.0MB/s eta 67s " + "-E0_1-mem-ctx-8k.pt 38%[======> ] 2.16G 63.1MB/s eta 60s " ] }, { @@ -1958,7 +1964,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 48%[========> ] 2.76G 50.7MB/s eta 65s " + "E0_1-mem-ctx-8k.pth 38%[======> ] 2.17G 63.0MB/s eta 60s " ] }, { @@ -1966,7 +1972,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 49%[========> ] 2.77G 49.9MB/s eta 65s " + "0_1-mem-ctx-8k.pth 38%[======> ] 2.17G 59.8MB/s eta 60s " ] }, { @@ -1974,7 +1980,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 49%[========> ] 2.77G 51.3MB/s eta 65s " + "_1-mem-ctx-8k.pth 38%[======> ] 2.19G 58.1MB/s eta 60s " ] }, { @@ -1982,7 +1988,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 49%[========> ] 2.78G 51.3MB/s eta 65s " + "1-mem-ctx-8k.pth 39%[======> ] 2.21G 56.9MB/s eta 60s " ] }, { @@ -1990,7 +1996,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 49%[========> ] 2.79G 48.2MB/s eta 65s " + "-mem-ctx-8k.pth 39%[======> ] 2.22G 59.8MB/s eta 60s " ] }, { @@ -1998,7 +2004,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 49%[========> ] 2.80G 48.2MB/s eta 64s " + "mem-ctx-8k.pth 39%[======> ] 2.24G 62.8MB/s eta 60s " ] }, { @@ -2006,7 +2012,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 49%[========> ] 2.82G 48.0MB/s eta 64s " + "em-ctx-8k.pth 39%[======> ] 2.25G 60.7MB/s eta 60s " ] }, { @@ -2014,7 +2020,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 50%[=========> ] 2.83G 48.5MB/s eta 64s " + "m-ctx-8k.pth 40%[=======> ] 2.26G 63.2MB/s eta 58s " ] }, { @@ -2022,7 +2028,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 50%[=========> ] 2.85G 48.2MB/s eta 64s " + "-ctx-8k.pth 40%[=======> ] 2.28G 63.0MB/s eta 58s " ] }, { @@ -2030,7 +2036,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 50%[=========> ] 2.86G 48.4MB/s eta 63s " + "ctx-8k.pth 40%[=======> ] 2.31G 64.9MB/s eta 58s " ] }, { @@ -2038,7 +2044,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 50%[=========> ] 2.86G 44.2MB/s eta 63s " + "tx-8k.pth 41%[=======> ] 2.32G 63.9MB/s eta 58s " ] }, { @@ -2046,7 +2052,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 50%[=========> ] 2.87G 44.1MB/s eta 63s " + "x-8k.pth 41%[=======> ] 2.33G 63.3MB/s eta 58s " ] }, { @@ -2054,7 +2060,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 50%[=========> ] 2.88G 43.8MB/s eta 63s " + "-8k.pth 41%[=======> ] 2.34G 62.2MB/s eta 57s " ] }, { @@ -2062,7 +2068,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 51%[=========> ] 2.89G 42.9MB/s eta 63s " + "8k.pth 41%[=======> ] 2.35G 60.1MB/s eta 57s " ] }, { @@ -2070,7 +2076,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 51%[=========> ] 2.90G 44.6MB/s eta 62s " + "k.pth 42%[=======> ] 2.37G 64.0MB/s eta 57s " ] }, { @@ -2078,7 +2084,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 51%[=========> ] 2.91G 40.1MB/s eta 62s " + ".pth 42%[=======> ] 2.38G 63.1MB/s eta 57s " ] }, { @@ -2086,7 +2092,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 51%[=========> ] 2.92G 43.4MB/s eta 62s " + "pth 42%[=======> ] 2.40G 63.1MB/s eta 56s " ] }, { @@ -2094,7 +2100,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 52%[=========> ] 2.93G 44.2MB/s eta 62s " + "th 42%[=======> ] 2.41G 62.3MB/s eta 56s " ] }, { @@ -2102,7 +2108,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 52%[=========> ] 2.94G 45.0MB/s eta 61s " + "h 42%[=======> ] 2.41G 61.0MB/s eta 56s " ] }, { @@ -2110,7 +2116,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 52%[=========> ] 2.95G 39.8MB/s eta 61s " + " 42%[=======> ] 2.42G 61.6MB/s eta 56s " ] }, { @@ -2118,7 +2124,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 52%[=========> ] 2.96G 37.8MB/s eta 61s " + " E 43%[=======> ] 2.43G 58.4MB/s eta 56s " ] }, { @@ -2126,7 +2132,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 52%[=========> ] 2.96G 38.6MB/s eta 61s " + " EW 43%[=======> ] 2.44G 57.0MB/s eta 55s " ] }, { @@ -2134,7 +2140,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 52%[=========> ] 2.98G 37.8MB/s eta 61s " + " EWR 43%[=======> ] 2.46G 55.1MB/s eta 55s " ] }, { @@ -2142,7 +2148,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 52%[=========> ] 2.98G 37.4MB/s eta 61s " + " EWR- 43%[=======> ] 2.47G 54.6MB/s eta 55s " ] }, { @@ -2150,7 +2156,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 53%[=========> ] 3.00G 35.8MB/s eta 61s " + " EWR-1 44%[=======> ] 2.49G 55.4MB/s eta 55s " ] }, { @@ -2158,7 +2164,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 53%[=========> ] 3.00G 34.2MB/s eta 61s " + " EWR-1B 44%[=======> ] 2.51G 54.5MB/s eta 54s " ] }, { @@ -2166,7 +2172,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 53%[=========> ] 3.01G 37.1MB/s eta 61s " + " EWR-1B5 44%[=======> ] 2.52G 52.9MB/s eta 54s " ] }, { @@ -2174,7 +2180,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 53%[=========> ] 3.02G 38.2MB/s eta 60s " + " EWR-1B5- 44%[=======> ] 2.53G 52.0MB/s eta 54s " ] }, { @@ -2182,7 +2188,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 53%[=========> ] 3.03G 39.9MB/s eta 60s " + " EWR-1B5-E 45%[========> ] 2.55G 54.1MB/s eta 54s " ] }, { @@ -2190,7 +2196,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 53%[=========> ] 3.04G 37.5MB/s eta 60s " + " EWR-1B5-E0 45%[========> ] 2.56G 54.3MB/s eta 53s " ] }, { @@ -2198,7 +2204,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 54%[=========> ] 3.05G 40.4MB/s eta 60s " + " EWR-1B5-E0_ 45%[========> ] 2.58G 54.2MB/s eta 53s " ] }, { @@ -2206,7 +2212,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 54%[=========> ] 3.06G 40.4MB/s eta 60s " + " EWR-1B5-E0_1 45%[========> ] 2.59G 53.5MB/s eta 53s " ] }, { @@ -2214,7 +2220,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 54%[=========> ] 3.07G 41.2MB/s eta 59s " + " EWR-1B5-E0_1- 46%[========> ] 2.61G 55.1MB/s eta 53s " ] }, { @@ -2222,7 +2228,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 54%[=========> ] 3.08G 39.5MB/s eta 59s " + " EWR-1B5-E0_1-m 46%[========> ] 2.62G 54.6MB/s eta 52s " ] }, { @@ -2230,7 +2236,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 54%[=========> ] 3.10G 41.3MB/s eta 59s " + " EWR-1B5-E0_1-me 46%[========> ] 2.64G 57.2MB/s eta 52s " ] }, { @@ -2238,7 +2244,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 55%[==========> ] 3.11G 41.4MB/s eta 59s " + " EWR-1B5-E0_1-mem 46%[========> ] 2.65G 56.7MB/s eta 52s " ] }, { @@ -2246,7 +2252,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 55%[==========> ] 3.13G 41.8MB/s eta 57s " + " EWR-1B5-E0_1-mem- 47%[========> ] 2.67G 56.7MB/s eta 52s " ] }, { @@ -2254,7 +2260,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 55%[==========> ] 3.14G 44.4MB/s eta 57s " + " EWR-1B5-E0_1-mem-c 47%[========> ] 2.67G 54.0MB/s eta 52s " ] }, { @@ -2262,7 +2268,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 55%[==========> ] 3.16G 46.2MB/s eta 57s " + "EWR-1B5-E0_1-mem-ct 47%[========> ] 2.68G 54.5MB/s eta 52s " ] }, { @@ -2270,7 +2276,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 56%[==========> ] 3.17G 47.9MB/s eta 57s " + "WR-1B5-E0_1-mem-ctx 47%[========> ] 2.70G 55.3MB/s eta 52s " ] }, { @@ -2278,7 +2284,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 56%[==========> ] 3.19G 48.7MB/s eta 57s " + "R-1B5-E0_1-mem-ctx- 48%[========> ] 2.71G 54.9MB/s eta 52s " ] }, { @@ -2286,7 +2292,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 56%[==========> ] 3.20G 50.1MB/s eta 55s " + "-1B5-E0_1-mem-ctx-8 48%[========> ] 2.73G 55.6MB/s eta 52s " ] }, { @@ -2294,7 +2300,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 56%[==========> ] 3.21G 52.3MB/s eta 55s " + "1B5-E0_1-mem-ctx-8k 48%[========> ] 2.75G 57.7MB/s eta 50s " ] }, { @@ -2302,7 +2308,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 57%[==========> ] 3.23G 54.4MB/s eta 55s " + "B5-E0_1-mem-ctx-8k. 49%[========> ] 2.77G 60.1MB/s eta 50s " ] }, { @@ -2310,7 +2316,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 57%[==========> ] 3.23G 52.9MB/s eta 55s " + "5-E0_1-mem-ctx-8k.p 49%[========> ] 2.79G 62.6MB/s eta 50s " ] }, { @@ -2318,7 +2324,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 57%[==========> ] 3.25G 52.5MB/s eta 55s " + "-E0_1-mem-ctx-8k.pt 49%[========> ] 2.80G 62.1MB/s eta 50s " ] }, { @@ -2326,7 +2332,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 57%[==========> ] 3.26G 53.8MB/s eta 54s " + "E0_1-mem-ctx-8k.pth 49%[========> ] 2.81G 60.5MB/s eta 50s " ] }, { @@ -2334,7 +2340,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 58%[==========> ] 3.28G 54.6MB/s eta 54s " + "0_1-mem-ctx-8k.pth 50%[=========> ] 2.83G 59.2MB/s eta 49s " ] }, { @@ -2342,7 +2348,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 58%[==========> ] 3.29G 56.2MB/s eta 54s " + "_1-mem-ctx-8k.pth 50%[=========> ] 2.85G 58.6MB/s eta 49s " ] }, { @@ -2350,7 +2356,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 58%[==========> ] 3.30G 56.0MB/s eta 54s " + "1-mem-ctx-8k.pth 50%[=========> ] 2.86G 59.7MB/s eta 49s " ] }, { @@ -2358,7 +2364,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 58%[==========> ] 3.31G 55.1MB/s eta 54s " + "-mem-ctx-8k.pth 50%[=========> ] 2.88G 60.7MB/s eta 49s " ] }, { @@ -2366,7 +2372,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 58%[==========> ] 3.32G 54.4MB/s eta 52s " + "mem-ctx-8k.pth 51%[=========> ] 2.89G 62.7MB/s eta 49s " ] }, { @@ -2374,7 +2380,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 59%[==========> ] 3.34G 53.6MB/s eta 52s " + "em-ctx-8k.pth 51%[=========> ] 2.90G 62.6MB/s eta 47s " ] }, { @@ -2382,7 +2388,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 59%[==========> ] 3.35G 56.0MB/s eta 52s " + "m-ctx-8k.pth 51%[=========> ] 2.92G 63.8MB/s eta 47s " ] }, { @@ -2390,7 +2396,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 59%[==========> ] 3.37G 56.2MB/s eta 52s " + "-ctx-8k.pth 52%[=========> ] 2.94G 69.4MB/s eta 47s " ] }, { @@ -2398,7 +2404,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 59%[==========> ] 3.37G 52.1MB/s eta 51s " + "ctx-8k.pth 52%[=========> ] 2.95G 67.2MB/s eta 47s " ] }, { @@ -2406,7 +2412,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 59%[==========> ] 3.38G 54.2MB/s eta 51s " + "tx-8k.pth 52%[=========> ] 2.96G 66.9MB/s eta 47s " ] }, { @@ -2414,7 +2420,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 59%[==========> ] 3.38G 50.2MB/s eta 51s " + "x-8k.pth 52%[=========> ] 2.98G 67.4MB/s eta 46s " ] }, { @@ -2422,7 +2428,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 60%[===========> ] 3.40G 48.0MB/s eta 51s " + "-8k.pth 53%[=========> ] 3.00G 66.6MB/s eta 46s " ] }, { @@ -2430,7 +2436,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 60%[===========> ] 3.41G 47.9MB/s eta 50s " + "8k.pth 53%[=========> ] 3.01G 64.8MB/s eta 46s " ] }, { @@ -2438,7 +2444,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 60%[===========> ] 3.43G 47.6MB/s eta 50s " + "k.pth 53%[=========> ] 3.02G 61.8MB/s eta 46s " ] }, { @@ -2446,7 +2452,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 60%[===========> ] 3.43G 44.6MB/s eta 50s " + ".pth 53%[=========> ] 3.02G 58.7MB/s eta 45s " ] }, { @@ -2454,7 +2460,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 60%[===========> ] 3.44G 43.0MB/s eta 50s " + "pth 53%[=========> ] 3.04G 59.3MB/s eta 45s " ] }, { @@ -2462,7 +2468,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 61%[===========> ] 3.46G 43.8MB/s eta 49s " + "th 54%[=========> ] 3.05G 58.1MB/s eta 45s " ] }, { @@ -2470,7 +2476,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 61%[===========> ] 3.47G 45.6MB/s eta 49s " + "h 54%[=========> ] 3.07G 57.3MB/s eta 45s " ] }, { @@ -2478,7 +2484,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 61%[===========> ] 3.47G 43.9MB/s eta 49s " + " 54%[=========> ] 3.08G 57.6MB/s eta 44s " ] }, { @@ -2486,7 +2492,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 61%[===========> ] 3.49G 43.4MB/s eta 49s " + " E 55%[==========> ] 3.11G 59.3MB/s eta 44s " ] }, { @@ -2494,7 +2500,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 61%[===========> ] 3.49G 39.3MB/s eta 49s " + " EW 55%[==========> ] 3.11G 59.0MB/s eta 44s " ] }, { @@ -2502,7 +2508,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 62%[===========> ] 3.50G 42.4MB/s eta 48s " + " EWR 55%[==========> ] 3.14G 61.7MB/s eta 44s " ] }, { @@ -2510,7 +2516,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 62%[===========> ] 3.52G 39.4MB/s eta 48s " + " EWR- 55%[==========> ] 3.14G 61.5MB/s eta 44s " ] }, { @@ -2518,7 +2524,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 62%[===========> ] 3.53G 41.6MB/s eta 48s " + " EWR-1 55%[==========> ] 3.15G 58.4MB/s eta 43s " ] }, { @@ -2526,7 +2532,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 62%[===========> ] 3.55G 42.1MB/s eta 48s " + " EWR-1B 56%[==========> ] 3.17G 59.0MB/s eta 43s " ] }, { @@ -2534,7 +2540,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 63%[===========> ] 3.56G 45.4MB/s eta 47s " + " EWR-1B5 56%[==========> ] 3.19G 58.9MB/s eta 43s " ] }, { @@ -2542,7 +2548,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 63%[===========> ] 3.58G 47.9MB/s eta 47s " + " EWR-1B5- 56%[==========> ] 3.20G 59.0MB/s eta 43s " ] }, { @@ -2550,7 +2556,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 63%[===========> ] 3.58G 43.9MB/s eta 47s " + " EWR-1B5-E 56%[==========> ] 3.21G 57.7MB/s eta 43s " ] }, { @@ -2558,7 +2564,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 63%[===========> ] 3.59G 47.3MB/s eta 47s " + " EWR-1B5-E0 57%[==========> ] 3.22G 57.2MB/s eta 42s " ] }, { @@ -2566,7 +2572,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 63%[===========> ] 3.60G 45.5MB/s eta 46s " + " EWR-1B5-E0_ 57%[==========> ] 3.23G 56.4MB/s eta 42s " ] }, { @@ -2574,7 +2580,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 63%[===========> ] 3.61G 43.0MB/s eta 46s " + " EWR-1B5-E0_1 57%[==========> ] 3.25G 59.6MB/s eta 42s " ] }, { @@ -2582,7 +2588,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 64%[===========> ] 3.62G 44.2MB/s eta 46s " + " EWR-1B5-E0_1- 57%[==========> ] 3.26G 59.3MB/s eta 42s " ] }, { @@ -2590,7 +2596,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 64%[===========> ] 3.64G 43.5MB/s eta 46s " + " EWR-1B5-E0_1-m 58%[==========> ] 3.28G 58.9MB/s eta 41s " ] }, { @@ -2598,7 +2604,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 64%[===========> ] 3.65G 45.0MB/s eta 45s " + " EWR-1B5-E0_1-me 58%[==========> ] 3.29G 60.7MB/s eta 41s " ] }, { @@ -2606,7 +2612,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 64%[===========> ] 3.67G 44.2MB/s eta 45s " + " EWR-1B5-E0_1-mem 58%[==========> ] 3.31G 59.8MB/s eta 41s " ] }, { @@ -2614,7 +2620,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 65%[============> ] 3.68G 48.1MB/s eta 45s " + " EWR-1B5-E0_1-mem- 58%[==========> ] 3.32G 57.6MB/s eta 41s " ] }, { @@ -2622,7 +2628,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 65%[============> ] 3.69G 47.1MB/s eta 45s " + " EWR-1B5-E0_1-mem-c 59%[==========> ] 3.34G 54.6MB/s eta 40s " ] }, { @@ -2630,7 +2636,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 65%[============> ] 3.71G 46.2MB/s eta 44s " + "EWR-1B5-E0_1-mem-ct 59%[==========> ] 3.35G 56.0MB/s eta 40s " ] }, { @@ -2638,7 +2644,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 65%[============> ] 3.72G 49.3MB/s eta 44s " + "WR-1B5-E0_1-mem-ctx 59%[==========> ] 3.37G 56.1MB/s eta 40s " ] }, { @@ -2646,7 +2652,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 66%[============> ] 3.72G 43.7MB/s eta 44s " + "R-1B5-E0_1-mem-ctx- 59%[==========> ] 3.38G 56.4MB/s eta 40s " ] }, { @@ -2654,7 +2660,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 66%[============> ] 3.74G 42.6MB/s eta 44s " + "-1B5-E0_1-mem-ctx-8 60%[===========> ] 3.40G 55.8MB/s eta 39s " ] }, { @@ -2662,7 +2668,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 66%[============> ] 3.75G 43.8MB/s eta 43s " + "1B5-E0_1-mem-ctx-8k 60%[===========> ] 3.41G 57.9MB/s eta 39s " ] }, { @@ -2670,7 +2676,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 66%[============> ] 3.76G 46.0MB/s eta 43s " + "B5-E0_1-mem-ctx-8k. 60%[===========> ] 3.42G 58.1MB/s eta 39s " ] }, { @@ -2678,7 +2684,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 66%[============> ] 3.77G 45.6MB/s eta 43s " + "5-E0_1-mem-ctx-8k.p 60%[===========> ] 3.43G 57.3MB/s eta 39s " ] }, { @@ -2686,7 +2692,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 67%[============> ] 3.79G 48.9MB/s eta 43s " + "-E0_1-mem-ctx-8k.pt 61%[===========> ] 3.45G 60.7MB/s eta 39s " ] }, { @@ -2694,7 +2700,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 67%[============> ] 3.80G 49.8MB/s eta 43s " + "E0_1-mem-ctx-8k.pth 61%[===========> ] 3.46G 61.2MB/s eta 38s " ] }, { @@ -2702,7 +2708,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 67%[============> ] 3.81G 50.5MB/s eta 41s " + "0_1-mem-ctx-8k.pth 61%[===========> ] 3.47G 58.5MB/s eta 38s " ] }, { @@ -2710,7 +2716,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 67%[============> ] 3.81G 48.8MB/s eta 41s " + "_1-mem-ctx-8k.pth 61%[===========> ] 3.49G 61.9MB/s eta 38s " ] }, { @@ -2718,7 +2724,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 67%[============> ] 3.83G 47.3MB/s eta 41s " + "1-mem-ctx-8k.pth 62%[===========> ] 3.50G 59.6MB/s eta 38s " ] }, { @@ -2726,7 +2732,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 68%[============> ] 3.85G 49.0MB/s eta 41s " + "-mem-ctx-8k.pth 62%[===========> ] 3.51G 59.7MB/s eta 38s " ] }, { @@ -2734,7 +2740,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 68%[============> ] 3.86G 48.2MB/s eta 40s " + "mem-ctx-8k.pth 62%[===========> ] 3.52G 58.4MB/s eta 37s " ] }, { @@ -2742,7 +2748,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 68%[============> ] 3.87G 46.7MB/s eta 40s " + "em-ctx-8k.pth 62%[===========> ] 3.55G 58.3MB/s eta 37s " ] }, { @@ -2750,7 +2756,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 68%[============> ] 3.89G 47.1MB/s eta 40s " + "m-ctx-8k.pth 63%[===========> ] 3.56G 58.9MB/s eta 37s " ] }, { @@ -2758,7 +2764,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 69%[============> ] 3.90G 46.8MB/s eta 40s " + "-ctx-8k.pth 63%[===========> ] 3.58G 61.0MB/s eta 37s " ] }, { @@ -2766,7 +2772,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 69%[============> ] 3.91G 44.9MB/s eta 39s " + "ctx-8k.pth 63%[===========> ] 3.59G 59.7MB/s eta 35s " ] }, { @@ -2774,7 +2780,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 69%[============> ] 3.93G 49.0MB/s eta 39s " + "tx-8k.pth 63%[===========> ] 3.61G 62.3MB/s eta 35s " ] }, { @@ -2782,7 +2788,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 69%[============> ] 3.93G 46.4MB/s eta 39s " + "x-8k.pth 64%[===========> ] 3.62G 61.7MB/s eta 35s " ] }, { @@ -2790,7 +2796,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 69%[============> ] 3.94G 43.3MB/s eta 39s " + "-8k.pth 64%[===========> ] 3.65G 64.8MB/s eta 35s " ] }, { @@ -2798,7 +2804,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 69%[============> ] 3.95G 43.9MB/s eta 38s " + "8k.pth 64%[===========> ] 3.65G 64.6MB/s eta 35s " ] }, { @@ -2806,7 +2812,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 70%[=============> ] 3.96G 43.9MB/s eta 38s " + "k.pth 64%[===========> ] 3.66G 60.3MB/s eta 34s " ] }, { @@ -2814,7 +2820,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 70%[=============> ] 3.98G 44.2MB/s eta 38s " + ".pth 65%[============> ] 3.67G 61.6MB/s eta 34s " ] }, { @@ -2822,7 +2828,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 70%[=============> ] 3.99G 43.2MB/s eta 38s " + "pth 65%[============> ] 3.68G 60.6MB/s eta 34s " ] }, { @@ -2830,7 +2836,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 71%[=============> ] 4.01G 45.9MB/s eta 37s " + "th 65%[============> ] 3.70G 61.4MB/s eta 34s " ] }, { @@ -2838,7 +2844,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 71%[=============> ] 4.02G 46.5MB/s eta 37s " + "h 65%[============> ] 3.71G 60.5MB/s eta 34s " ] }, { @@ -2846,7 +2852,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 71%[=============> ] 4.02G 46.1MB/s eta 37s " + " 66%[============> ] 3.72G 60.7MB/s eta 33s " ] }, { @@ -2854,7 +2860,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 71%[=============> ] 4.04G 47.3MB/s eta 37s " + " E 66%[============> ] 3.74G 60.1MB/s eta 33s " ] }, { @@ -2862,7 +2868,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 71%[=============> ] 4.05G 45.5MB/s eta 36s " + " EW 66%[============> ] 3.75G 60.4MB/s eta 33s " ] }, { @@ -2870,7 +2876,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 72%[=============> ] 4.08G 47.3MB/s eta 36s " + " EWR 66%[============> ] 3.76G 60.2MB/s eta 33s " ] }, { @@ -2878,7 +2884,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 72%[=============> ] 4.08G 48.5MB/s eta 36s " + " EWR- 66%[============> ] 3.77G 57.2MB/s eta 33s " ] }, { @@ -2886,7 +2892,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 72%[=============> ] 4.10G 49.9MB/s eta 36s " + " EWR-1 67%[============> ] 3.79G 60.2MB/s eta 32s " ] }, { @@ -2894,7 +2900,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 72%[=============> ] 4.11G 49.3MB/s eta 36s " + " EWR-1B 67%[============> ] 3.80G 57.8MB/s eta 32s " ] }, { @@ -2902,7 +2908,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 72%[=============> ] 4.12G 47.1MB/s eta 34s " + " EWR-1B5 67%[============> ] 3.83G 60.2MB/s eta 32s " ] }, { @@ -2910,7 +2916,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 73%[=============> ] 4.13G 49.1MB/s eta 34s " + " EWR-1B5- 68%[============> ] 3.84G 60.5MB/s eta 32s " ] }, { @@ -2918,7 +2924,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 73%[=============> ] 4.13G 48.9MB/s eta 34s " + " EWR-1B5-E 68%[============> ] 3.85G 58.6MB/s eta 31s " ] }, { @@ -2926,7 +2932,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 73%[=============> ] 4.13G 46.9MB/s eta 34s " + " EWR-1B5-E0 68%[============> ] 3.87G 58.6MB/s eta 31s " ] }, { @@ -2934,7 +2940,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 73%[=============> ] 4.14G 45.6MB/s eta 34s " + " EWR-1B5-E0_ 68%[============> ] 3.88G 59.9MB/s eta 31s " ] }, { @@ -2942,7 +2948,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 73%[=============> ] 4.16G 48.3MB/s eta 34s " + " EWR-1B5-E0_1 69%[============> ] 3.90G 60.3MB/s eta 31s " ] }, { @@ -2950,7 +2956,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 73%[=============> ] 4.16G 47.3MB/s eta 34s " + " EWR-1B5-E0_1- 69%[============> ] 3.90G 57.2MB/s eta 31s " ] }, { @@ -2958,7 +2964,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 73%[=============> ] 4.17G 46.6MB/s eta 34s " + " EWR-1B5-E0_1-m 69%[============> ] 3.92G 59.1MB/s eta 30s " ] }, { @@ -2966,7 +2972,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 74%[=============> ] 4.19G 47.4MB/s eta 34s " + " EWR-1B5-E0_1-me 69%[============> ] 3.95G 61.3MB/s eta 30s " ] }, { @@ -2974,7 +2980,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 74%[=============> ] 4.20G 47.7MB/s eta 32s " + " EWR-1B5-E0_1-mem 70%[=============> ] 3.96G 61.8MB/s eta 30s " ] }, { @@ -2982,7 +2988,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 74%[=============> ] 4.21G 45.7MB/s eta 32s " + " EWR-1B5-E0_1-mem- 70%[=============> ] 3.98G 61.4MB/s eta 30s " ] }, { @@ -2990,7 +2996,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 74%[=============> ] 4.22G 46.3MB/s eta 32s " + " EWR-1B5-E0_1-mem-c 70%[=============> ] 3.99G 63.5MB/s eta 28s " ] }, { @@ -2998,7 +3004,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 75%[==============> ] 4.24G 51.0MB/s eta 32s " + "EWR-1B5-E0_1-mem-ct 71%[=============> ] 4.01G 64.4MB/s eta 28s " ] }, { @@ -3006,7 +3012,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 75%[==============> ] 4.26G 49.9MB/s eta 32s " + "WR-1B5-E0_1-mem-ctx 71%[=============> ] 4.03G 65.3MB/s eta 28s " ] }, { @@ -3014,7 +3020,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 75%[==============> ] 4.27G 48.2MB/s eta 31s " + "R-1B5-E0_1-mem-ctx- 71%[=============> ] 4.04G 60.4MB/s eta 28s " ] }, { @@ -3022,7 +3028,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 75%[==============> ] 4.27G 45.4MB/s eta 31s " + "-1B5-E0_1-mem-ctx-8 71%[=============> ] 4.05G 58.8MB/s eta 27s " ] }, { @@ -3030,7 +3036,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 75%[==============> ] 4.28G 44.7MB/s eta 31s " + "1B5-E0_1-mem-ctx-8k 71%[=============> ] 4.05G 57.0MB/s eta 27s " ] }, { @@ -3038,7 +3044,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 76%[==============> ] 4.29G 45.8MB/s eta 31s " + "B5-E0_1-mem-ctx-8k. 72%[=============> ] 4.07G 57.3MB/s eta 27s " ] }, { @@ -3046,7 +3052,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 76%[==============> ] 4.31G 47.6MB/s eta 31s " + "5-E0_1-mem-ctx-8k.p 72%[=============> ] 4.08G 56.8MB/s eta 27s " ] }, { @@ -3054,7 +3060,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 76%[==============> ] 4.32G 49.4MB/s eta 30s " + "-E0_1-mem-ctx-8k.pt 72%[=============> ] 4.09G 56.5MB/s eta 27s " ] }, { @@ -3062,7 +3068,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 76%[==============> ] 4.34G 53.6MB/s eta 30s " + "E0_1-mem-ctx-8k.pth 72%[=============> ] 4.10G 55.3MB/s eta 27s " ] }, { @@ -3070,7 +3076,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 77%[==============> ] 4.35G 52.4MB/s eta 30s " + "0_1-mem-ctx-8k.pth 72%[=============> ] 4.11G 54.9MB/s eta 27s " ] }, { @@ -3078,7 +3084,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 77%[==============> ] 4.35G 52.2MB/s eta 30s " + "_1-mem-ctx-8k.pth 73%[=============> ] 4.13G 58.7MB/s eta 27s " ] }, { @@ -3086,7 +3092,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 77%[==============> ] 4.37G 51.0MB/s eta 29s " + "1-mem-ctx-8k.pth 73%[=============> ] 4.14G 58.0MB/s eta 27s " ] }, { @@ -3094,7 +3100,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 77%[==============> ] 4.37G 50.1MB/s eta 29s " + "-mem-ctx-8k.pth 73%[=============> ] 4.16G 56.7MB/s eta 27s " ] }, { @@ -3102,7 +3108,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 77%[==============> ] 4.38G 50.4MB/s eta 29s " + "mem-ctx-8k.pth 73%[=============> ] 4.17G 56.0MB/s eta 25s " ] }, { @@ -3110,7 +3116,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 77%[==============> ] 4.39G 49.4MB/s eta 29s " + "em-ctx-8k.pth 74%[=============> ] 4.18G 52.3MB/s eta 25s " ] }, { @@ -3118,7 +3124,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 78%[==============> ] 4.41G 51.4MB/s eta 29s " + "m-ctx-8k.pth 74%[=============> ] 4.19G 53.2MB/s eta 25s " ] }, { @@ -3126,7 +3132,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 78%[==============> ] 4.41G 47.5MB/s eta 28s " + "-ctx-8k.pth 74%[=============> ] 4.21G 52.5MB/s eta 25s " ] }, { @@ -3134,7 +3140,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 78%[==============> ] 4.43G 48.8MB/s eta 28s " + "ctx-8k.pth 74%[=============> ] 4.22G 51.5MB/s eta 25s " ] }, { @@ -3142,7 +3148,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 78%[==============> ] 4.44G 46.8MB/s eta 28s " + "tx-8k.pth 74%[=============> ] 4.23G 52.1MB/s eta 24s " ] }, { @@ -3150,7 +3156,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 78%[==============> ] 4.46G 46.6MB/s eta 28s " + "x-8k.pth 75%[==============> ] 4.25G 53.7MB/s eta 24s " ] }, { @@ -3158,7 +3164,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 79%[==============> ] 4.47G 46.6MB/s eta 26s " + "-8k.pth 75%[==============> ] 4.26G 53.8MB/s eta 24s " ] }, { @@ -3166,7 +3172,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 79%[==============> ] 4.48G 47.1MB/s eta 26s " + "8k.pth 75%[==============> ] 4.28G 56.1MB/s eta 24s " ] }, { @@ -3174,7 +3180,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 79%[==============> ] 4.50G 48.6MB/s eta 26s " + "k.pth 76%[==============> ] 4.30G 59.0MB/s eta 23s " ] }, { @@ -3182,7 +3188,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 79%[==============> ] 4.51G 51.0MB/s eta 26s " + ".pth 76%[==============> ] 4.32G 61.1MB/s eta 23s " ] }, { @@ -3190,7 +3196,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 80%[===============> ] 4.53G 48.6MB/s eta 25s " + "pth 76%[==============> ] 4.33G 61.3MB/s eta 23s " ] }, { @@ -3198,7 +3204,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 80%[===============> ] 4.54G 47.3MB/s eta 25s " + "th 77%[==============> ] 4.35G 60.6MB/s eta 23s " ] }, { @@ -3206,7 +3212,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 80%[===============> ] 4.55G 46.7MB/s eta 25s " + "h 77%[==============> ] 4.37G 58.6MB/s eta 22s " ] }, { @@ -3214,7 +3220,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 80%[===============> ] 4.56G 48.6MB/s eta 25s " + " 77%[==============> ] 4.38G 59.4MB/s eta 22s " ] }, { @@ -3222,7 +3228,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 81%[===============> ] 4.57G 50.5MB/s eta 25s " + " E 77%[==============> ] 4.40G 59.9MB/s eta 22s " ] }, { @@ -3230,7 +3236,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 81%[===============> ] 4.59G 51.3MB/s eta 23s " + " EW 78%[==============> ] 4.41G 61.4MB/s eta 22s " ] }, { @@ -3238,7 +3244,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 81%[===============> ] 4.60G 52.3MB/s eta 23s " + " EWR 78%[==============> ] 4.42G 63.3MB/s eta 21s " ] }, { @@ -3246,7 +3252,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 81%[===============> ] 4.61G 52.6MB/s eta 23s " + " EWR- 78%[==============> ] 4.44G 62.6MB/s eta 21s " ] }, { @@ -3254,7 +3260,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 81%[===============> ] 4.62G 51.2MB/s eta 23s " + " EWR-1 78%[==============> ] 4.46G 62.5MB/s eta 21s " ] }, { @@ -3262,7 +3268,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 82%[===============> ] 4.63G 53.8MB/s eta 23s " + " EWR-1B 79%[==============> ] 4.47G 62.5MB/s eta 21s " ] }, { @@ -3270,7 +3276,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 82%[===============> ] 4.65G 53.4MB/s eta 22s " + " EWR-1B5 79%[==============> ] 4.48G 64.9MB/s eta 21s " ] }, { @@ -3278,7 +3284,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 82%[===============> ] 4.65G 50.5MB/s eta 22s " + " EWR-1B5- 79%[==============> ] 4.50G 65.2MB/s eta 20s " ] }, { @@ -3286,7 +3292,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 82%[===============> ] 4.66G 51.3MB/s eta 22s " + " EWR-1B5-E 79%[==============> ] 4.51G 62.3MB/s eta 20s " ] }, { @@ -3294,7 +3300,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 82%[===============> ] 4.68G 50.3MB/s eta 22s " + " EWR-1B5-E0 80%[===============> ] 4.52G 62.7MB/s eta 20s " ] }, { @@ -3302,7 +3308,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 83%[===============> ] 4.69G 50.6MB/s eta 21s " + " EWR-1B5-E0_ 80%[===============> ] 4.55G 64.9MB/s eta 20s " ] }, { @@ -3310,7 +3316,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 83%[===============> ] 4.69G 48.4MB/s eta 21s " + " EWR-1B5-E0_1 80%[===============> ] 4.56G 65.7MB/s eta 20s " ] }, { @@ -3318,7 +3324,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 83%[===============> ] 4.71G 49.1MB/s eta 21s " + " EWR-1B5-E0_1- 81%[===============> ] 4.57G 62.9MB/s eta 18s " ] }, { @@ -3326,7 +3332,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 83%[===============> ] 4.72G 48.8MB/s eta 21s " + " EWR-1B5-E0_1-m 81%[===============> ] 4.59G 60.8MB/s eta 18s " ] }, { @@ -3334,7 +3340,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 83%[===============> ] 4.74G 48.9MB/s eta 20s " + " EWR-1B5-E0_1-me 81%[===============> ] 4.60G 62.4MB/s eta 18s " ] }, { @@ -3342,7 +3348,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 84%[===============> ] 4.75G 47.1MB/s eta 20s " + " EWR-1B5-E0_1-mem 81%[===============> ] 4.62G 63.8MB/s eta 18s " ] }, { @@ -3350,7 +3356,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 84%[===============> ] 4.77G 49.3MB/s eta 20s " + " EWR-1B5-E0_1-mem- 82%[===============> ] 4.63G 65.1MB/s eta 17s " ] }, { @@ -3358,7 +3364,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 84%[===============> ] 4.78G 51.0MB/s eta 20s " + " EWR-1B5-E0_1-mem-c 82%[===============> ] 4.65G 63.3MB/s eta 17s " ] }, { @@ -3366,7 +3372,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 85%[================> ] 4.80G 50.7MB/s eta 20s " + "EWR-1B5-E0_1-mem-ct 82%[===============> ] 4.68G 65.4MB/s eta 17s " ] }, { @@ -3374,7 +3380,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 85%[================> ] 4.81G 51.0MB/s eta 18s " + "WR-1B5-E0_1-mem-ctx 83%[===============> ] 4.69G 66.3MB/s eta 17s " ] }, { @@ -3382,7 +3388,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 85%[================> ] 4.82G 49.5MB/s eta 18s " + "R-1B5-E0_1-mem-ctx- 83%[===============> ] 4.70G 65.5MB/s eta 17s " ] }, { @@ -3390,7 +3396,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 85%[================> ] 4.83G 45.3MB/s eta 18s " + "-1B5-E0_1-mem-ctx-8 83%[===============> ] 4.71G 63.6MB/s eta 16s " ] }, { @@ -3398,7 +3404,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 85%[================> ] 4.84G 46.8MB/s eta 18s " + "1B5-E0_1-mem-ctx-8k 83%[===============> ] 4.72G 63.2MB/s eta 16s " ] }, { @@ -3406,7 +3412,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 86%[================> ] 4.86G 47.3MB/s eta 18s " + "B5-E0_1-mem-ctx-8k. 83%[===============> ] 4.74G 64.0MB/s eta 16s " ] }, { @@ -3414,7 +3420,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 86%[================> ] 4.87G 49.0MB/s eta 18s " + "5-E0_1-mem-ctx-8k.p 84%[===============> ] 4.74G 63.0MB/s eta 16s " ] }, { @@ -3422,7 +3428,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 86%[================> ] 4.89G 46.8MB/s eta 18s " + "-E0_1-mem-ctx-8k.pt 84%[===============> ] 4.75G 60.2MB/s eta 16s " ] }, { @@ -3430,7 +3436,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 86%[================> ] 4.90G 47.9MB/s eta 16s " + "E0_1-mem-ctx-8k.pth 84%[===============> ] 4.77G 56.0MB/s eta 15s " ] }, { @@ -3438,7 +3444,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 87%[================> ] 4.92G 48.2MB/s eta 16s " + "0_1-mem-ctx-8k.pth 84%[===============> ] 4.78G 56.7MB/s eta 15s " ] }, { @@ -3446,7 +3452,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 87%[================> ] 4.93G 48.5MB/s eta 16s " + "_1-mem-ctx-8k.pth 85%[================> ] 4.80G 60.8MB/s eta 15s " ] }, { @@ -3454,7 +3460,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 87%[================> ] 4.95G 48.5MB/s eta 16s " + "1-mem-ctx-8k.pth 85%[================> ] 4.83G 62.1MB/s eta 15s " ] }, { @@ -3462,7 +3468,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 87%[================> ] 4.95G 46.3MB/s eta 15s " + "-mem-ctx-8k.pth 85%[================> ] 4.84G 60.7MB/s eta 14s " ] }, { @@ -3470,7 +3476,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 87%[================> ] 4.96G 47.7MB/s eta 15s " + "mem-ctx-8k.pth 86%[================> ] 4.86G 56.9MB/s eta 14s " ] }, { @@ -3478,7 +3484,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 87%[================> ] 4.96G 45.5MB/s eta 15s " + "em-ctx-8k.pth 86%[================> ] 4.88G 58.5MB/s eta 14s " ] }, { @@ -3486,7 +3492,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 88%[================> ] 4.98G 44.7MB/s eta 15s " + "m-ctx-8k.pth 86%[================> ] 4.89G 58.3MB/s eta 14s " ] }, { @@ -3494,7 +3500,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 88%[================> ] 4.98G 42.7MB/s eta 15s " + "-ctx-8k.pth 86%[================> ] 4.90G 60.5MB/s eta 14s " ] }, { @@ -3502,7 +3508,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 88%[================> ] 4.99G 39.5MB/s eta 15s " + "ctx-8k.pth 87%[================> ] 4.92G 60.0MB/s eta 12s " ] }, { @@ -3510,7 +3516,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 88%[================> ] 5.00G 41.0MB/s eta 15s " + "tx-8k.pth 87%[================> ] 4.93G 59.4MB/s eta 12s " ] }, { @@ -3518,7 +3524,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 88%[================> ] 5.02G 42.5MB/s eta 15s " + "x-8k.pth 87%[================> ] 4.95G 59.1MB/s eta 12s " ] }, { @@ -3526,7 +3532,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 88%[================> ] 5.02G 41.8MB/s eta 15s " + "-8k.pth 87%[================> ] 4.96G 60.6MB/s eta 12s " ] }, { @@ -3534,7 +3540,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 89%[================> ] 5.04G 41.1MB/s eta 14s " + "8k.pth 88%[================> ] 4.99G 63.2MB/s eta 11s " ] }, { @@ -3542,7 +3548,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 89%[================> ] 5.05G 41.3MB/s eta 14s " + "k.pth 88%[================> ] 5.01G 63.3MB/s eta 11s " ] }, { @@ -3550,7 +3556,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 89%[================> ] 5.05G 36.6MB/s eta 14s " + ".pth 88%[================> ] 5.01G 57.9MB/s eta 11s " ] }, { @@ -3558,7 +3564,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 89%[================> ] 5.07G 39.2MB/s eta 14s " + "pth 89%[================> ] 5.03G 59.8MB/s eta 11s " ] }, { @@ -3566,7 +3572,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 89%[================> ] 5.07G 37.7MB/s eta 13s " + "th 89%[================> ] 5.04G 60.3MB/s eta 11s " ] }, { @@ -3574,7 +3580,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 90%[=================> ] 5.08G 36.2MB/s eta 13s " + "h 89%[================> ] 5.05G 56.5MB/s eta 10s " ] }, { @@ -3582,7 +3588,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 90%[=================> ] 5.10G 37.0MB/s eta 13s " + " 89%[================> ] 5.07G 56.9MB/s eta 10s " ] }, { @@ -3590,7 +3596,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 90%[=================> ] 5.11G 39.6MB/s eta 13s " + " E 90%[=================> ] 5.08G 56.4MB/s eta 10s " ] }, { @@ -3598,7 +3604,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 90%[=================> ] 5.12G 39.4MB/s eta 12s " + " EW 90%[=================> ] 5.10G 57.6MB/s eta 10s " ] }, { @@ -3606,7 +3612,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 91%[=================> ] 5.14G 41.6MB/s eta 12s " + " EWR 90%[=================> ] 5.11G 56.0MB/s eta 9s " ] }, { @@ -3614,7 +3620,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 91%[=================> ] 5.14G 40.0MB/s eta 12s " + " EWR- 90%[=================> ] 5.12G 55.5MB/s eta 9s " ] }, { @@ -3622,7 +3628,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 91%[=================> ] 5.16G 42.4MB/s eta 12s " + " EWR-1 90%[=================> ] 5.13G 56.8MB/s eta 9s " ] }, { @@ -3630,7 +3636,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 91%[=================> ] 5.17G 43.9MB/s eta 12s " + " EWR-1B 91%[=================> ] 5.14G 55.0MB/s eta 9s " ] }, { @@ -3638,7 +3644,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 91%[=================> ] 5.17G 41.0MB/s eta 11s " + " EWR-1B5 91%[=================> ] 5.15G 54.6MB/s eta 9s " ] }, { @@ -3646,7 +3652,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 91%[=================> ] 5.19G 43.9MB/s eta 11s " + " EWR-1B5- 91%[=================> ] 5.17G 54.1MB/s eta 8s " ] }, { @@ -3654,7 +3660,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 92%[=================> ] 5.20G 44.1MB/s eta 11s " + " EWR-1B5-E 91%[=================> ] 5.17G 51.3MB/s eta 8s " ] }, { @@ -3662,7 +3668,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 92%[=================> ] 5.21G 44.2MB/s eta 11s " + " EWR-1B5-E0 91%[=================> ] 5.19G 50.3MB/s eta 8s " ] }, { @@ -3670,7 +3676,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 92%[=================> ] 5.23G 44.7MB/s eta 9s " + " EWR-1B5-E0_ 92%[=================> ] 5.20G 51.1MB/s eta 8s " ] }, { @@ -3678,7 +3684,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 92%[=================> ] 5.24G 44.5MB/s eta 9s " + " EWR-1B5-E0_1 92%[=================> ] 5.21G 53.3MB/s eta 7s " ] }, { @@ -3686,7 +3692,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 93%[=================> ] 5.25G 45.6MB/s eta 9s " + " EWR-1B5-E0_1- 92%[=================> ] 5.24G 56.3MB/s eta 7s " ] }, { @@ -3694,7 +3700,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 93%[=================> ] 5.26G 49.2MB/s eta 9s " + " EWR-1B5-E0_1-m 93%[=================> ] 5.26G 55.1MB/s eta 7s " ] }, { @@ -3702,7 +3708,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 93%[=================> ] 5.27G 48.5MB/s eta 9s " + " EWR-1B5-E0_1-me 93%[=================> ] 5.27G 57.5MB/s eta 7s " ] }, { @@ -3710,7 +3716,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 93%[=================> ] 5.29G 49.6MB/s eta 8s " + " EWR-1B5-E0_1-mem 93%[=================> ] 5.29G 58.3MB/s eta 7s " ] }, { @@ -3718,7 +3724,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 93%[=================> ] 5.29G 46.3MB/s eta 8s " + " EWR-1B5-E0_1-mem- 93%[=================> ] 5.30G 58.3MB/s eta 6s " ] }, { @@ -3726,7 +3732,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 94%[=================> ] 5.31G 47.3MB/s eta 8s " + " EWR-1B5-E0_1-mem-c 94%[=================> ] 5.32G 58.8MB/s eta 6s " ] }, { @@ -3734,7 +3740,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 94%[=================> ] 5.32G 47.0MB/s eta 8s " + "EWR-1B5-E0_1-mem-ct 94%[=================> ] 5.33G 59.2MB/s eta 6s " ] }, { @@ -3742,7 +3748,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 94%[=================> ] 5.33G 49.8MB/s eta 8s " + "WR-1B5-E0_1-mem-ctx 94%[=================> ] 5.35G 60.8MB/s eta 6s " ] }, { @@ -3750,7 +3756,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 94%[=================> ] 5.35G 49.5MB/s eta 7s " + "R-1B5-E0_1-mem-ctx- 95%[==================> ] 5.36G 61.8MB/s eta 6s " ] }, { @@ -3758,7 +3764,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 95%[==================> ] 5.36G 48.9MB/s eta 7s " + "-1B5-E0_1-mem-ctx-8 95%[==================> ] 5.38G 61.8MB/s eta 5s " ] }, { @@ -3766,7 +3772,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 95%[==================> ] 5.38G 51.0MB/s eta 7s " + "1B5-E0_1-mem-ctx-8k 95%[==================> ] 5.39G 60.5MB/s eta 5s " ] }, { @@ -3774,7 +3780,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 95%[==================> ] 5.39G 52.7MB/s eta 7s " + "B5-E0_1-mem-ctx-8k. 95%[==================> ] 5.41G 61.4MB/s eta 5s " ] }, { @@ -3782,7 +3788,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 95%[==================> ] 5.41G 53.1MB/s eta 7s " + "5-E0_1-mem-ctx-8k.p 96%[==================> ] 5.42G 62.4MB/s eta 5s " ] }, { @@ -3790,7 +3796,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 95%[==================> ] 5.41G 51.9MB/s eta 5s " + "-E0_1-mem-ctx-8k.pt 96%[==================> ] 5.44G 61.7MB/s eta 4s " ] }, { @@ -3798,7 +3804,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 96%[==================> ] 5.42G 51.9MB/s eta 5s " + "E0_1-mem-ctx-8k.pth 96%[==================> ] 5.45G 60.3MB/s eta 4s " ] }, { @@ -3806,7 +3812,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 96%[==================> ] 5.44G 53.3MB/s eta 5s " + "0_1-mem-ctx-8k.pth 96%[==================> ] 5.47G 58.9MB/s eta 4s " ] }, { @@ -3814,7 +3820,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 96%[==================> ] 5.45G 53.7MB/s eta 5s " + "_1-mem-ctx-8k.pth 97%[==================> ] 5.48G 56.8MB/s eta 4s " ] }, { @@ -3822,7 +3828,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 96%[==================> ] 5.46G 53.6MB/s eta 5s " + "1-mem-ctx-8k.pth 97%[==================> ] 5.50G 56.2MB/s eta 3s " ] }, { @@ -3830,7 +3836,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 96%[==================> ] 5.47G 52.1MB/s eta 4s " + "-mem-ctx-8k.pth 97%[==================> ] 5.51G 54.8MB/s eta 3s " ] }, { @@ -3838,7 +3844,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 97%[==================> ] 5.49G 53.2MB/s eta 4s " + "mem-ctx-8k.pth 97%[==================> ] 5.52G 54.3MB/s eta 3s " ] }, { @@ -3846,7 +3852,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 97%[==================> ] 5.50G 52.6MB/s eta 4s " + "em-ctx-8k.pth 97%[==================> ] 5.53G 52.5MB/s eta 3s " ] }, { @@ -3854,7 +3860,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 97%[==================> ] 5.51G 52.9MB/s eta 4s " + "m-ctx-8k.pth 98%[==================> ] 5.54G 52.4MB/s eta 2s " ] }, { @@ -3862,7 +3868,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 97%[==================> ] 5.51G 52.5MB/s eta 4s " + "-ctx-8k.pth 98%[==================> ] 5.56G 52.3MB/s eta 2s " ] }, { @@ -3870,7 +3876,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 97%[==================> ] 5.52G 49.7MB/s eta 3s " + "ctx-8k.pth 98%[==================> ] 5.57G 52.1MB/s eta 2s " ] }, { @@ -3878,7 +3884,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 97%[==================> ] 5.53G 49.4MB/s eta 3s " + "tx-8k.pth 98%[==================> ] 5.58G 49.7MB/s eta 2s " ] }, { @@ -3886,7 +3892,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 98%[==================> ] 5.54G 48.4MB/s eta 3s " + "x-8k.pth 99%[==================> ] 5.59G 50.4MB/s eta 2s " ] }, { @@ -3894,7 +3900,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 98%[==================> ] 5.56G 48.0MB/s eta 3s " + "-8k.pth 99%[==================> ] 5.61G 55.0MB/s eta 1s " ] }, { @@ -3902,7 +3908,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 98%[==================> ] 5.57G 50.4MB/s eta 3s " + "8k.pth 99%[==================> ] 5.63G 55.0MB/s eta 1s " ] }, { @@ -3910,31 +3916,44 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 99%[==================> ] 5.59G 48.2MB/s eta 1s " + "k.pth 99%[==================> ] 5.64G 56.1MB/s eta 1s \r", + "EWR-1B5-E0_1-mem-ct 100%[===================>] 5.64G 56.3MB/s in 98s \r\n", + "\r\n", + "2023-08-26 13:29:16 (59.2 MB/s) - ‘EWR-1B5-E0_1-mem-ctx-8k.pth’ saved [6060483163/6060483163]\r\n", + "\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "BaseV5-C-Tune5.pth 99%[==================> ] 5.60G 48.7MB/s eta 1s " + "--2023-08-26 13:29:16-- https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/v5-L6-D2048-E0_1-mem-ctx-8k.pth\r\n", + "Resolving huggingface.co (huggingface.co)... 18.154.227.67, 18.154.227.7, 18.154.227.87, ...\r\n", + "Connecting to huggingface.co (huggingface.co)|18.154.227.67|:443... connected.\r\n", + "HTTP request sent, awaiting response... 302 Found\r\n", + "Location: https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/87b64f45529c2049a8b044b7e7c0338a9ede8ba8259d17d987d8e73f8a34fd75?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D2048-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D2048-E0_1-mem-ctx-8k.pth%22%3B&Expires=1693315756&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5MzMxNTc1Nn19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwLzg3YjY0ZjQ1NTI5YzIwNDlhOGIwNDRiN2U3YzAzMzhhOWVkZThiYTgyNTlkMTdkOTg3ZDhlNzNmOGEzNGZkNzU%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=nQ-K9pUZqkf3Qb-X5VycpSsb2NBCdUjo2I2d1pYB%7EE1ldNGTAfgN6a9qOGn5UuHtD8nAyITD6NgR95cqWgn2AqAUWCTWcqYBc7tuhVIPmbwrYHUwl6FJ52hjrRPmxZngcRQu2Lbg7PXij9qDfqdh1r%7E6z05NRVnGTQ0GkZQQb3maRu5uC9d83DSC88AmR371N2AwiH3t5VUs8w80YL%7E90nAIoeoBsBaMEATtt8k6x6KER-NDZ2fmKLch4cTHxIDGPEaYOKnFyimPy5PWpFC8WYAoGlCE6jLa5P5eXpArLXCNScNiYp4tGyNmcA80Pf9TN9E6UZ-PfU7LwjmrUR2hKg__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", + "--2023-08-26 13:29:16-- https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/87b64f45529c2049a8b044b7e7c0338a9ede8ba8259d17d987d8e73f8a34fd75?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D2048-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D2048-E0_1-mem-ctx-8k.pth%22%3B&Expires=1693315756&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5MzMxNTc1Nn19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwLzg3YjY0ZjQ1NTI5YzIwNDlhOGIwNDRiN2U3YzAzMzhhOWVkZThiYTgyNTlkMTdkOTg3ZDhlNzNmOGEzNGZkNzU%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=nQ-K9pUZqkf3Qb-X5VycpSsb2NBCdUjo2I2d1pYB%7EE1ldNGTAfgN6a9qOGn5UuHtD8nAyITD6NgR95cqWgn2AqAUWCTWcqYBc7tuhVIPmbwrYHUwl6FJ52hjrRPmxZngcRQu2Lbg7PXij9qDfqdh1r%7E6z05NRVnGTQ0GkZQQb3maRu5uC9d83DSC88AmR371N2AwiH3t5VUs8w80YL%7E90nAIoeoBsBaMEATtt8k6x6KER-NDZ2fmKLch4cTHxIDGPEaYOKnFyimPy5PWpFC8WYAoGlCE6jLa5P5eXpArLXCNScNiYp4tGyNmcA80Pf9TN9E6UZ-PfU7LwjmrUR2hKg__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", + "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.121, 108.138.64.111, 108.138.64.36, ...\r\n", + "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.121|:443... connected.\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "BaseV5-C-Tune5.pth 99%[==================> ] 5.62G 47.2MB/s eta 1s " + "HTTP request sent, awaiting response... " ] }, { "name": "stdout", "output_type": "stream", "text": [ + "200 OK\r\n", + "Length: 1066508293 (1017M) [binary/octet-stream]\r\n", + "Saving to: ‘v5-L6-D2048-E0_1-mem-ctx-8k.pth’\r\n", + "\r\n", "\r", - "BaseV5-C-Tune5.pth 99%[==================> ] 5.63G 50.1MB/s eta 1s " + " v5-L6-D20 0%[ ] 0 --.-KB/s " ] }, { @@ -3942,7 +3961,7 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 99%[==================> ] 5.63G 46.6MB/s eta 0s " + " v5-L6-D204 1%[ ] 15.26M 59.8MB/s " ] }, { @@ -3950,45 +3969,31 @@ "output_type": "stream", "text": [ "\r", - "BaseV5-C-Tune5.pth 99%[==================> ] 5.64G 44.2MB/s eta 0s \r", - "BaseV5-C-Tune5.pth 100%[===================>] 5.64G 44.3MB/s in 2m 6s \r\n", - "\r\n", - "2023-09-05 20:00:31 (46.0 MB/s) - ‘BaseV5-C-Tune5.pth’ saved [6060483063/6060483063]\r\n", - "\r\n" + " v5-L6-D2048 2%[ ] 30.00M 60.8MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ - "--2023-09-05 20:00:31-- https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/EWR-1B5-E0_1-mem-ctx-8k.pth\r\n", - "Resolving huggingface.co (huggingface.co)... 18.154.227.67, 18.154.227.7, 18.154.227.69, ...\r\n", - "Connecting to huggingface.co (huggingface.co)|18.154.227.67|:443... connected.\r\n", - "HTTP request sent, awaiting response... " + "\r", + " v5-L6-D2048- 4%[ ] 45.26M 63.8MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ - "302 Found\r\n", - "Location: https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/e886ffafd5148b502a00b1c10c847ca918cec61c4c956956a2fe9811c210029b?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27EWR-1B5-E0_1-mem-ctx-8k.pth%3B+filename%3D%22EWR-1B5-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203231&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzIzMX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwL2U4ODZmZmFmZDUxNDhiNTAyYTAwYjFjMTBjODQ3Y2E5MThjZWM2MWM0Yzk1Njk1NmEyZmU5ODExYzIxMDAyOWI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=H7dALzpJjHXiRmYXfCi5wdUGBxT-ks5NF0PcdQAODDoHu%7E%7EBwyHOnsQGokQKeqqOmFA-%7E2cFXnl87ifEl3RrCl-xYvtCqJsTu-PCrHupXjKegnvyjToQCJIDtyW5f4RJ9aMmecwsGyTEJG1Nz0q-7Xm4OQfTBH-ItJ34BnzDQgW2XnuVav0keVtbME-KGM-ors8KbEGdI-tHni2lihjuxbBBxaV226vGo9Q7jssSP7WPLseWzK3-16BBLv3At3JjlpxbmDMCBFqNxBnJZbyTsrwmAIRj31kHFM15VSAa0y0CRfQ1Uh09OgdQr2zjlEWgU0mqpgv0M53%7ELLAtQP%7E%7ENw__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", - "--2023-09-05 20:00:31-- https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/e886ffafd5148b502a00b1c10c847ca918cec61c4c956956a2fe9811c210029b?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27EWR-1B5-E0_1-mem-ctx-8k.pth%3B+filename%3D%22EWR-1B5-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203231&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzIzMX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwL2U4ODZmZmFmZDUxNDhiNTAyYTAwYjFjMTBjODQ3Y2E5MThjZWM2MWM0Yzk1Njk1NmEyZmU5ODExYzIxMDAyOWI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=H7dALzpJjHXiRmYXfCi5wdUGBxT-ks5NF0PcdQAODDoHu%7E%7EBwyHOnsQGokQKeqqOmFA-%7E2cFXnl87ifEl3RrCl-xYvtCqJsTu-PCrHupXjKegnvyjToQCJIDtyW5f4RJ9aMmecwsGyTEJG1Nz0q-7Xm4OQfTBH-ItJ34BnzDQgW2XnuVav0keVtbME-KGM-ors8KbEGdI-tHni2lihjuxbBBxaV226vGo9Q7jssSP7WPLseWzK3-16BBLv3At3JjlpxbmDMCBFqNxBnJZbyTsrwmAIRj31kHFM15VSAa0y0CRfQ1Uh09OgdQr2zjlEWgU0mqpgv0M53%7ELLAtQP%7E%7ENw__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", - "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.111, 108.138.64.36, 108.138.64.49, ...\r\n", - "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.111|:443... connected.\r\n", - "HTTP request sent, awaiting response... " + "\r", + " v5-L6-D2048-E 4%[ ] 45.90M 48.9MB/s " ] }, { "name": "stdout", "output_type": "stream", "text": [ - "200 OK\r\n", - "Length: 6060483163 (5.6G) [binary/octet-stream]\r\n", - "Saving to: ‘EWR-1B5-E0_1-mem-ctx-8k.pth’\r\n", - "\r\n", "\r", - " EWR-1B5-E 0%[ ] 0 --.-KB/s " + " v5-L6-D2048-E0 5%[> ] 60.52M 47.1MB/s " ] }, { @@ -3996,7 +4001,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0 0%[ ] 14.74M 63.3MB/s " + " v5-L6-D2048-E0_ 7%[> ] 75.78M 50.3MB/s " ] }, { @@ -4004,7 +4009,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_ 0%[ ] 17.24M 39.8MB/s " + " v5-L6-D2048-E0_1 8%[> ] 86.07M 50.4MB/s " ] }, { @@ -4012,7 +4017,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1 0%[ ] 30.00M 46.2MB/s " + " v5-L6-D2048-E0_1- 9%[> ] 96.66M 50.7MB/s " ] }, { @@ -4020,7 +4025,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1- 0%[ ] 30.52M 33.1MB/s " + " v5-L6-D2048-E0_1-m 10%[=> ] 106.81M 50.2MB/s " ] }, { @@ -4028,7 +4033,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-m 0%[ ] 46.48M 41.5MB/s " + "v5-L6-D2048-E0_1-me 12%[=> ] 127.07M 54.6MB/s " ] }, { @@ -4036,7 +4041,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-me 1%[ ] 60.52M 41.9MB/s " + "5-L6-D2048-E0_1-mem 14%[=> ] 151.05M 59.7MB/s " ] }, { @@ -4044,7 +4049,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem 1%[ ] 62.21M 37.8MB/s " + "-L6-D2048-E0_1-mem- 15%[==> ] 161.83M 59.3MB/s " ] }, { @@ -4052,7 +4057,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem- 1%[ ] 76.29M 39.9MB/s " + "L6-D2048-E0_1-mem-c 16%[==> ] 167.85M 56.4MB/s " ] }, { @@ -4060,7 +4065,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem-c 1%[ ] 91.55M 41.8MB/s " + "6-D2048-E0_1-mem-ct 18%[==> ] 183.10M 53.6MB/s eta 16s " ] }, { @@ -4068,7 +4073,7 @@ "output_type": "stream", "text": [ "\r", - "EWR-1B5-E0_1-mem-ct 1%[ ] 106.81M 41.6MB/s " + "-D2048-E0_1-mem-ctx 19%[==> ] 198.36M 54.4MB/s eta 16s " ] }, { @@ -4076,7 +4081,7 @@ "output_type": "stream", "text": [ "\r", - "WR-1B5-E0_1-mem-ctx 2%[ ] 120.25M 43.2MB/s " + "D2048-E0_1-mem-ctx- 21%[===> ] 213.62M 54.5MB/s eta 16s " ] }, { @@ -4084,7 +4089,7 @@ "output_type": "stream", "text": [ "\r", - "R-1B5-E0_1-mem-ctx- 2%[ ] 127.59M 42.8MB/s " + "2048-E0_1-mem-ctx-8 21%[===> ] 219.93M 51.6MB/s eta 16s " ] }, { @@ -4092,7 +4097,7 @@ "output_type": "stream", "text": [ "\r", - "-1B5-E0_1-mem-ctx-8 2%[ ] 137.33M 42.9MB/s eta 2m 12s " + "048-E0_1-mem-ctx-8k 22%[===> ] 229.84M 52.4MB/s eta 16s " ] }, { @@ -4100,7 +4105,7 @@ "output_type": "stream", "text": [ "\r", - "1B5-E0_1-mem-ctx-8k 2%[ ] 152.45M 44.6MB/s eta 2m 12s " + "48-E0_1-mem-ctx-8k. 23%[===> ] 242.32M 50.5MB/s eta 15s " ] }, { @@ -4108,7 +4113,7 @@ "output_type": "stream", "text": [ "\r", - "B5-E0_1-mem-ctx-8k. 2%[ ] 152.59M 41.9MB/s eta 2m 12s " + "8-E0_1-mem-ctx-8k.p 25%[====> ] 258.89M 53.4MB/s eta 15s " ] }, { @@ -4116,7 +4121,7 @@ "output_type": "stream", "text": [ "\r", - "5-E0_1-mem-ctx-8k.p 2%[ ] 163.51M 42.6MB/s eta 2m 12s " + "-E0_1-mem-ctx-8k.pt 26%[====> ] 274.14M 53.7MB/s eta 15s " ] }, { @@ -4124,7 +4129,7 @@ "output_type": "stream", "text": [ "\r", - "-E0_1-mem-ctx-8k.pt 3%[ ] 181.57M 45.0MB/s eta 2m 12s " + "E0_1-mem-ctx-8k.pth 28%[====> ] 289.40M 55.0MB/s eta 15s " ] }, { @@ -4132,7 +4137,7 @@ "output_type": "stream", "text": [ "\r", - "E0_1-mem-ctx-8k.pth 3%[ ] 183.10M 42.7MB/s eta 2m 11s " + "0_1-mem-ctx-8k.pth 29%[====> ] 296.23M 54.0MB/s eta 15s " ] }, { @@ -4140,7 +4145,7 @@ "output_type": "stream", "text": [ "\r", - "0_1-mem-ctx-8k.pth 3%[ ] 198.36M 40.6MB/s eta 2m 11s " + "_1-mem-ctx-8k.pth 30%[=====> ] 305.18M 54.5MB/s eta 14s " ] }, { @@ -4148,7 +4153,7 @@ "output_type": "stream", "text": [ "\r", - "_1-mem-ctx-8k.pth 3%[ ] 213.62M 43.7MB/s eta 2m 11s " + "1-mem-ctx-8k.pth 33%[=====> ] 335.69M 57.8MB/s eta 14s " ] }, { @@ -4156,7 +4161,7 @@ "output_type": "stream", "text": [ "\r", - "1-mem-ctx-8k.pth 3%[ ] 228.36M 43.1MB/s eta 2m 11s " + "-mem-ctx-8k.pth 35%[======> ] 357.26M 57.6MB/s eta 14s " ] }, { @@ -4164,7 +4169,7 @@ "output_type": "stream", "text": [ "\r", - "-mem-ctx-8k.pth 4%[ ] 239.57M 46.2MB/s eta 2m 6s " + "mem-ctx-8k.pth 36%[======> ] 376.17M 58.0MB/s eta 14s " ] }, { @@ -4172,7 +4177,7 @@ "output_type": "stream", "text": [ "\r", - "mem-ctx-8k.pth 4%[ ] 244.13M 42.5MB/s eta 2m 6s " + "em-ctx-8k.pth 37%[======> ] 381.47M 56.0MB/s eta 14s " ] }, { @@ -4180,7 +4185,7 @@ "output_type": "stream", "text": [ "\r", - "em-ctx-8k.pth 4%[ ] 259.40M 42.9MB/s eta 2m 6s " + "m-ctx-8k.pth 39%[======> ] 396.73M 55.5MB/s eta 11s " ] }, { @@ -4188,7 +4193,7 @@ "output_type": "stream", "text": [ "\r", - "m-ctx-8k.pth 4%[ ] 274.52M 45.9MB/s eta 2m 6s " + "-ctx-8k.pth 40%[=======> ] 410.16M 55.5MB/s eta 11s " ] }, { @@ -4196,7 +4201,7 @@ "output_type": "stream", "text": [ "\r", - "-ctx-8k.pth 5%[> ] 289.92M 44.5MB/s eta 2m 5s " + "ctx-8k.pth 41%[=======> ] 426.73M 57.1MB/s eta 11s " ] }, { @@ -4204,7 +4209,7 @@ "output_type": "stream", "text": [ "\r", - "ctx-8k.pth 5%[> ] 305.18M 45.2MB/s eta 2m 5s " + "tx-8k.pth 42%[=======> ] 436.06M 59.8MB/s eta 11s " ] }, { @@ -4212,7 +4217,7 @@ "output_type": "stream", "text": [ "\r", - "tx-8k.pth 5%[> ] 320.56M 45.1MB/s eta 2m 5s " + "x-8k.pth 43%[=======> ] 442.51M 57.7MB/s eta 11s " ] }, { @@ -4220,7 +4225,7 @@ "output_type": "stream", "text": [ "\r", - "x-8k.pth 5%[> ] 335.18M 47.6MB/s eta 2m 5s " + "-8k.pth 45%[========> ] 465.45M 62.0MB/s eta 10s " ] }, { @@ -4228,7 +4233,7 @@ "output_type": "stream", "text": [ "\r", - "-8k.pth 6%[> ] 350.95M 48.8MB/s eta 1m 58s " + "8k.pth 46%[========> ] 473.02M 61.3MB/s eta 10s " ] }, { @@ -4236,7 +4241,7 @@ "output_type": "stream", "text": [ "\r", - "8k.pth 6%[> ] 366.20M 46.3MB/s eta 1m 58s " + "k.pth 48%[========> ] 488.28M 64.5MB/s eta 10s " ] }, { @@ -4244,7 +4249,7 @@ "output_type": "stream", "text": [ "\r", - "k.pth 6%[> ] 381.47M 49.4MB/s eta 1m 58s " + ".pth 49%[========> ] 503.03M 64.2MB/s eta 10s " ] }, { @@ -4252,7 +4257,7 @@ "output_type": "stream", "text": [ "\r", - ".pth 6%[> ] 396.73M 48.3MB/s eta 1m 58s " + "pth 51%[=========> ] 518.80M 65.1MB/s eta 10s " ] }, { @@ -4260,7 +4265,7 @@ "output_type": "stream", "text": [ "\r", - "pth 7%[> ] 414.61M 49.7MB/s eta 1m 58s " + "th 52%[=========> ] 535.97M 65.2MB/s eta 8s " ] }, { @@ -4268,7 +4273,7 @@ "output_type": "stream", "text": [ "\r", - "th 7%[> ] 426.73M 51.4MB/s eta 1m 58s " + "h 54%[=========> ] 549.31M 67.0MB/s eta 8s " ] }, { @@ -4276,7 +4281,7 @@ "output_type": "stream", "text": [ "\r", - "h 7%[> ] 430.51M 49.0MB/s eta 1m 58s " + " 55%[==========> ] 564.06M 67.8MB/s eta 8s " ] }, { @@ -4284,7 +4289,7 @@ "output_type": "stream", "text": [ "\r", - " 7%[> ] 440.68M 48.0MB/s eta 1m 58s " + " v 57%[==========> ] 579.83M 59.7MB/s eta 8s " ] }, { @@ -4292,7 +4297,7 @@ "output_type": "stream", "text": [ "\r", - " E 7%[> ] 455.93M 49.6MB/s eta 1m 57s " + " v5 58%[==========> ] 595.09M 60.2MB/s eta 7s " ] }, { @@ -4300,7 +4305,7 @@ "output_type": "stream", "text": [ "\r", - " EW 7%[> ] 460.26M 48.1MB/s eta 1m 57s " + " v5- 60%[===========> ] 610.35M 60.2MB/s eta 7s " ] }, { @@ -4308,7 +4313,7 @@ "output_type": "stream", "text": [ "\r", - " EWR 8%[> ] 468.32M 46.0MB/s eta 1m 57s " + " v5-L 61%[===========> ] 625.61M 59.7MB/s eta 7s " ] }, { @@ -4316,7 +4321,7 @@ "output_type": "stream", "text": [ "\r", - " EWR- 8%[> ] 473.50M 46.0MB/s eta 1m 57s " + " v5-L6 63%[===========> ] 640.87M 57.7MB/s eta 7s " ] }, { @@ -4324,7 +4329,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1 8%[> ] 488.28M 44.7MB/s eta 1m 57s " + " v5-L6- 64%[===========> ] 655.62M 57.6MB/s eta 6s " ] }, { @@ -4332,7 +4337,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B 8%[> ] 503.54M 40.7MB/s eta 2m 0s " + " v5-L6-D 65%[============> ] 667.88M 56.7MB/s eta 6s " ] }, { @@ -4340,7 +4345,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5 8%[> ] 518.80M 44.0MB/s eta 2m 0s " + " v5-L6-D2 65%[============> ] 669.55M 55.9MB/s eta 6s " ] }, { @@ -4348,7 +4353,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5- 9%[> ] 534.05M 40.9MB/s eta 2m 0s " + " v5-L6-D20 67%[============> ] 686.13M 55.7MB/s eta 6s " ] }, { @@ -4356,7 +4361,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E 9%[> ] 548.80M 43.9MB/s eta 2m 0s " + " v5-L6-D204 69%[============> ] 701.90M 53.6MB/s eta 6s " ] }, { @@ -4364,7 +4369,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0 9%[> ] 556.34M 41.7MB/s eta 2m 0s " + " v5-L6-D2048 70%[=============> ] 717.16M 52.7MB/s eta 5s " ] }, { @@ -4372,7 +4377,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_ 9%[> ] 564.58M 43.2MB/s eta 1m 57s " + " v5-L6-D2048- 72%[=============> ] 732.42M 53.9MB/s eta 5s " ] }, { @@ -4380,7 +4385,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1 9%[> ] 577.31M 41.3MB/s eta 1m 57s " + " v5-L6-D2048-E 73%[=============> ] 747.69M 53.1MB/s eta 5s " ] }, { @@ -4388,7 +4393,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1- 10%[=> ] 579.83M 39.0MB/s eta 1m 57s " + " v5-L6-D2048-E0 75%[==============> ] 762.94M 52.9MB/s eta 5s " ] }, { @@ -4396,7 +4401,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-m 10%[=> ] 594.57M 42.3MB/s eta 1m 57s " + " v5-L6-D2048-E0_ 76%[==============> ] 777.68M 53.0MB/s eta 5s " ] }, { @@ -4404,7 +4409,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-me 10%[=> ] 605.08M 42.6MB/s eta 1m 57s " + " v5-L6-D2048-E0_1 77%[==============> ] 792.94M 53.8MB/s eta 4s " ] }, { @@ -4412,7 +4417,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem 10%[=> ] 610.35M 41.2MB/s eta 1m 57s " + " v5-L6-D2048-E0_1- 79%[==============> ] 808.20M 54.2MB/s eta 4s " ] }, { @@ -4420,7 +4425,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem- 10%[=> ] 625.61M 42.7MB/s eta 1m 57s " + " v5-L6-D2048-E0_1-m 81%[===============> ] 823.97M 53.3MB/s eta 4s " ] }, { @@ -4428,7 +4433,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem-c 11%[=> ] 640.87M 43.7MB/s eta 1m 57s " + "v5-L6-D2048-E0_1-me 82%[===============> ] 839.23M 53.4MB/s eta 4s " ] }, { @@ -4436,7 +4441,7 @@ "output_type": "stream", "text": [ "\r", - "EWR-1B5-E0_1-mem-ct 11%[=> ] 656.13M 45.2MB/s eta 1m 57s " + "5-L6-D2048-E0_1-mem 84%[===============> ] 854.49M 55.2MB/s eta 3s " ] }, { @@ -4444,7 +4449,7 @@ "output_type": "stream", "text": [ "\r", - "WR-1B5-E0_1-mem-ctx 11%[=> ] 671.38M 45.5MB/s eta 1m 54s " + "-L6-D2048-E0_1-mem- 86%[================> ] 882.15M 58.6MB/s eta 3s " ] }, { @@ -4452,7 +4457,7 @@ "output_type": "stream", "text": [ "\r", - "R-1B5-E0_1-mem-ctx- 11%[=> ] 686.64M 44.7MB/s eta 1m 54s " + "L6-D2048-E0_1-mem-c 86%[================> ] 884.49M 58.0MB/s eta 3s " ] }, { @@ -4460,7 +4465,7 @@ "output_type": "stream", "text": [ "\r", - "-1B5-E0_1-mem-ctx-8 12%[=> ] 701.90M 45.3MB/s eta 1m 54s " + "6-D2048-E0_1-mem-ct 88%[================> ] 899.75M 59.7MB/s eta 3s " ] }, { @@ -4468,7 +4473,7 @@ "output_type": "stream", "text": [ "\r", - "1B5-E0_1-mem-ctx-8k 12%[=> ] 716.64M 44.2MB/s eta 1m 54s " + "-D2048-E0_1-mem-ctx 89%[================> ] 915.01M 61.3MB/s eta 3s " ] }, { @@ -4476,7 +4481,7 @@ "output_type": "stream", "text": [ "\r", - "B5-E0_1-mem-ctx-8k. 12%[=> ] 719.78M 44.5MB/s eta 1m 53s " + "D2048-E0_1-mem-ctx- 91%[=================> ] 928.95M 60.5MB/s eta 2s " ] }, { @@ -4484,7 +4489,7 @@ "output_type": "stream", "text": [ "\r", - "5-E0_1-mem-ctx-8k.p 12%[=> ] 731.91M 44.2MB/s eta 1m 53s " + "2048-E0_1-mem-ctx-8 93%[=================> ] 946.04M 61.1MB/s eta 2s " ] }, { @@ -4492,7 +4497,7 @@ "output_type": "stream", "text": [ "\r", - "-E0_1-mem-ctx-8k.pt 12%[=> ] 744.53M 46.8MB/s eta 1m 53s " + "048-E0_1-mem-ctx-8k 94%[=================> ] 961.30M 59.8MB/s eta 2s " ] }, { @@ -4500,7 +4505,7 @@ "output_type": "stream", "text": [ "\r", - "E0_1-mem-ctx-8k.pth 12%[=> ] 747.81M 43.0MB/s eta 1m 53s " + "48-E0_1-mem-ctx-8k. 96%[==================> ] 976.55M 62.9MB/s eta 2s " ] }, { @@ -4508,7 +4513,7 @@ "output_type": "stream", "text": [ "\r", - "0_1-mem-ctx-8k.pth 13%[=> ] 762.42M 45.4MB/s eta 1m 53s " + "8-E0_1-mem-ctx-8k.p 97%[==================> ] 993.88M 62.0MB/s eta 0s " ] }, { @@ -4516,7 +4521,7 @@ "output_type": "stream", "text": [ "\r", - "_1-mem-ctx-8k.pth 13%[=> ] 763.07M 42.7MB/s eta 1m 53s " + "-E0_1-mem-ctx-8k.pt 98%[==================> ] 1002M 60.7MB/s eta 0s " ] }, { @@ -4524,7 +4529,7 @@ "output_type": "stream", "text": [ "\r", - "1-mem-ctx-8k.pth 13%[=> ] 778.20M 43.9MB/s eta 1m 53s " + "E0_1-mem-ctx-8k.pth 99%[==================> ] 1007M 57.6MB/s eta 0s " ] }, { @@ -4532,31 +4537,45 @@ "output_type": "stream", "text": [ "\r", - "-mem-ctx-8k.pth 13%[=> ] 793.31M 46.6MB/s eta 1m 53s " + "0_1-mem-ctx-8k.pth 99%[==================> ] 1016M 56.2MB/s eta 0s \r", + "v5-L6-D2048-E0_1-me 100%[===================>] 1017M 56.5MB/s in 18s \r\n", + "\r\n", + "2023-08-26 13:29:35 (56.7 MB/s) - ‘v5-L6-D2048-E0_1-mem-ctx-8k.pth’ saved [1066508293/1066508293]\r\n", + "\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "mem-ctx-8k.pth 13%[=> ] 800.53M 46.0MB/s eta 1m 53s " + "--2023-08-26 13:29:35-- https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/v5-L6-D4096-E0_1-mem-ctx-8k.pth\r\n", + "Resolving huggingface.co (huggingface.co)... 18.154.227.69, 18.154.227.87, 18.154.227.7, ...\r\n", + "Connecting to huggingface.co (huggingface.co)|18.154.227.69|:443... connected.\r\n", + "HTTP request sent, awaiting response... " ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "em-ctx-8k.pth 13%[=> ] 808.20M 44.3MB/s eta 1m 53s " + "302 Found\r\n", + "Location: https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/5f93b1f6f6f7fb2193130a3a51f8ed41a0541b1b5eab100ca9318c8218d481fa?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D4096-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D4096-E0_1-mem-ctx-8k.pth%22%3B&Expires=1693315775&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5MzMxNTc3NX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwLzVmOTNiMWY2ZjZmN2ZiMjE5MzEzMGEzYTUxZjhlZDQxYTA1NDFiMWI1ZWFiMTAwY2E5MzE4YzgyMThkNDgxZmE%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=0PAV9vjTAoSaKMEFt4ra050ppnm5%7EebPodEspDpM%7Egvrid9e19xm4sLLXhnWRGgm63iOJ2eZykOhOquOiG9HtoO5NACC2I3xGt4x8Ti%7Eujc0ObTE8Ks9NcRCIrd2B5DeiQANgL-qAUZfh5hj9MGOyy7MMQZNET%7E7eTFHVGLpB2ijJYbdQPjUO5qF0ZHho9T6avOAi8AyTLlwAfXXldcR7JLX1DLCMWgzZXFvv8AP2i6QgstOqEZ8MX5W%7ESS0mwHkJMhtC234TiouvTE0GcZV7ErFMjAats%7EOPqJj6pp9oh3azAdUqXR%7EBRTlZIZCe5E5oTkBzS3m33LT7cRt5cVSSw__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", + "--2023-08-26 13:29:35-- https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/5f93b1f6f6f7fb2193130a3a51f8ed41a0541b1b5eab100ca9318c8218d481fa?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D4096-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D4096-E0_1-mem-ctx-8k.pth%22%3B&Expires=1693315775&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5MzMxNTc3NX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwLzVmOTNiMWY2ZjZmN2ZiMjE5MzEzMGEzYTUxZjhlZDQxYTA1NDFiMWI1ZWFiMTAwY2E5MzE4YzgyMThkNDgxZmE%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=0PAV9vjTAoSaKMEFt4ra050ppnm5%7EebPodEspDpM%7Egvrid9e19xm4sLLXhnWRGgm63iOJ2eZykOhOquOiG9HtoO5NACC2I3xGt4x8Ti%7Eujc0ObTE8Ks9NcRCIrd2B5DeiQANgL-qAUZfh5hj9MGOyy7MMQZNET%7E7eTFHVGLpB2ijJYbdQPjUO5qF0ZHho9T6avOAi8AyTLlwAfXXldcR7JLX1DLCMWgzZXFvv8AP2i6QgstOqEZ8MX5W%7ESS0mwHkJMhtC234TiouvTE0GcZV7ErFMjAats%7EOPqJj6pp9oh3azAdUqXR%7EBRTlZIZCe5E5oTkBzS3m33LT7cRt5cVSSw__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", + "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.49, 108.138.64.36, 108.138.64.111, ...\r\n", + "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.49|:443... connected.\r\n", + "HTTP request sent, awaiting response... " ] }, { "name": "stdout", "output_type": "stream", "text": [ + "200 OK\r\n", + "Length: 3441599237 (3.2G) [binary/octet-stream]\r\n", + "Saving to: ‘v5-L6-D4096-E0_1-mem-ctx-8k.pth’\r\n", + "\r\n", "\r", - "m-ctx-8k.pth 14%[=> ] 809.59M 41.2MB/s eta 1m 53s " + " v5-L6-D40 0%[ ] 0 --.-KB/s " ] }, { @@ -4564,7 +4583,7 @@ "output_type": "stream", "text": [ "\r", - "-ctx-8k.pth 14%[=> ] 823.97M 43.5MB/s eta 1m 53s " + " v5-L6-D409 0%[ ] 14.45M 72.2MB/s " ] }, { @@ -4572,7 +4591,7 @@ "output_type": "stream", "text": [ "\r", - "ctx-8k.pth 14%[=> ] 838.71M 42.0MB/s eta 1m 53s " + " v5-L6-D4096 0%[ ] 30.00M 69.8MB/s " ] }, { @@ -4580,7 +4599,7 @@ "output_type": "stream", "text": [ "\r", - "tx-8k.pth 14%[=> ] 841.85M 41.5MB/s eta 1m 53s " + " v5-L6-D4096- 1%[ ] 45.78M 62.5MB/s " ] }, { @@ -4588,7 +4607,7 @@ "output_type": "stream", "text": [ "\r", - "x-8k.pth 14%[=> ] 854.49M 40.3MB/s eta 1m 52s " + " v5-L6-D4096-E 1%[ ] 63.10M 66.9MB/s " ] }, { @@ -4596,7 +4615,7 @@ "output_type": "stream", "text": [ "\r", - "-8k.pth 14%[=> ] 857.55M 37.3MB/s eta 1m 52s " + " v5-L6-D4096-E0 2%[ ] 76.29M 62.0MB/s " ] }, { @@ -4604,7 +4623,7 @@ "output_type": "stream", "text": [ "\r", - "8k.pth 15%[==> ] 869.75M 40.7MB/s eta 1m 52s " + " v5-L6-D4096-E0_ 2%[ ] 91.55M 61.2MB/s " ] }, { @@ -4612,7 +4631,7 @@ "output_type": "stream", "text": [ "\r", - "k.pth 15%[==> ] 879.33M 39.7MB/s eta 1m 52s " + " v5-L6-D4096-E0_1 3%[ ] 106.81M 61.9MB/s " ] }, { @@ -4620,7 +4639,7 @@ "output_type": "stream", "text": [ "\r", - ".pth 15%[==> ] 884.49M 40.9MB/s eta 1m 52s " + " v5-L6-D4096-E0_1- 3%[ ] 122.07M 61.9MB/s " ] }, { @@ -4628,7 +4647,7 @@ "output_type": "stream", "text": [ "\r", - "pth 15%[==> ] 889.88M 38.8MB/s eta 1m 52s " + " v5-L6-D4096-E0_1-m 4%[ ] 137.33M 61.2MB/s " ] }, { @@ -4636,7 +4655,7 @@ "output_type": "stream", "text": [ "\r", - "th 15%[==> ] 897.75M 39.9MB/s eta 1m 52s " + "v5-L6-D4096-E0_1-me 4%[ ] 152.59M 59.0MB/s " ] }, { @@ -4644,7 +4663,7 @@ "output_type": "stream", "text": [ "\r", - "h 15%[==> ] 915.53M 38.6MB/s eta 1m 52s " + "5-L6-D4096-E0_1-mem 5%[> ] 167.85M 59.2MB/s " ] }, { @@ -4652,7 +4671,7 @@ "output_type": "stream", "text": [ "\r", - " 16%[==> ] 930.78M 38.1MB/s eta 1m 52s " + "-L6-D4096-E0_1-mem- 5%[> ] 183.10M 59.3MB/s eta 52s " ] }, { @@ -4660,7 +4679,7 @@ "output_type": "stream", "text": [ "\r", - " E 16%[==> ] 941.84M 37.3MB/s eta 1m 52s " + "L6-D4096-E0_1-mem-c 6%[> ] 200.07M 60.9MB/s eta 52s " ] }, { @@ -4668,7 +4687,7 @@ "output_type": "stream", "text": [ "\r", - " EW 16%[==> ] 943.71M 37.1MB/s eta 1m 52s " + "6-D4096-E0_1-mem-ct 6%[> ] 213.62M 61.3MB/s eta 52s " ] }, { @@ -4676,7 +4695,7 @@ "output_type": "stream", "text": [ "\r", - " EWR 16%[==> ] 945.90M 34.5MB/s eta 1m 52s " + "-D4096-E0_1-mem-ctx 6%[> ] 228.36M 61.9MB/s eta 52s " ] }, { @@ -4684,7 +4703,7 @@ "output_type": "stream", "text": [ "\r", - " EWR- 16%[==> ] 957.54M 37.2MB/s eta 1m 52s " + "D4096-E0_1-mem-ctx- 7%[> ] 231.28M 58.9MB/s eta 52s " ] }, { @@ -4692,7 +4711,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1 16%[==> ] 961.30M 34.2MB/s eta 1m 52s " + "4096-E0_1-mem-ctx-8 7%[> ] 245.59M 59.4MB/s eta 51s " ] }, { @@ -4700,7 +4719,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B 16%[==> ] 976.55M 34.6MB/s eta 1m 53s " + "096-E0_1-mem-ctx-8k 7%[> ] 259.40M 59.2MB/s eta 51s " ] }, { @@ -4708,7 +4727,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5 17%[==> ] 991.82M 37.2MB/s eta 1m 53s " + "96-E0_1-mem-ctx-8k. 8%[> ] 274.66M 54.8MB/s eta 51s " ] }, { @@ -4716,7 +4735,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5- 17%[==> ] 1007M 37.8MB/s eta 1m 53s " + "6-E0_1-mem-ctx-8k.p 8%[> ] 289.92M 54.4MB/s eta 51s " ] }, { @@ -4724,7 +4743,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E 17%[==> ] 1007M 36.4MB/s eta 1m 53s " + "-E0_1-mem-ctx-8k.pt 9%[> ] 303.43M 56.3MB/s eta 52s " ] }, { @@ -4732,7 +4751,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0 17%[==> ] 1011M 34.6MB/s eta 1m 53s " + "E0_1-mem-ctx-8k.pth 9%[> ] 320.43M 56.5MB/s eta 52s " ] }, { @@ -4740,7 +4759,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_ 17%[==> ] 1022M 36.0MB/s eta 1m 52s " + "0_1-mem-ctx-8k.pth 10%[=> ] 335.69M 51.5MB/s eta 52s " ] }, { @@ -4748,7 +4767,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1 17%[==> ] 1.01G 36.2MB/s eta 1m 52s " + "_1-mem-ctx-8k.pth 10%[=> ] 350.95M 54.7MB/s eta 52s " ] }, { @@ -4756,7 +4775,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1- 18%[==> ] 1.03G 37.6MB/s eta 1m 52s " + "1-mem-ctx-8k.pth 11%[=> ] 373.65M 55.9MB/s eta 49s " ] }, { @@ -4764,7 +4783,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-m 18%[==> ] 1.03G 36.0MB/s eta 1m 52s " + "-mem-ctx-8k.pth 11%[=> ] 381.47M 55.3MB/s eta 49s " ] }, { @@ -4772,7 +4791,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-me 18%[==> ] 1.04G 36.9MB/s eta 1m 51s " + "mem-ctx-8k.pth 12%[=> ] 396.22M 54.8MB/s eta 49s " ] }, { @@ -4780,7 +4799,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem 18%[==> ] 1.06G 34.0MB/s eta 1m 51s " + "em-ctx-8k.pth 12%[=> ] 410.16M 53.9MB/s eta 49s " ] }, { @@ -4788,7 +4807,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem- 18%[==> ] 1.07G 36.7MB/s eta 1m 51s " + "m-ctx-8k.pth 13%[=> ] 426.73M 54.2MB/s eta 50s " ] }, { @@ -4796,7 +4815,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem-c 19%[==> ] 1.07G 34.1MB/s eta 1m 51s " + "-ctx-8k.pth 13%[=> ] 434.90M 52.6MB/s eta 50s " ] }, { @@ -4804,7 +4823,7 @@ "output_type": "stream", "text": [ "\r", - "EWR-1B5-E0_1-mem-ct 19%[==> ] 1.09G 36.6MB/s eta 1m 51s " + "ctx-8k.pth 13%[=> ] 442.51M 50.9MB/s eta 50s " ] }, { @@ -4812,7 +4831,7 @@ "output_type": "stream", "text": [ "\r", - "WR-1B5-E0_1-mem-ctx 19%[==> ] 1.10G 39.1MB/s eta 1m 51s " + "tx-8k.pth 13%[=> ] 457.76M 50.4MB/s eta 50s " ] }, { @@ -4820,7 +4839,7 @@ "output_type": "stream", "text": [ "\r", - "R-1B5-E0_1-mem-ctx- 19%[==> ] 1.11G 39.9MB/s eta 1m 51s " + "x-8k.pth 14%[=> ] 485.65M 56.9MB/s eta 48s " ] }, { @@ -4828,7 +4847,7 @@ "output_type": "stream", "text": [ "\r", - "-1B5-E0_1-mem-ctx-8 19%[==> ] 1.12G 40.3MB/s eta 1m 51s " + "-8k.pth 15%[==> ] 503.54M 57.4MB/s eta 48s " ] }, { @@ -4836,7 +4855,7 @@ "output_type": "stream", "text": [ "\r", - "1B5-E0_1-mem-ctx-8k 20%[===> ] 1.14G 41.6MB/s eta 1m 51s " + "8k.pth 15%[==> ] 518.80M 54.0MB/s eta 48s " ] }, { @@ -4844,7 +4863,7 @@ "output_type": "stream", "text": [ "\r", - "B5-E0_1-mem-ctx-8k. 20%[===> ] 1.15G 40.8MB/s eta 1m 48s " + "k.pth 16%[==> ] 533.54M 55.1MB/s eta 48s " ] }, { @@ -4852,7 +4871,7 @@ "output_type": "stream", "text": [ "\r", - "5-E0_1-mem-ctx-8k.p 20%[===> ] 1.16G 43.4MB/s eta 1m 48s " + ".pth 16%[==> ] 542.02M 54.1MB/s eta 48s " ] }, { @@ -4860,7 +4879,7 @@ "output_type": "stream", "text": [ "\r", - "-E0_1-mem-ctx-8k.pt 20%[===> ] 1.16G 40.8MB/s eta 1m 48s " + "pth 16%[==> ] 549.31M 54.7MB/s eta 48s " ] }, { @@ -4868,7 +4887,7 @@ "output_type": "stream", "text": [ "\r", - "E0_1-mem-ctx-8k.pth 20%[===> ] 1.18G 40.5MB/s eta 1m 48s " + "th 17%[==> ] 564.58M 52.2MB/s eta 48s " ] }, { @@ -4876,7 +4895,7 @@ "output_type": "stream", "text": [ "\r", - "0_1-mem-ctx-8k.pth 21%[===> ] 1.19G 45.1MB/s eta 1m 48s " + "h 17%[==> ] 573.01M 50.2MB/s eta 48s " ] }, { @@ -4884,7 +4903,7 @@ "output_type": "stream", "text": [ "\r", - "_1-mem-ctx-8k.pth 21%[===> ] 1.20G 44.9MB/s eta 1m 47s " + " 17%[==> ] 582.65M 51.6MB/s eta 48s " ] }, { @@ -4892,7 +4911,7 @@ "output_type": "stream", "text": [ "\r", - "1-mem-ctx-8k.pth 21%[===> ] 1.21G 43.8MB/s eta 1m 47s " + " v 18%[==> ] 595.09M 49.7MB/s eta 49s " ] }, { @@ -4900,7 +4919,7 @@ "output_type": "stream", "text": [ "\r", - "-mem-ctx-8k.pth 21%[===> ] 1.21G 42.0MB/s eta 1m 47s " + " v5 18%[==> ] 609.84M 52.8MB/s eta 49s " ] }, { @@ -4908,7 +4927,7 @@ "output_type": "stream", "text": [ "\r", - "mem-ctx-8k.pth 21%[===> ] 1.22G 42.6MB/s eta 1m 47s " + " v5- 18%[==> ] 612.47M 50.4MB/s eta 49s " ] }, { @@ -4916,7 +4935,7 @@ "output_type": "stream", "text": [ "\r", - "em-ctx-8k.pth 21%[===> ] 1.24G 41.8MB/s eta 1m 46s " + " v5-L 19%[==> ] 625.09M 47.8MB/s eta 49s " ] }, { @@ -4924,7 +4943,7 @@ "output_type": "stream", "text": [ "\r", - "m-ctx-8k.pth 22%[===> ] 1.25G 43.7MB/s eta 1m 46s " + " v5-L6 19%[==> ] 635.59M 49.6MB/s eta 49s " ] }, { @@ -4932,7 +4951,7 @@ "output_type": "stream", "text": [ "\r", - "-ctx-8k.pth 22%[===> ] 1.27G 47.1MB/s eta 1m 46s " + " v5-L6- 19%[==> ] 640.87M 47.2MB/s eta 49s " ] }, { @@ -4940,7 +4959,7 @@ "output_type": "stream", "text": [ "\r", - "ctx-8k.pth 22%[===> ] 1.27G 43.4MB/s eta 1m 46s " + " v5-L6-D 19%[==> ] 656.13M 48.2MB/s eta 49s " ] }, { @@ -4948,7 +4967,7 @@ "output_type": "stream", "text": [ "\r", - "tx-8k.pth 22%[===> ] 1.28G 46.2MB/s eta 1m 46s " + " v5-L6-D4 20%[===> ] 671.38M 44.8MB/s eta 49s " ] }, { @@ -4956,7 +4975,7 @@ "output_type": "stream", "text": [ "\r", - "x-8k.pth 22%[===> ] 1.29G 45.2MB/s eta 1m 45s " + " v5-L6-D40 20%[===> ] 686.64M 44.8MB/s eta 49s " ] }, { @@ -4964,7 +4983,7 @@ "output_type": "stream", "text": [ "\r", - "-8k.pth 22%[===> ] 1.30G 43.1MB/s eta 1m 45s " + " v5-L6-D409 21%[===> ] 706.19M 47.9MB/s eta 48s " ] }, { @@ -4972,7 +4991,7 @@ "output_type": "stream", "text": [ "\r", - "8k.pth 23%[===> ] 1.31G 41.9MB/s eta 1m 45s " + " v5-L6-D4096 21%[===> ] 717.16M 47.2MB/s eta 48s " ] }, { @@ -4980,7 +4999,7 @@ "output_type": "stream", "text": [ "\r", - "k.pth 23%[===> ] 1.31G 39.3MB/s eta 1m 45s " + " v5-L6-D4096- 22%[===> ] 732.42M 46.3MB/s eta 48s " ] }, { @@ -4988,7 +5007,7 @@ "output_type": "stream", "text": [ "\r", - ".pth 23%[===> ] 1.33G 39.3MB/s eta 1m 45s " + " v5-L6-D4096-E 22%[===> ] 745.86M 46.4MB/s eta 48s " ] }, { @@ -4996,7 +5015,7 @@ "output_type": "stream", "text": [ "\r", - "pth 23%[===> ] 1.34G 39.3MB/s eta 1m 45s " + " v5-L6-D4096-E0 23%[===> ] 759.61M 48.3MB/s eta 47s " ] }, { @@ -5004,7 +5023,7 @@ "output_type": "stream", "text": [ "\r", - "th 24%[===> ] 1.36G 40.4MB/s eta 1m 45s " + " v5-L6-D4096-E0_ 23%[===> ] 767.09M 48.3MB/s eta 47s " ] }, { @@ -5012,7 +5031,7 @@ "output_type": "stream", "text": [ "\r", - "h 24%[===> ] 1.37G 42.9MB/s eta 1m 45s " + " v5-L6-D4096-E0_1 23%[===> ] 778.20M 48.2MB/s eta 47s " ] }, { @@ -5020,7 +5039,7 @@ "output_type": "stream", "text": [ "\r", - " 24%[===> ] 1.38G 42.9MB/s eta 1m 42s " + " v5-L6-D4096-E0_1- 24%[===> ] 793.46M 49.1MB/s eta 47s " ] }, { @@ -5028,7 +5047,7 @@ "output_type": "stream", "text": [ "\r", - " E 24%[===> ] 1.39G 44.0MB/s eta 1m 42s " + " v5-L6-D4096-E0_1-m 24%[===> ] 808.71M 49.6MB/s eta 46s " ] }, { @@ -5036,7 +5055,7 @@ "output_type": "stream", "text": [ "\r", - " EW 24%[===> ] 1.40G 42.5MB/s eta 1m 42s " + "v5-L6-D4096-E0_1-me 25%[====> ] 823.46M 51.8MB/s eta 46s " ] }, { @@ -5044,7 +5063,7 @@ "output_type": "stream", "text": [ "\r", - " EWR 25%[====> ] 1.42G 45.6MB/s eta 1m 42s " + "5-L6-D4096-E0_1-mem 25%[====> ] 839.23M 53.6MB/s eta 46s " ] }, { @@ -5052,7 +5071,7 @@ "output_type": "stream", "text": [ "\r", - " EWR- 25%[====> ] 1.43G 45.6MB/s eta 1m 42s " + "-L6-D4096-E0_1-mem- 26%[====> ] 854.49M 52.4MB/s eta 46s " ] }, { @@ -5060,7 +5079,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1 25%[====> ] 1.44G 43.5MB/s eta 1m 41s " + "L6-D4096-E0_1-mem-c 26%[====> ] 874.75M 54.5MB/s eta 45s " ] }, { @@ -5068,7 +5087,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B 25%[====> ] 1.45G 44.9MB/s eta 1m 41s " + "6-D4096-E0_1-mem-ct 27%[====> ] 888.17M 57.6MB/s eta 45s " ] }, { @@ -5076,7 +5095,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5 25%[====> ] 1.46G 44.4MB/s eta 1m 41s " + "-D4096-E0_1-mem-ctx 27%[====> ] 900.27M 56.0MB/s eta 45s " ] }, { @@ -5084,7 +5103,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5- 25%[====> ] 1.46G 43.8MB/s eta 1m 41s " + "D4096-E0_1-mem-ctx- 27%[====> ] 915.53M 56.1MB/s eta 45s " ] }, { @@ -5092,7 +5111,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E 26%[====> ] 1.47G 43.9MB/s eta 1m 41s " + "4096-E0_1-mem-ctx-8 28%[====> ] 930.78M 55.9MB/s eta 45s " ] }, { @@ -5100,7 +5119,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0 26%[====> ] 1.48G 44.1MB/s eta 1m 40s " + "096-E0_1-mem-ctx-8k 28%[====> ] 946.04M 55.5MB/s eta 43s " ] }, { @@ -5108,7 +5127,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_ 26%[====> ] 1.49G 43.7MB/s eta 1m 40s " + "96-E0_1-mem-ctx-8k. 29%[====> ] 963.36M 57.9MB/s eta 43s " ] }, { @@ -5116,7 +5135,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1 26%[====> ] 1.50G 44.9MB/s eta 1m 40s " + "6-E0_1-mem-ctx-8k.p 29%[====> ] 967.61M 56.2MB/s eta 43s " ] }, { @@ -5124,7 +5143,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1- 26%[====> ] 1.52G 42.6MB/s eta 99s " + "-E0_1-mem-ctx-8k.pt 29%[====> ] 976.05M 56.5MB/s eta 43s " ] }, { @@ -5132,7 +5151,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-m 27%[====> ] 1.53G 45.9MB/s eta 99s " + "E0_1-mem-ctx-8k.pth 30%[=====> ] 988.87M 56.9MB/s eta 43s " ] }, { @@ -5140,7 +5159,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-me 27%[====> ] 1.55G 45.0MB/s eta 99s " + "0_1-mem-ctx-8k.pth 30%[=====> ] 1002M 56.3MB/s eta 42s " ] }, { @@ -5148,7 +5167,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem 27%[====> ] 1.55G 44.0MB/s eta 99s " + "_1-mem-ctx-8k.pth 30%[=====> ] 1007M 55.5MB/s eta 42s " ] }, { @@ -5156,7 +5175,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem- 27%[====> ] 1.56G 43.3MB/s eta 98s " + "1-mem-ctx-8k.pth 31%[=====> ] 1.00G 54.9MB/s eta 42s " ] }, { @@ -5164,7 +5183,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem-c 27%[====> ] 1.57G 42.3MB/s eta 98s " + "-mem-ctx-8k.pth 31%[=====> ] 1.01G 55.9MB/s eta 42s " ] }, { @@ -5172,7 +5191,7 @@ "output_type": "stream", "text": [ "\r", - "EWR-1B5-E0_1-mem-ct 27%[====> ] 1.58G 42.6MB/s eta 98s " + "mem-ctx-8k.pth 32%[=====> ] 1.03G 55.6MB/s eta 41s " ] }, { @@ -5180,7 +5199,7 @@ "output_type": "stream", "text": [ "\r", - "WR-1B5-E0_1-mem-ctx 28%[====> ] 1.59G 43.4MB/s eta 98s " + "em-ctx-8k.pth 32%[=====> ] 1.04G 55.3MB/s eta 41s " ] }, { @@ -5188,7 +5207,7 @@ "output_type": "stream", "text": [ "\r", - "R-1B5-E0_1-mem-ctx- 28%[====> ] 1.59G 40.2MB/s eta 98s " + "m-ctx-8k.pth 32%[=====> ] 1.04G 50.9MB/s eta 41s " ] }, { @@ -5196,7 +5215,7 @@ "output_type": "stream", "text": [ "\r", - "-1B5-E0_1-mem-ctx-8 28%[====> ] 1.61G 39.3MB/s eta 97s " + "-ctx-8k.pth 32%[=====> ] 1.06G 50.5MB/s eta 41s " ] }, { @@ -5204,7 +5223,7 @@ "output_type": "stream", "text": [ "\r", - "1B5-E0_1-mem-ctx-8k 28%[====> ] 1.61G 39.9MB/s eta 97s " + "ctx-8k.pth 33%[=====> ] 1.07G 50.0MB/s eta 41s " ] }, { @@ -5212,7 +5231,7 @@ "output_type": "stream", "text": [ "\r", - "B5-E0_1-mem-ctx-8k. 28%[====> ] 1.63G 38.4MB/s eta 97s " + "tx-8k.pth 33%[=====> ] 1.08G 47.6MB/s eta 41s " ] }, { @@ -5220,7 +5239,7 @@ "output_type": "stream", "text": [ "\r", - "5-E0_1-mem-ctx-8k.p 28%[====> ] 1.63G 40.2MB/s eta 97s " + "x-8k.pth 33%[=====> ] 1.09G 47.3MB/s eta 41s " ] }, { @@ -5228,7 +5247,7 @@ "output_type": "stream", "text": [ "\r", - "-E0_1-mem-ctx-8k.pt 29%[====> ] 1.64G 38.5MB/s eta 97s " + "-8k.pth 34%[=====> ] 1.10G 46.2MB/s eta 41s " ] }, { @@ -5236,7 +5255,7 @@ "output_type": "stream", "text": [ "\r", - "E0_1-mem-ctx-8k.pth 29%[====> ] 1.65G 38.1MB/s eta 97s " + "8k.pth 34%[=====> ] 1.12G 46.2MB/s eta 41s " ] }, { @@ -5244,7 +5263,7 @@ "output_type": "stream", "text": [ "\r", - "0_1-mem-ctx-8k.pth 29%[====> ] 1.67G 38.2MB/s eta 97s " + "k.pth 35%[======> ] 1.13G 47.4MB/s eta 40s " ] }, { @@ -5252,7 +5271,7 @@ "output_type": "stream", "text": [ "\r", - "_1-mem-ctx-8k.pth 29%[====> ] 1.68G 41.0MB/s eta 97s " + ".pth 35%[======> ] 1.15G 50.8MB/s eta 40s " ] }, { @@ -5260,7 +5279,7 @@ "output_type": "stream", "text": [ "\r", - "1-mem-ctx-8k.pth 29%[====> ] 1.68G 39.2MB/s eta 96s " + "pth 36%[======> ] 1.16G 52.5MB/s eta 40s " ] }, { @@ -5268,7 +5287,7 @@ "output_type": "stream", "text": [ "\r", - "-mem-ctx-8k.pth 30%[=====> ] 1.70G 37.8MB/s eta 96s " + "th 36%[======> ] 1.16G 49.3MB/s eta 40s " ] }, { @@ -5276,7 +5295,7 @@ "output_type": "stream", "text": [ "\r", - "mem-ctx-8k.pth 30%[=====> ] 1.72G 43.1MB/s eta 96s " + "h 36%[======> ] 1.18G 49.9MB/s eta 40s " ] }, { @@ -5284,7 +5303,7 @@ "output_type": "stream", "text": [ "\r", - "em-ctx-8k.pth 30%[=====> ] 1.73G 40.9MB/s eta 96s " + " 37%[======> ] 1.19G 48.9MB/s eta 39s " ] }, { @@ -5292,7 +5311,7 @@ "output_type": "stream", "text": [ "\r", - "m-ctx-8k.pth 30%[=====> ] 1.74G 43.3MB/s eta 94s " + " v 37%[======> ] 1.21G 49.5MB/s eta 39s " ] }, { @@ -5300,7 +5319,7 @@ "output_type": "stream", "text": [ "\r", - "-ctx-8k.pth 31%[=====> ] 1.76G 44.5MB/s eta 94s " + " v5 37%[======> ] 1.21G 46.1MB/s eta 39s " ] }, { @@ -5308,7 +5327,7 @@ "output_type": "stream", "text": [ "\r", - "ctx-8k.pth 31%[=====> ] 1.77G 43.4MB/s eta 94s " + " v5- 38%[======> ] 1.23G 50.5MB/s eta 39s " ] }, { @@ -5316,7 +5335,7 @@ "output_type": "stream", "text": [ "\r", - "tx-8k.pth 31%[=====> ] 1.79G 43.4MB/s eta 93s " + " v5-L 38%[======> ] 1.24G 49.0MB/s eta 39s " ] }, { @@ -5324,7 +5343,7 @@ "output_type": "stream", "text": [ "\r", - "x-8k.pth 31%[=====> ] 1.80G 45.5MB/s eta 93s " + " v5-L6 39%[======> ] 1.25G 50.9MB/s eta 38s " ] }, { @@ -5332,7 +5351,7 @@ "output_type": "stream", "text": [ "\r", - "-8k.pth 31%[=====> ] 1.80G 43.8MB/s eta 93s " + " v5-L6- 39%[======> ] 1.26G 52.1MB/s eta 38s " ] }, { @@ -5340,7 +5359,7 @@ "output_type": "stream", "text": [ "\r", - "8k.pth 32%[=====> ] 1.82G 44.6MB/s eta 93s " + " v5-L6-D 39%[======> ] 1.27G 49.5MB/s eta 38s " ] }, { @@ -5348,7 +5367,7 @@ "output_type": "stream", "text": [ "\r", - "k.pth 32%[=====> ] 1.82G 42.7MB/s eta 93s " + " v5-L6-D4 39%[======> ] 1.28G 50.0MB/s eta 38s " ] }, { @@ -5356,7 +5375,7 @@ "output_type": "stream", "text": [ "\r", - ".pth 32%[=====> ] 1.83G 42.1MB/s eta 93s " + " v5-L6-D40 40%[=======> ] 1.29G 50.0MB/s eta 37s " ] }, { @@ -5364,7 +5383,7 @@ "output_type": "stream", "text": [ "\r", - "pth 32%[=====> ] 1.84G 44.6MB/s eta 93s " + " v5-L6-D409 40%[=======> ] 1.31G 48.3MB/s eta 37s " ] }, { @@ -5372,7 +5391,7 @@ "output_type": "stream", "text": [ "\r", - "th 32%[=====> ] 1.85G 41.3MB/s eta 93s " + " v5-L6-D4096 41%[=======> ] 1.32G 47.8MB/s eta 37s " ] }, { @@ -5380,7 +5399,7 @@ "output_type": "stream", "text": [ "\r", - "h 32%[=====> ] 1.86G 40.6MB/s eta 91s " + " v5-L6-D4096- 41%[=======> ] 1.33G 45.3MB/s eta 37s " ] }, { @@ -5388,7 +5407,7 @@ "output_type": "stream", "text": [ "\r", - " 33%[=====> ] 1.87G 43.2MB/s eta 91s " + " v5-L6-D4096-E 41%[=======> ] 1.34G 46.9MB/s eta 36s " ] }, { @@ -5396,7 +5415,7 @@ "output_type": "stream", "text": [ "\r", - " E 33%[=====> ] 1.88G 39.2MB/s eta 91s " + " v5-L6-D4096-E0 42%[=======> ] 1.36G 47.6MB/s eta 36s " ] }, { @@ -5404,7 +5423,7 @@ "output_type": "stream", "text": [ "\r", - " EW 33%[=====> ] 1.88G 37.0MB/s eta 91s " + " v5-L6-D4096-E0_ 42%[=======> ] 1.37G 51.0MB/s eta 36s " ] }, { @@ -5412,7 +5431,7 @@ "output_type": "stream", "text": [ "\r", - " EWR 33%[=====> ] 1.89G 35.3MB/s eta 91s " + " v5-L6-D4096-E0_1 43%[=======> ] 1.38G 49.1MB/s eta 36s " ] }, { @@ -5420,7 +5439,7 @@ "output_type": "stream", "text": [ "\r", - " EWR- 33%[=====> ] 1.91G 37.0MB/s eta 91s " + " v5-L6-D4096-E0_1- 43%[=======> ] 1.39G 45.8MB/s eta 36s " ] }, { @@ -5428,7 +5447,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1 33%[=====> ] 1.92G 35.6MB/s eta 91s " + " v5-L6-D4096-E0_1-m 43%[=======> ] 1.40G 46.1MB/s eta 35s " ] }, { @@ -5436,7 +5455,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B 34%[=====> ] 1.92G 36.1MB/s eta 91s " + "v5-L6-D4096-E0_1-me 44%[=======> ] 1.42G 48.0MB/s eta 35s " ] }, { @@ -5444,7 +5463,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5 34%[=====> ] 1.94G 37.9MB/s eta 91s " + "5-L6-D4096-E0_1-mem 44%[=======> ] 1.43G 47.6MB/s eta 35s " ] }, { @@ -5452,7 +5471,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5- 34%[=====> ] 1.95G 39.7MB/s eta 89s " + "-L6-D4096-E0_1-mem- 45%[========> ] 1.45G 48.4MB/s eta 35s " ] }, { @@ -5460,7 +5479,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E 34%[=====> ] 1.97G 41.9MB/s eta 89s " + "L6-D4096-E0_1-mem-c 45%[========> ] 1.46G 50.4MB/s eta 35s " ] }, { @@ -5468,7 +5487,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0 35%[======> ] 1.98G 42.5MB/s eta 89s " + "6-D4096-E0_1-mem-ct 45%[========> ] 1.46G 47.4MB/s eta 34s " ] }, { @@ -5476,7 +5495,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_ 35%[======> ] 2.00G 43.7MB/s eta 89s " + "-D4096-E0_1-mem-ctx 46%[========> ] 1.47G 49.5MB/s eta 34s " ] }, { @@ -5484,7 +5503,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1 35%[======> ] 2.00G 43.1MB/s eta 88s " + "D4096-E0_1-mem-ctx- 46%[========> ] 1.49G 51.1MB/s eta 34s " ] }, { @@ -5492,7 +5511,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1- 35%[======> ] 2.01G 41.4MB/s eta 88s " + "4096-E0_1-mem-ctx-8 46%[========> ] 1.50G 51.9MB/s eta 34s " ] }, { @@ -5500,7 +5519,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-m 35%[======> ] 2.03G 44.7MB/s eta 88s " + "096-E0_1-mem-ctx-8k 47%[========> ] 1.52G 53.6MB/s eta 33s " ] }, { @@ -5508,7 +5527,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-me 36%[======> ] 2.04G 44.7MB/s eta 88s " + "96-E0_1-mem-ctx-8k. 47%[========> ] 1.53G 52.3MB/s eta 33s " ] }, { @@ -5516,7 +5535,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem 36%[======> ] 2.05G 46.8MB/s eta 86s " + "6-E0_1-mem-ctx-8k.p 48%[========> ] 1.55G 50.6MB/s eta 33s " ] }, { @@ -5524,7 +5543,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem- 36%[======> ] 2.06G 48.3MB/s eta 86s " + "-E0_1-mem-ctx-8k.pt 48%[========> ] 1.55G 50.5MB/s eta 33s " ] }, { @@ -5532,7 +5551,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem-c 36%[======> ] 2.07G 49.5MB/s eta 86s " + "E0_1-mem-ctx-8k.pth 48%[========> ] 1.56G 50.3MB/s eta 32s " ] }, { @@ -5540,7 +5559,7 @@ "output_type": "stream", "text": [ "\r", - "EWR-1B5-E0_1-mem-ct 36%[======> ] 2.08G 49.0MB/s eta 86s " + "0_1-mem-ctx-8k.pth 49%[========> ] 1.58G 53.0MB/s eta 32s " ] }, { @@ -5548,7 +5567,7 @@ "output_type": "stream", "text": [ "\r", - "WR-1B5-E0_1-mem-ctx 37%[======> ] 2.10G 52.4MB/s eta 86s " + "_1-mem-ctx-8k.pth 49%[========> ] 1.59G 53.6MB/s eta 32s " ] }, { @@ -5556,7 +5575,7 @@ "output_type": "stream", "text": [ "\r", - "R-1B5-E0_1-mem-ctx- 37%[======> ] 2.10G 48.9MB/s eta 85s " + "1-mem-ctx-8k.pth 50%[=========> ] 1.61G 54.7MB/s eta 32s " ] }, { @@ -5564,7 +5583,7 @@ "output_type": "stream", "text": [ "\r", - "-1B5-E0_1-mem-ctx-8 37%[======> ] 2.12G 46.7MB/s eta 85s " + "-mem-ctx-8k.pth 50%[=========> ] 1.62G 51.3MB/s eta 31s " ] }, { @@ -5572,7 +5591,7 @@ "output_type": "stream", "text": [ "\r", - "1B5-E0_1-mem-ctx-8k 37%[======> ] 2.13G 46.7MB/s eta 85s " + "mem-ctx-8k.pth 51%[=========> ] 1.64G 52.6MB/s eta 31s " ] }, { @@ -5580,7 +5599,7 @@ "output_type": "stream", "text": [ "\r", - "B5-E0_1-mem-ctx-8k. 38%[======> ] 2.15G 45.1MB/s eta 84s " + "em-ctx-8k.pth 51%[=========> ] 1.66G 55.2MB/s eta 31s " ] }, { @@ -5588,7 +5607,7 @@ "output_type": "stream", "text": [ "\r", - "5-E0_1-mem-ctx-8k.p 38%[======> ] 2.16G 43.6MB/s eta 84s " + "m-ctx-8k.pth 52%[=========> ] 1.67G 54.2MB/s eta 31s " ] }, { @@ -5596,7 +5615,7 @@ "output_type": "stream", "text": [ "\r", - "-E0_1-mem-ctx-8k.pt 38%[======> ] 2.17G 44.2MB/s eta 84s " + "-ctx-8k.pth 52%[=========> ] 1.68G 54.9MB/s eta 30s " ] }, { @@ -5604,7 +5623,7 @@ "output_type": "stream", "text": [ "\r", - "E0_1-mem-ctx-8k.pth 38%[======> ] 2.17G 42.6MB/s eta 84s " + "ctx-8k.pth 52%[=========> ] 1.70G 52.2MB/s eta 30s " ] }, { @@ -5612,7 +5631,7 @@ "output_type": "stream", "text": [ "\r", - "0_1-mem-ctx-8k.pth 38%[======> ] 2.19G 44.6MB/s eta 83s " + "tx-8k.pth 53%[=========> ] 1.71G 53.8MB/s eta 30s " ] }, { @@ -5620,7 +5639,7 @@ "output_type": "stream", "text": [ "\r", - "_1-mem-ctx-8k.pth 39%[======> ] 2.20G 43.8MB/s eta 83s " + "x-8k.pth 53%[=========> ] 1.71G 50.7MB/s eta 30s " ] }, { @@ -5628,7 +5647,7 @@ "output_type": "stream", "text": [ "\r", - "1-mem-ctx-8k.pth 39%[======> ] 2.22G 44.4MB/s eta 83s " + "-8k.pth 53%[=========> ] 1.73G 51.9MB/s eta 29s " ] }, { @@ -5636,7 +5655,7 @@ "output_type": "stream", "text": [ "\r", - "-mem-ctx-8k.pth 39%[======> ] 2.23G 47.0MB/s eta 83s " + "8k.pth 54%[=========> ] 1.74G 51.9MB/s eta 29s " ] }, { @@ -5644,7 +5663,7 @@ "output_type": "stream", "text": [ "\r", - "mem-ctx-8k.pth 39%[======> ] 2.25G 46.2MB/s eta 81s " + "k.pth 54%[=========> ] 1.76G 54.8MB/s eta 29s " ] }, { @@ -5652,7 +5671,7 @@ "output_type": "stream", "text": [ "\r", - "em-ctx-8k.pth 39%[======> ] 2.25G 44.5MB/s eta 81s " + ".pth 55%[==========> ] 1.77G 55.4MB/s eta 29s " ] }, { @@ -5660,7 +5679,7 @@ "output_type": "stream", "text": [ "\r", - "m-ctx-8k.pth 40%[=======> ] 2.26G 45.0MB/s eta 81s " + "pth 55%[==========> ] 1.79G 55.1MB/s eta 29s " ] }, { @@ -5668,7 +5687,7 @@ "output_type": "stream", "text": [ "\r", - "-ctx-8k.pth 40%[=======> ] 2.28G 44.9MB/s eta 81s " + "th 56%[==========> ] 1.80G 55.7MB/s eta 27s " ] }, { @@ -5676,7 +5695,7 @@ "output_type": "stream", "text": [ "\r", - "ctx-8k.pth 40%[=======> ] 2.29G 43.2MB/s eta 80s " + "h 56%[==========> ] 1.82G 57.3MB/s eta 27s " ] }, { @@ -5684,7 +5703,7 @@ "output_type": "stream", "text": [ "\r", - "tx-8k.pth 40%[=======> ] 2.31G 47.7MB/s eta 80s " + " 56%[==========> ] 1.82G 53.5MB/s eta 27s " ] }, { @@ -5692,7 +5711,7 @@ "output_type": "stream", "text": [ "\r", - "x-8k.pth 40%[=======> ] 2.31G 43.4MB/s eta 80s " + " v 57%[==========> ] 1.83G 52.6MB/s eta 27s " ] }, { @@ -5700,7 +5719,7 @@ "output_type": "stream", "text": [ "\r", - "-8k.pth 41%[=======> ] 2.32G 46.1MB/s eta 80s " + " v5 57%[==========> ] 1.85G 55.3MB/s eta 27s " ] }, { @@ -5708,7 +5727,7 @@ "output_type": "stream", "text": [ "\r", - "8k.pth 41%[=======> ] 2.33G 46.9MB/s eta 80s " + " v5- 58%[==========> ] 1.86G 54.3MB/s eta 26s " ] }, { @@ -5716,7 +5735,7 @@ "output_type": "stream", "text": [ "\r", - "k.pth 41%[=======> ] 2.34G 46.2MB/s eta 79s " + " v5-L 58%[==========> ] 1.86G 50.9MB/s eta 26s " ] }, { @@ -5724,7 +5743,7 @@ "output_type": "stream", "text": [ "\r", - ".pth 41%[=======> ] 2.35G 46.5MB/s eta 79s " + " v5-L6 58%[==========> ] 1.88G 50.6MB/s eta 26s " ] }, { @@ -5732,7 +5751,7 @@ "output_type": "stream", "text": [ "\r", - "pth 41%[=======> ] 2.37G 46.2MB/s eta 79s " + " v5-L6- 59%[==========> ] 1.89G 51.7MB/s eta 26s " ] }, { @@ -5740,7 +5759,7 @@ "output_type": "stream", "text": [ "\r", - "th 42%[=======> ] 2.38G 46.2MB/s eta 79s " + " v5-L6-D 59%[==========> ] 1.91G 51.6MB/s eta 25s " ] }, { @@ -5748,7 +5767,7 @@ "output_type": "stream", "text": [ "\r", - "h 42%[=======> ] 2.38G 43.9MB/s eta 78s " + " v5-L6-D4 59%[==========> ] 1.92G 50.9MB/s eta 25s " ] }, { @@ -5756,7 +5775,7 @@ "output_type": "stream", "text": [ "\r", - " 42%[=======> ] 2.40G 42.8MB/s eta 78s " + " v5-L6-D40 60%[===========> ] 1.93G 51.7MB/s eta 25s " ] }, { @@ -5764,7 +5783,7 @@ "output_type": "stream", "text": [ "\r", - " E 42%[=======> ] 2.41G 42.4MB/s eta 78s " + " v5-L6-D409 60%[===========> ] 1.94G 50.8MB/s eta 25s " ] }, { @@ -5772,7 +5791,7 @@ "output_type": "stream", "text": [ "\r", - " EW 42%[=======> ] 2.41G 41.4MB/s eta 78s " + " v5-L6-D4096 60%[===========> ] 1.95G 52.2MB/s eta 25s " ] }, { @@ -5780,7 +5799,7 @@ "output_type": "stream", "text": [ "\r", - " EWR 42%[=======> ] 2.41G 40.8MB/s eta 78s " + " v5-L6-D4096- 61%[===========> ] 1.97G 51.5MB/s eta 25s " ] }, { @@ -5788,7 +5807,7 @@ "output_type": "stream", "text": [ "\r", - " EWR- 42%[=======> ] 2.42G 38.1MB/s eta 77s " + " v5-L6-D4096-E 61%[===========> ] 1.98G 50.4MB/s eta 25s " ] }, { @@ -5796,7 +5815,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1 43%[=======> ] 2.43G 37.2MB/s eta 77s " + " v5-L6-D4096-E0 62%[===========> ] 2.00G 49.6MB/s eta 25s " ] }, { @@ -5804,7 +5823,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B 43%[=======> ] 2.44G 36.3MB/s eta 77s " + " v5-L6-D4096-E0_ 62%[===========> ] 2.01G 49.4MB/s eta 23s " ] }, { @@ -5812,7 +5831,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5 43%[=======> ] 2.45G 37.6MB/s eta 77s " + " v5-L6-D4096-E0_1 63%[===========> ] 2.03G 48.8MB/s eta 23s " ] }, { @@ -5820,7 +5839,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5- 43%[=======> ] 2.46G 36.6MB/s eta 77s " + " v5-L6-D4096-E0_1- 63%[===========> ] 2.04G 51.1MB/s eta 23s " ] }, { @@ -5828,7 +5847,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E 43%[=======> ] 2.47G 37.1MB/s eta 76s " + " v5-L6-D4096-E0_1-m 63%[===========> ] 2.05G 50.6MB/s eta 23s " ] }, { @@ -5836,7 +5855,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0 44%[=======> ] 2.49G 39.2MB/s eta 76s " + "v5-L6-D4096-E0_1-me 64%[===========> ] 2.06G 50.5MB/s eta 23s " ] }, { @@ -5844,7 +5863,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_ 44%[=======> ] 2.50G 37.7MB/s eta 76s " + "5-L6-D4096-E0_1-mem 64%[===========> ] 2.07G 51.2MB/s eta 22s " ] }, { @@ -5852,7 +5871,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1 44%[=======> ] 2.52G 37.0MB/s eta 76s " + "-L6-D4096-E0_1-mem- 64%[===========> ] 2.08G 51.2MB/s eta 22s " ] }, { @@ -5860,7 +5879,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1- 44%[=======> ] 2.52G 37.7MB/s eta 75s " + "L6-D4096-E0_1-mem-c 65%[============> ] 2.09G 48.9MB/s eta 22s " ] }, { @@ -5868,7 +5887,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-m 44%[=======> ] 2.53G 39.3MB/s eta 75s " + "6-D4096-E0_1-mem-ct 65%[============> ] 2.10G 48.0MB/s eta 22s " ] }, { @@ -5876,7 +5895,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-me 44%[=======> ] 2.54G 38.0MB/s eta 75s " + "-D4096-E0_1-mem-ctx 66%[============> ] 2.12G 50.3MB/s eta 22s " ] }, { @@ -5884,7 +5903,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem 45%[========> ] 2.55G 34.9MB/s eta 75s " + "D4096-E0_1-mem-ctx- 66%[============> ] 2.13G 50.1MB/s eta 21s " ] }, { @@ -5892,7 +5911,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem- 45%[========> ] 2.55G 33.6MB/s eta 75s " + "4096-E0_1-mem-ctx-8 66%[============> ] 2.14G 50.9MB/s eta 21s " ] }, { @@ -5900,7 +5919,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem-c 45%[========> ] 2.56G 34.4MB/s eta 75s " + "096-E0_1-mem-ctx-8k 67%[============> ] 2.16G 52.8MB/s eta 21s " ] }, { @@ -5908,7 +5927,7 @@ "output_type": "stream", "text": [ "\r", - "EWR-1B5-E0_1-mem-ct 45%[========> ] 2.58G 35.9MB/s eta 75s " + "96-E0_1-mem-ctx-8k. 67%[============> ] 2.17G 54.8MB/s eta 21s " ] }, { @@ -5916,7 +5935,7 @@ "output_type": "stream", "text": [ "\r", - "WR-1B5-E0_1-mem-ctx 45%[========> ] 2.59G 37.2MB/s eta 75s " + "6-E0_1-mem-ctx-8k.p 67%[============> ] 2.17G 52.1MB/s eta 21s " ] }, { @@ -5924,7 +5943,7 @@ "output_type": "stream", "text": [ "\r", - "R-1B5-E0_1-mem-ctx- 46%[========> ] 2.61G 39.4MB/s eta 75s " + "-E0_1-mem-ctx-8k.pt 68%[============> ] 2.19G 52.9MB/s eta 20s " ] }, { @@ -5932,7 +5951,7 @@ "output_type": "stream", "text": [ "\r", - "-1B5-E0_1-mem-ctx-8 46%[========> ] 2.62G 39.3MB/s eta 75s " + "E0_1-mem-ctx-8k.pth 68%[============> ] 2.19G 49.6MB/s eta 20s " ] }, { @@ -5940,7 +5959,7 @@ "output_type": "stream", "text": [ "\r", - "1B5-E0_1-mem-ctx-8k 46%[========> ] 2.64G 40.0MB/s eta 75s " + "0_1-mem-ctx-8k.pth 68%[============> ] 2.20G 51.2MB/s eta 20s " ] }, { @@ -5948,7 +5967,7 @@ "output_type": "stream", "text": [ "\r", - "B5-E0_1-mem-ctx-8k. 46%[========> ] 2.64G 38.5MB/s eta 73s " + "_1-mem-ctx-8k.pth 69%[============> ] 2.21G 49.2MB/s eta 20s " ] }, { @@ -5956,7 +5975,7 @@ "output_type": "stream", "text": [ "\r", - "5-E0_1-mem-ctx-8k.p 46%[========> ] 2.65G 40.5MB/s eta 73s " + "1-mem-ctx-8k.pth 69%[============> ] 2.22G 47.1MB/s eta 20s " ] }, { @@ -5964,7 +5983,7 @@ "output_type": "stream", "text": [ "\r", - "-E0_1-mem-ctx-8k.pt 47%[========> ] 2.67G 40.0MB/s eta 73s " + "-mem-ctx-8k.pth 69%[============> ] 2.23G 49.6MB/s eta 19s " ] }, { @@ -5972,7 +5991,7 @@ "output_type": "stream", "text": [ "\r", - "E0_1-mem-ctx-8k.pth 47%[========> ] 2.68G 41.5MB/s eta 73s " + "mem-ctx-8k.pth 70%[=============> ] 2.25G 49.0MB/s eta 19s " ] }, { @@ -5980,7 +5999,7 @@ "output_type": "stream", "text": [ "\r", - "0_1-mem-ctx-8k.pth 47%[========> ] 2.69G 41.1MB/s eta 73s " + "em-ctx-8k.pth 70%[=============> ] 2.26G 48.8MB/s eta 19s " ] }, { @@ -5988,7 +6007,7 @@ "output_type": "stream", "text": [ "\r", - "_1-mem-ctx-8k.pth 47%[========> ] 2.70G 38.8MB/s eta 71s " + "m-ctx-8k.pth 71%[=============> ] 2.28G 49.2MB/s eta 19s " ] }, { @@ -5996,7 +6015,7 @@ "output_type": "stream", "text": [ "\r", - "1-mem-ctx-8k.pth 47%[========> ] 2.71G 41.2MB/s eta 71s " + "-ctx-8k.pth 71%[=============> ] 2.29G 52.0MB/s eta 18s " ] }, { @@ -6004,7 +6023,7 @@ "output_type": "stream", "text": [ "\r", - "-mem-ctx-8k.pth 48%[========> ] 2.71G 42.5MB/s eta 71s " + "ctx-8k.pth 72%[=============> ] 2.31G 51.0MB/s eta 18s " ] }, { @@ -6012,7 +6031,7 @@ "output_type": "stream", "text": [ "\r", - "mem-ctx-8k.pth 48%[========> ] 2.72G 45.5MB/s eta 71s " + "tx-8k.pth 72%[=============> ] 2.32G 51.4MB/s eta 18s " ] }, { @@ -6020,7 +6039,7 @@ "output_type": "stream", "text": [ "\r", - "em-ctx-8k.pth 48%[========> ] 2.73G 42.6MB/s eta 71s " + "x-8k.pth 72%[=============> ] 2.34G 50.6MB/s eta 18s " ] }, { @@ -6028,7 +6047,7 @@ "output_type": "stream", "text": [ "\r", - "m-ctx-8k.pth 48%[========> ] 2.74G 41.7MB/s eta 70s " + "-8k.pth 73%[=============> ] 2.35G 50.3MB/s eta 17s " ] }, { @@ -6036,7 +6055,7 @@ "output_type": "stream", "text": [ "\r", - "-ctx-8k.pth 48%[========> ] 2.75G 44.8MB/s eta 70s " + "8k.pth 73%[=============> ] 2.35G 49.2MB/s eta 17s " ] }, { @@ -6044,7 +6063,7 @@ "output_type": "stream", "text": [ "\r", - "ctx-8k.pth 48%[========> ] 2.76G 44.6MB/s eta 70s " + "k.pth 73%[=============> ] 2.37G 49.4MB/s eta 17s " ] }, { @@ -6052,7 +6071,7 @@ "output_type": "stream", "text": [ "\r", - "tx-8k.pth 49%[========> ] 2.77G 42.7MB/s eta 70s " + ".pth 74%[=============> ] 2.38G 50.2MB/s eta 17s " ] }, { @@ -6060,7 +6079,7 @@ "output_type": "stream", "text": [ "\r", - "x-8k.pth 49%[========> ] 2.79G 44.0MB/s eta 70s " + "pth 74%[=============> ] 2.39G 48.5MB/s eta 17s " ] }, { @@ -6068,7 +6087,7 @@ "output_type": "stream", "text": [ "\r", - "-8k.pth 49%[========> ] 2.81G 45.8MB/s eta 68s " + "th 74%[=============> ] 2.40G 47.0MB/s eta 16s " ] }, { @@ -6076,7 +6095,7 @@ "output_type": "stream", "text": [ "\r", - "8k.pth 49%[========> ] 2.81G 47.1MB/s eta 68s " + "h 75%[==============> ] 2.41G 47.5MB/s eta 16s " ] }, { @@ -6084,7 +6103,7 @@ "output_type": "stream", "text": [ "\r", - "k.pth 49%[========> ] 2.82G 41.1MB/s eta 68s " + " 75%[==============> ] 2.41G 46.8MB/s eta 16s " ] }, { @@ -6092,7 +6111,7 @@ "output_type": "stream", "text": [ "\r", - ".pth 50%[=========> ] 2.83G 42.8MB/s eta 68s " + " v 75%[==============> ] 2.41G 45.5MB/s eta 16s " ] }, { @@ -6100,7 +6119,7 @@ "output_type": "stream", "text": [ "\r", - "pth 50%[=========> ] 2.85G 43.0MB/s eta 67s " + " v5 76%[==============> ] 2.44G 49.9MB/s eta 16s " ] }, { @@ -6108,7 +6127,7 @@ "output_type": "stream", "text": [ "\r", - "th 50%[=========> ] 2.86G 45.6MB/s eta 67s " + " v5- 76%[==============> ] 2.44G 46.5MB/s eta 15s " ] }, { @@ -6116,7 +6135,7 @@ "output_type": "stream", "text": [ "\r", - "h 50%[=========> ] 2.88G 46.0MB/s eta 67s " + " v5-L 76%[==============> ] 2.46G 46.8MB/s eta 15s " ] }, { @@ -6124,7 +6143,7 @@ "output_type": "stream", "text": [ "\r", - " 51%[=========> ] 2.89G 47.7MB/s eta 67s " + " v5-L6 76%[==============> ] 2.46G 45.3MB/s eta 15s " ] }, { @@ -6132,7 +6151,7 @@ "output_type": "stream", "text": [ "\r", - " E 51%[=========> ] 2.90G 47.0MB/s eta 66s " + " v5-L6- 77%[==============> ] 2.47G 44.0MB/s eta 15s " ] }, { @@ -6140,7 +6159,7 @@ "output_type": "stream", "text": [ "\r", - " EW 51%[=========> ] 2.91G 47.1MB/s eta 66s " + " v5-L6-D 77%[==============> ] 2.49G 46.3MB/s eta 15s " ] }, { @@ -6148,7 +6167,7 @@ "output_type": "stream", "text": [ "\r", - " EWR 51%[=========> ] 2.92G 49.3MB/s eta 66s " + " v5-L6-D4 77%[==============> ] 2.50G 45.0MB/s eta 14s " ] }, { @@ -6156,7 +6175,7 @@ "output_type": "stream", "text": [ "\r", - " EWR- 51%[=========> ] 2.92G 46.0MB/s eta 66s " + " v5-L6-D40 78%[==============> ] 2.51G 45.7MB/s eta 14s " ] }, { @@ -6164,7 +6183,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1 52%[=========> ] 2.93G 47.6MB/s eta 65s " + " v5-L6-D409 78%[==============> ] 2.52G 46.3MB/s eta 14s " ] }, { @@ -6172,7 +6191,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B 52%[=========> ] 2.95G 47.6MB/s eta 65s " + " v5-L6-D4096 79%[==============> ] 2.53G 45.4MB/s eta 14s " ] }, { @@ -6180,7 +6199,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5 52%[=========> ] 2.96G 46.1MB/s eta 65s " + " v5-L6-D4096- 79%[==============> ] 2.55G 45.6MB/s eta 14s " ] }, { @@ -6188,7 +6207,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5- 52%[=========> ] 2.98G 45.3MB/s eta 64s " + " v5-L6-D4096-E 79%[==============> ] 2.56G 48.4MB/s eta 13s " ] }, { @@ -6196,7 +6215,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E 53%[=========> ] 2.99G 44.4MB/s eta 64s " + " v5-L6-D4096-E0 80%[===============> ] 2.58G 48.2MB/s eta 13s " ] }, { @@ -6204,7 +6223,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0 53%[=========> ] 3.00G 42.1MB/s eta 64s " + " v5-L6-D4096-E0_ 80%[===============> ] 2.58G 46.9MB/s eta 13s " ] }, { @@ -6212,7 +6231,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_ 53%[=========> ] 3.01G 43.2MB/s eta 64s " + " v5-L6-D4096-E0_1 80%[===============> ] 2.59G 49.3MB/s eta 13s " ] }, { @@ -6220,7 +6239,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1 53%[=========> ] 3.01G 42.8MB/s eta 64s " + " v5-L6-D4096-E0_1- 81%[===============> ] 2.61G 45.2MB/s eta 12s " ] }, { @@ -6228,7 +6247,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1- 53%[=========> ] 3.02G 42.3MB/s eta 63s " + " v5-L6-D4096-E0_1-m 81%[===============> ] 2.62G 48.9MB/s eta 12s " ] }, { @@ -6236,7 +6255,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-m 53%[=========> ] 3.04G 42.0MB/s eta 63s " + "v5-L6-D4096-E0_1-me 82%[===============> ] 2.64G 48.9MB/s eta 12s " ] }, { @@ -6244,7 +6263,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-me 53%[=========> ] 3.04G 39.4MB/s eta 63s " + "5-L6-D4096-E0_1-mem 82%[===============> ] 2.65G 49.2MB/s eta 12s " ] }, { @@ -6252,7 +6271,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem 54%[=========> ] 3.05G 38.4MB/s eta 63s " + "-L6-D4096-E0_1-mem- 83%[===============> ] 2.67G 49.8MB/s eta 12s " ] }, { @@ -6260,7 +6279,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem- 54%[=========> ] 3.07G 39.7MB/s eta 62s " + "L6-D4096-E0_1-mem-c 83%[===============> ] 2.68G 50.8MB/s eta 10s " ] }, { @@ -6268,7 +6287,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-mem-c 54%[=========> ] 3.08G 40.7MB/s eta 62s " + "6-D4096-E0_1-mem-ct 84%[===============> ] 2.70G 50.6MB/s eta 10s " ] }, { @@ -6276,7 +6295,7 @@ "output_type": "stream", "text": [ "\r", - "EWR-1B5-E0_1-mem-ct 54%[=========> ] 3.09G 40.4MB/s eta 62s " + "-D4096-E0_1-mem-ctx 84%[===============> ] 2.70G 50.0MB/s eta 10s " ] }, { @@ -6284,7 +6303,7 @@ "output_type": "stream", "text": [ "\r", - "WR-1B5-E0_1-mem-ctx 54%[=========> ] 3.10G 39.0MB/s eta 62s " + "D4096-E0_1-mem-ctx- 84%[===============> ] 2.71G 49.3MB/s eta 10s " ] }, { @@ -6292,7 +6311,7 @@ "output_type": "stream", "text": [ "\r", - "R-1B5-E0_1-mem-ctx- 55%[==========> ] 3.11G 41.6MB/s eta 61s " + "4096-E0_1-mem-ctx-8 85%[================> ] 2.73G 49.5MB/s eta 10s " ] }, { @@ -6300,7 +6319,7 @@ "output_type": "stream", "text": [ "\r", - "-1B5-E0_1-mem-ctx-8 55%[==========> ] 3.13G 39.1MB/s eta 61s " + "096-E0_1-mem-ctx-8k 85%[================> ] 2.74G 52.1MB/s eta 9s " ] }, { @@ -6308,7 +6327,7 @@ "output_type": "stream", "text": [ "\r", - "1B5-E0_1-mem-ctx-8k 55%[==========> ] 3.14G 40.3MB/s eta 61s " + "96-E0_1-mem-ctx-8k. 86%[================> ] 2.76G 51.2MB/s eta 9s " ] }, { @@ -6316,7 +6335,7 @@ "output_type": "stream", "text": [ "\r", - "B5-E0_1-mem-ctx-8k. 55%[==========> ] 3.16G 41.2MB/s eta 61s " + "6-E0_1-mem-ctx-8k.p 86%[================> ] 2.77G 53.9MB/s eta 9s " ] }, { @@ -6324,7 +6343,7 @@ "output_type": "stream", "text": [ "\r", - "5-E0_1-mem-ctx-8k.p 56%[==========> ] 3.17G 40.5MB/s eta 59s " + "-E0_1-mem-ctx-8k.pt 86%[================> ] 2.77G 50.2MB/s eta 9s " ] }, { @@ -6332,7 +6351,7 @@ "output_type": "stream", "text": [ "\r", - "-E0_1-mem-ctx-8k.pt 56%[==========> ] 3.17G 40.1MB/s eta 59s " + "E0_1-mem-ctx-8k.pth 87%[================> ] 2.80G 54.7MB/s eta 8s " ] }, { @@ -6340,7 +6359,7 @@ "output_type": "stream", "text": [ "\r", - "E0_1-mem-ctx-8k.pth 56%[==========> ] 3.19G 42.1MB/s eta 59s " + "0_1-mem-ctx-8k.pth 87%[================> ] 2.82G 57.2MB/s eta 8s " ] }, { @@ -6348,7 +6367,7 @@ "output_type": "stream", "text": [ "\r", - "0_1-mem-ctx-8k.pth 56%[==========> ] 3.20G 40.8MB/s eta 59s " + "_1-mem-ctx-8k.pth 88%[================> ] 2.83G 57.9MB/s eta 8s " ] }, { @@ -6356,7 +6375,7 @@ "output_type": "stream", "text": [ "\r", - "_1-mem-ctx-8k.pth 57%[==========> ] 3.22G 42.3MB/s eta 59s " + "1-mem-ctx-8k.pth 88%[================> ] 2.84G 56.5MB/s eta 8s " ] }, { @@ -6364,7 +6383,7 @@ "output_type": "stream", "text": [ "\r", - "1-mem-ctx-8k.pth 57%[==========> ] 3.23G 41.8MB/s eta 59s " + "-mem-ctx-8k.pth 89%[================> ] 2.86G 57.9MB/s eta 8s " ] }, { @@ -6372,7 +6391,7 @@ "output_type": "stream", "text": [ "\r", - "-mem-ctx-8k.pth 57%[==========> ] 3.23G 39.6MB/s eta 59s " + "mem-ctx-8k.pth 89%[================> ] 2.86G 56.1MB/s eta 7s " ] }, { @@ -6380,7 +6399,7 @@ "output_type": "stream", "text": [ "\r", - "mem-ctx-8k.pth 57%[==========> ] 3.25G 38.5MB/s eta 58s " + "em-ctx-8k.pth 89%[================> ] 2.88G 55.1MB/s eta 7s " ] }, { @@ -6388,7 +6407,7 @@ "output_type": "stream", "text": [ "\r", - "em-ctx-8k.pth 57%[==========> ] 3.25G 37.9MB/s eta 58s " + "m-ctx-8k.pth 90%[=================> ] 2.89G 55.6MB/s eta 7s " ] }, { @@ -6396,7 +6415,7 @@ "output_type": "stream", "text": [ "\r", - "m-ctx-8k.pth 57%[==========> ] 3.26G 36.7MB/s eta 58s " + "-ctx-8k.pth 90%[=================> ] 2.89G 53.6MB/s eta 7s " ] }, { @@ -6404,7 +6423,7 @@ "output_type": "stream", "text": [ "\r", - "-ctx-8k.pth 58%[==========> ] 3.28G 40.0MB/s eta 58s " + "ctx-8k.pth 90%[=================> ] 2.91G 54.0MB/s eta 7s " ] }, { @@ -6412,7 +6431,7 @@ "output_type": "stream", "text": [ "\r", - "ctx-8k.pth 58%[==========> ] 3.29G 38.9MB/s eta 57s " + "tx-8k.pth 91%[=================> ] 2.92G 57.0MB/s eta 6s " ] }, { @@ -6420,7 +6439,7 @@ "output_type": "stream", "text": [ "\r", - "tx-8k.pth 58%[==========> ] 3.31G 40.8MB/s eta 57s " + "x-8k.pth 91%[=================> ] 2.94G 57.0MB/s eta 6s " ] }, { @@ -6428,7 +6447,7 @@ "output_type": "stream", "text": [ "\r", - "x-8k.pth 58%[==========> ] 3.32G 39.4MB/s eta 57s " + "-8k.pth 91%[=================> ] 2.94G 54.9MB/s eta 6s " ] }, { @@ -6436,7 +6455,7 @@ "output_type": "stream", "text": [ "\r", - "-8k.pth 58%[==========> ] 3.32G 39.4MB/s eta 57s " + "8k.pth 91%[=================> ] 2.95G 53.2MB/s eta 6s " ] }, { @@ -6444,7 +6463,7 @@ "output_type": "stream", "text": [ "\r", - "8k.pth 58%[==========> ] 3.32G 37.4MB/s eta 57s " + "k.pth 92%[=================> ] 2.95G 48.8MB/s eta 6s " ] }, { @@ -6452,7 +6471,7 @@ "output_type": "stream", "text": [ "\r", - "k.pth 59%[==========> ] 3.34G 37.5MB/s eta 56s " + ".pth 92%[=================> ] 2.96G 51.8MB/s eta 5s " ] }, { @@ -6460,7 +6479,7 @@ "output_type": "stream", "text": [ "\r", - ".pth 59%[==========> ] 3.35G 36.2MB/s eta 56s " + "pth 92%[=================> ] 2.97G 51.1MB/s eta 5s " ] }, { @@ -6468,7 +6487,7 @@ "output_type": "stream", "text": [ "\r", - "pth 59%[==========> ] 3.37G 37.6MB/s eta 56s " + "th 92%[=================> ] 2.98G 50.6MB/s eta 5s " ] }, { @@ -6476,7 +6495,7 @@ "output_type": "stream", "text": [ "\r", - "th 59%[==========> ] 3.38G 40.2MB/s eta 56s " + "h 92%[=================> ] 2.98G 44.5MB/s eta 5s " ] }, { @@ -6484,7 +6503,7 @@ "output_type": "stream", "text": [ "\r", - "h 60%[===========> ] 3.40G 39.4MB/s eta 54s " + " 93%[=================> ] 2.99G 46.9MB/s eta 5s " ] }, { @@ -6492,7 +6511,7 @@ "output_type": "stream", "text": [ "\r", - " 60%[===========> ] 3.40G 39.9MB/s eta 54s " + " v 93%[=================> ] 3.01G 44.4MB/s eta 4s " ] }, { @@ -6500,7 +6519,7 @@ "output_type": "stream", "text": [ "\r", - " E 60%[===========> ] 3.41G 41.4MB/s eta 54s " + " v5 94%[=================> ] 3.02G 44.4MB/s eta 4s " ] }, { @@ -6508,7 +6527,7 @@ "output_type": "stream", "text": [ "\r", - " EW 60%[===========> ] 3.43G 44.3MB/s eta 54s " + " v5- 94%[=================> ] 3.04G 45.9MB/s eta 4s " ] }, { @@ -6516,7 +6535,7 @@ "output_type": "stream", "text": [ "\r", - " EWR 60%[===========> ] 3.44G 43.2MB/s eta 53s " + " v5-L 95%[==================> ] 3.05G 45.5MB/s eta 4s " ] }, { @@ -6524,7 +6543,7 @@ "output_type": "stream", "text": [ "\r", - " EWR- 61%[===========> ] 3.44G 39.0MB/s eta 53s " + " v5-L6 95%[==================> ] 3.07G 48.1MB/s eta 3s " ] }, { @@ -6532,7 +6551,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1 61%[===========> ] 3.45G 40.3MB/s eta 53s " + " v5-L6- 96%[==================> ] 3.08G 47.2MB/s eta 3s " ] }, { @@ -6540,7 +6559,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B 61%[===========> ] 3.47G 40.4MB/s eta 53s " + " v5-L6-D 96%[==================> ] 3.10G 46.6MB/s eta 3s " ] }, { @@ -6548,7 +6567,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5 61%[===========> ] 3.48G 42.0MB/s eta 52s " + " v5-L6-D4 97%[==================> ] 3.11G 45.8MB/s eta 3s " ] }, { @@ -6556,7 +6575,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5- 61%[===========> ] 3.49G 40.1MB/s eta 52s " + " v5-L6-D40 97%[==================> ] 3.13G 46.7MB/s eta 2s " ] }, { @@ -6564,7 +6583,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E 62%[===========> ] 3.50G 40.5MB/s eta 52s " + " v5-L6-D409 97%[==================> ] 3.13G 45.6MB/s eta 2s " ] }, { @@ -6572,7 +6591,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0 62%[===========> ] 3.51G 43.6MB/s eta 52s " + " v5-L6-D4096 98%[==================> ] 3.15G 48.4MB/s eta 2s " ] }, { @@ -6580,7 +6599,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_ 62%[===========> ] 3.52G 41.1MB/s eta 52s " + " v5-L6-D4096- 98%[==================> ] 3.16G 50.4MB/s eta 2s " ] }, { @@ -6588,7 +6607,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1 62%[===========> ] 3.53G 41.0MB/s eta 52s " + " v5-L6-D4096-E 98%[==================> ] 3.16G 48.0MB/s eta 2s " ] }, { @@ -6596,7 +6615,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1- 62%[===========> ] 3.53G 37.2MB/s eta 52s " + " v5-L6-D4096-E0 99%[==================> ] 3.17G 49.5MB/s eta 1s " ] }, { @@ -6604,7 +6623,7 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-m 62%[===========> ] 3.55G 40.0MB/s eta 52s " + " v5-L6-D4096-E0_ 99%[==================> ] 3.19G 50.4MB/s eta 1s " ] }, { @@ -6612,7680 +6631,628 @@ "output_type": "stream", "text": [ "\r", - " EWR-1B5-E0_1-me 63%[===========> ] 3.56G 39.6MB/s eta 51s " + " v5-L6-D4096-E0_1 99%[==================> ] 3.20G 53.9MB/s eta 1s \r", + "v5-L6-D4096-E0_1-me 100%[===================>] 3.21G 53.9MB/s in 64s \r\n", + "\r\n", + "2023-08-26 13:30:39 (51.4 MB/s) - ‘v5-L6-D4096-E0_1-mem-ctx-8k.pth’ saved [3441599237/3441599237]\r\n", + "\r\n" ] + } + ], + "source": [ + "# Lets download the custom models\n", + "!mkdir -p ../../../model/\n", + "!cd ../../../model/ && wget -nc \"https://huggingface.co/picocreator/memory-size-experiment-for-rwkv/resolve/main/RWKV-v5-baseline/BaseV5-C-Tune5.pth\"\n", + "!cd ../../../model/ && wget -nc \"https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/EWR-1B5-E0_1-mem-ctx-8k.pth\"\n", + "!cd ../../../model/ && wget -nc \"https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/v5-L6-D2048-E0_1-mem-ctx-8k.pth\"\n", + "!cd ../../../model/ && wget -nc \"https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/v5-L6-D4096-E0_1-mem-ctx-8k.pth\"" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "fbaa4381", + "metadata": { + "execution": { + "iopub.execute_input": "2023-08-26T13:30:39.660558Z", + "iopub.status.busy": "2023-08-26T13:30:39.659105Z", + "iopub.status.idle": "2023-08-26T13:30:39.915027Z", + "shell.execute_reply": "2023-08-26T13:30:39.914129Z" + }, + "papermill": { + "duration": 0.309269, + "end_time": "2023-08-26T13:30:39.917097", + "exception": false, + "start_time": "2023-08-26T13:30:39.607828", + "status": "completed" }, + "tags": [] + }, + "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E0_1-mem 63%[===========> ] 3.58G 41.2MB/s eta 51s " + "total 16G\r\n", + "-rw-r--r-- 1 root root 5.7G Aug 11 12:48 BaseV5-C-Tune5.pth\r\n", + "-rw-r--r-- 1 root root 5.7G Aug 17 14:38 EWR-1B5-E0_1-mem-ctx-8k.pth\r\n", + "-rw-r--r-- 1 root root 1018M Aug 19 08:33 v5-L6-D2048-E0_1-mem-ctx-8k.pth\r\n", + "-rw-r--r-- 1 root root 3.3G Aug 20 14:58 v5-L6-D4096-E0_1-mem-ctx-8k.pth\r\n" ] + } + ], + "source": [ + "!ls -lh ../../../model/" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "d97d8780", + "metadata": { + "execution": { + "iopub.execute_input": "2023-08-26T13:30:40.012919Z", + "iopub.status.busy": "2023-08-26T13:30:40.012535Z", + "iopub.status.idle": "2023-08-26T13:30:40.265417Z", + "shell.execute_reply": "2023-08-26T13:30:40.264441Z" + }, + "papermill": { + "duration": 0.303594, + "end_time": "2023-08-26T13:30:40.267576", + "exception": false, + "start_time": "2023-08-26T13:30:39.963982", + "status": "completed" }, + "tags": [] + }, + "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E0_1-mem- 63%[===========> ] 3.59G 39.2MB/s eta 51s " + "/usr/bin/sh: 1: python: not found\r\n" ] + } + ], + "source": [ + "!python -m pip install aiocsv aiofiles" + ] + }, + { + "cell_type": "markdown", + "id": "84e31882", + "metadata": { + "papermill": { + "duration": 0.046789, + "end_time": "2023-08-26T13:30:40.361168", + "exception": false, + "start_time": "2023-08-26T13:30:40.314379", + "status": "completed" + }, + "tags": [] + }, + "source": [ + "# 1B5 V5 benchmark" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "b787699a", + "metadata": { + "execution": { + "iopub.execute_input": "2023-08-26T13:30:40.457229Z", + "iopub.status.busy": "2023-08-26T13:30:40.456877Z", + "iopub.status.idle": "2023-08-26T13:31:50.055322Z", + "shell.execute_reply": "2023-08-26T13:31:50.054422Z" }, + "papermill": { + "duration": 69.64913, + "end_time": "2023-08-26T13:31:50.057468", + "exception": false, + "start_time": "2023-08-26T13:30:40.408338", + "status": "completed" + }, + "tags": [] + }, + "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E0_1-mem-c 63%[===========> ] 3.59G 38.2MB/s eta 50s " + "[2023-08-26 13:30:44,674] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "EWR-1B5-E0_1-mem-ct 63%[===========> ] 3.61G 38.4MB/s eta 50s " + "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "WR-1B5-E0_1-mem-ctx 63%[===========> ] 3.61G 36.7MB/s eta 50s " + "###\r\n", + "### Model validation start ###\r\n", + "###\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "R-1B5-E0_1-mem-ctx- 64%[===========> ] 3.62G 36.4MB/s eta 50s " + "## Model validation for 5 tokens : 100.0% similarity, with 5 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "-1B5-E0_1-mem-ctx-8 64%[===========> ] 3.63G 39.5MB/s eta 49s " + "## Model validation for 10 tokens : 100.0% similarity, with 10 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "1B5-E0_1-mem-ctx-8k 64%[===========> ] 3.64G 37.0MB/s eta 49s " + "## Model validation for 15 tokens : 100.0% similarity, with 15 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "B5-E0_1-mem-ctx-8k. 64%[===========> ] 3.65G 35.4MB/s eta 49s " + "## Model validation for 20 tokens : 100.0% similarity, with 20 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "5-E0_1-mem-ctx-8k.p 64%[===========> ] 3.67G 37.0MB/s eta 49s " + "## Model validation for 25 tokens : 100.0% similarity, with 25 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 65%[============> ] 3.67G 37.2MB/s eta 48s " + "## Model validation for 30 tokens : 100.0% similarity, with 30 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 65%[============> ] 3.68G 36.3MB/s eta 48s " + "## Model validation for 35 tokens : 100.0% similarity, with 35 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "0_1-mem-ctx-8k.pth 65%[============> ] 3.70G 37.2MB/s eta 48s " + "## Model validation for 40 tokens : 100.0% similarity, with 40 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "_1-mem-ctx-8k.pth 65%[============> ] 3.71G 38.7MB/s eta 48s " + "## Model validation for 45 tokens : 100.0% similarity, with 45 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "1-mem-ctx-8k.pth 65%[============> ] 3.72G 41.4MB/s eta 48s " + "## Model validation for 50 tokens : 100.0% similarity, with 50 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "-mem-ctx-8k.pth 66%[============> ] 3.72G 38.7MB/s eta 47s " + "## Model validation for 55 tokens : 100.0% similarity, with 55 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "mem-ctx-8k.pth 66%[============> ] 3.74G 38.7MB/s eta 47s " + "## Model validation for 60 tokens : 100.0% similarity, with 60 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "em-ctx-8k.pth 66%[============> ] 3.75G 42.7MB/s eta 47s " + "## Model validation for 65 tokens : 100.0% similarity, with 65 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "m-ctx-8k.pth 66%[============> ] 3.77G 45.0MB/s eta 47s " + "## Model validation for 70 tokens : 100.0% similarity, with 70 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "-ctx-8k.pth 67%[============> ] 3.78G 45.9MB/s eta 45s " + "## Model validation for 75 tokens : 100.0% similarity, with 75 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "ctx-8k.pth 67%[============> ] 3.80G 47.1MB/s eta 45s " + "## Model validation for 80 tokens : 100.0% similarity, with 80 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "tx-8k.pth 67%[============> ] 3.80G 44.4MB/s eta 45s " + "## Model validation for 85 tokens : 100.0% similarity, with 85 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "x-8k.pth 67%[============> ] 3.81G 47.1MB/s eta 45s " + "## Model validation for 90 tokens : 100.0% similarity, with 90 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "-8k.pth 67%[============> ] 3.83G 47.4MB/s eta 44s " + "## Model validation for 95 tokens : 100.0% similarity, with 95 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "8k.pth 68%[============> ] 3.84G 46.5MB/s eta 44s " + "## Model validation for 100 tokens : 100.0% similarity, with 100 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "k.pth 68%[============> ] 3.86G 48.3MB/s eta 44s " + "## Model validation for 105 tokens : 100.0% similarity, with 105 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - ".pth 68%[============> ] 3.87G 50.8MB/s eta 44s " + "## Model validation for 110 tokens : 100.0% similarity, with 110 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "pth 68%[============> ] 3.87G 45.6MB/s eta 43s " + "## Model validation for 115 tokens : 100.0% similarity, with 115 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "th 68%[============> ] 3.89G 47.4MB/s eta 43s " + "## Model validation for 120 tokens : 100.0% similarity, with 120 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "h 69%[============> ] 3.90G 46.5MB/s eta 43s " + "## Model validation for 125 tokens : 100.0% similarity, with 125 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " 69%[============> ] 3.92G 45.8MB/s eta 43s " + "## Model validation for 130 tokens : 100.0% similarity, with 130 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " E 69%[============> ] 3.93G 47.5MB/s eta 42s " + "## Model validation for 135 tokens : 100.0% similarity, with 135 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EW 69%[============> ] 3.95G 47.3MB/s eta 42s " + "## Model validation for 140 tokens : 100.0% similarity, with 140 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR 70%[=============> ] 3.96G 47.2MB/s eta 42s " + "## Model validation for 145 tokens : 100.0% similarity, with 145 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR- 70%[=============> ] 3.98G 47.1MB/s eta 42s " + "## Model validation for 150 tokens : 100.0% similarity, with 150 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1 70%[=============> ] 3.99G 46.7MB/s eta 40s " + "## Model validation for 160 tokens : 100.0% similarity, with 160 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B 70%[=============> ] 3.99G 46.8MB/s eta 40s " + "## Model validation for 170 tokens : 100.0% similarity, with 170 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5 71%[=============> ] 4.01G 47.6MB/s eta 40s " + "## Model validation for 180 tokens : 100.0% similarity, with 180 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5- 71%[=============> ] 4.02G 46.1MB/s eta 40s " + "## Model validation for 190 tokens : 99.47368421052632% similarity, with 189 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E 71%[=============> ] 4.04G 47.1MB/s eta 39s " + "## Model validation for 200 tokens : 100.0% similarity, with 200 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E0 71%[=============> ] 4.04G 44.9MB/s eta 39s " + "## Model validation for 210 tokens : 100.0% similarity, with 210 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E0_ 71%[=============> ] 4.05G 43.9MB/s eta 39s " + "## Model validation for 220 tokens : 100.0% similarity, with 220 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E0_1 71%[=============> ] 4.05G 42.3MB/s eta 39s " + "## Model validation for 230 tokens : 100.0% similarity, with 230 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E0_1- 72%[=============> ] 4.07G 43.7MB/s eta 39s " + "## Model validation for 240 tokens : 100.0% similarity, with 240 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E0_1-m 72%[=============> ] 4.08G 45.2MB/s eta 38s " + "## Model validation for 250 tokens : 100.0% similarity, with 250 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E0_1-me 72%[=============> ] 4.10G 43.4MB/s eta 38s " + "## Model validation for 260 tokens : 100.0% similarity, with 260 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E0_1-mem 72%[=============> ] 4.11G 44.8MB/s eta 38s " + "## Model validation for 270 tokens : 100.0% similarity, with 270 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E0_1-mem- 73%[=============> ] 4.13G 44.4MB/s eta 37s " + "## Model validation for 280 tokens : 99.64285714285714% similarity, with 279 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - " EWR-1B5-E0_1-mem-c 73%[=============> ] 4.14G 45.7MB/s eta 37s " + "## Model validation for 290 tokens : 100.0% similarity, with 290 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "EWR-1B5-E0_1-mem-ct 73%[=============> ] 4.15G 43.7MB/s eta 37s " + "## Model validation for 300 tokens : 99.66666666666667% similarity, with 299 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "WR-1B5-E0_1-mem-ctx 73%[=============> ] 4.16G 43.0MB/s eta 37s " + "## Model validation for 325 tokens : 100.0% similarity, with 325 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "R-1B5-E0_1-mem-ctx- 73%[=============> ] 4.16G 43.0MB/s eta 37s " + "## Model validation for 350 tokens : 100.0% similarity, with 350 matched token, and 0 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "-1B5-E0_1-mem-ctx-8 73%[=============> ] 4.17G 38.8MB/s eta 36s " + "## Model validation for 375 tokens : 99.46666666666667% similarity, with 373 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "1B5-E0_1-mem-ctx-8k 74%[=============> ] 4.19G 39.7MB/s eta 36s " + "## Model validation for 400 tokens : 99.75% similarity, with 399 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "B5-E0_1-mem-ctx-8k. 74%[=============> ] 4.19G 37.9MB/s eta 36s " + "## Model validation for 425 tokens : 99.76470588235294% similarity, with 424 matched token, and 1 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "5-E0_1-mem-ctx-8k.p 74%[=============> ] 4.20G 40.7MB/s eta 36s " + "## Model validation for 450 tokens : 99.55555555555556% similarity, with 448 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 74%[=============> ] 4.22G 38.7MB/s eta 35s " + "## Model validation for 475 tokens : 99.36842105263159% similarity, with 472 matched token, and 3 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 74%[=============> ] 4.23G 39.7MB/s eta 35s " + "## Model validation for 500 tokens : 99.6% similarity, with 498 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "\r", - "0_1-mem-ctx-8k.pth 74%[=============> ] 4.23G 36.9MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 75%[==============> ] 4.24G 36.4MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 75%[==============> ] 4.25G 33.9MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 75%[==============> ] 4.26G 37.3MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 75%[==============> ] 4.26G 33.7MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 75%[==============> ] 4.28G 33.8MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 76%[==============> ] 4.29G 37.0MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 76%[==============> ] 4.31G 38.3MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 76%[==============> ] 4.32G 38.8MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 76%[==============> ] 4.33G 39.8MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 77%[==============> ] 4.35G 39.3MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 77%[==============> ] 4.35G 39.1MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 77%[==============> ] 4.36G 41.5MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 77%[==============> ] 4.37G 39.0MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 77%[==============> ] 4.38G 39.8MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 77%[==============> ] 4.39G 42.4MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 77%[==============> ] 4.40G 41.6MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 78%[==============> ] 4.41G 41.9MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 78%[==============> ] 4.42G 42.7MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " E 78%[==============> ] 4.42G 39.5MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EW 78%[==============> ] 4.44G 41.8MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR 78%[==============> ] 4.46G 43.6MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR- 79%[==============> ] 4.47G 43.6MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1 79%[==============> ] 4.48G 44.1MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B 79%[==============> ] 4.50G 41.2MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5 79%[==============> ] 4.50G 41.8MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5- 79%[==============> ] 4.51G 42.8MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E 80%[===============> ] 4.53G 44.4MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0 80%[===============> ] 4.54G 45.8MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_ 80%[===============> ] 4.56G 45.6MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1 81%[===============> ] 4.57G 45.7MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1- 81%[===============> ] 4.57G 41.8MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-m 81%[===============> ] 4.58G 43.0MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-me 81%[===============> ] 4.59G 42.0MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-mem 81%[===============> ] 4.60G 44.0MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-mem- 81%[===============> ] 4.62G 44.3MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-mem-c 81%[===============> ] 4.62G 44.2MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "EWR-1B5-E0_1-mem-ct 82%[===============> ] 4.63G 43.3MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "WR-1B5-E0_1-mem-ctx 82%[===============> ] 4.63G 41.0MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "R-1B5-E0_1-mem-ctx- 82%[===============> ] 4.65G 41.0MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-1B5-E0_1-mem-ctx-8 82%[===============> ] 4.66G 40.5MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1B5-E0_1-mem-ctx-8k 82%[===============> ] 4.66G 39.2MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "B5-E0_1-mem-ctx-8k. 82%[===============> ] 4.68G 40.9MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-E0_1-mem-ctx-8k.p 83%[===============> ] 4.69G 40.1MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 83%[===============> ] 4.70G 38.9MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 83%[===============> ] 4.71G 39.6MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 83%[===============> ] 4.71G 37.2MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 83%[===============> ] 4.72G 36.7MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 83%[===============> ] 4.74G 39.8MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 84%[===============> ] 4.75G 42.6MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 84%[===============> ] 4.75G 40.3MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 84%[===============> ] 4.77G 40.6MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 84%[===============> ] 4.78G 40.8MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 84%[===============> ] 4.78G 38.1MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 85%[================> ] 4.80G 40.7MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 85%[================> ] 4.81G 41.0MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 85%[================> ] 4.83G 43.0MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 85%[================> ] 4.84G 42.3MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 86%[================> ] 4.86G 43.2MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 86%[================> ] 4.86G 41.5MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 86%[================> ] 4.88G 44.0MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 86%[================> ] 4.89G 43.8MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 86%[================> ] 4.89G 41.2MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 86%[================> ] 4.90G 41.5MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 86%[================> ] 4.90G 42.0MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " E 87%[================> ] 4.92G 41.3MB/s eta 18s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EW 87%[================> ] 4.93G 40.9MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR 87%[================> ] 4.95G 41.4MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR- 87%[================> ] 4.96G 41.3MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1 88%[================> ] 4.97G 40.8MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B 88%[================> ] 4.98G 40.8MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5 88%[================> ] 4.99G 44.3MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5- 88%[================> ] 4.99G 41.2MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E 88%[================> ] 5.01G 41.5MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0 88%[================> ] 5.02G 41.3MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_ 89%[================> ] 5.04G 42.0MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1 89%[================> ] 5.04G 38.3MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1- 89%[================> ] 5.05G 41.0MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-m 89%[================> ] 5.07G 40.1MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-me 90%[=================> ] 5.08G 39.3MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-mem 90%[=================> ] 5.09G 42.3MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-mem- 90%[=================> ] 5.10G 42.4MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-mem-c 90%[=================> ] 5.11G 42.5MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "EWR-1B5-E0_1-mem-ct 90%[=================> ] 5.13G 43.3MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "WR-1B5-E0_1-mem-ctx 91%[=================> ] 5.14G 43.5MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "R-1B5-E0_1-mem-ctx- 91%[=================> ] 5.15G 44.4MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-1B5-E0_1-mem-ctx-8 91%[=================> ] 5.16G 43.3MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1B5-E0_1-mem-ctx-8k 91%[=================> ] 5.17G 44.0MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "B5-E0_1-mem-ctx-8k. 91%[=================> ] 5.18G 42.9MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-E0_1-mem-ctx-8k.p 91%[=================> ] 5.19G 42.8MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 92%[=================> ] 5.20G 42.4MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 92%[=================> ] 5.21G 43.0MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 92%[=================> ] 5.23G 44.3MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 92%[=================> ] 5.24G 47.5MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 92%[=================> ] 5.25G 44.5MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 93%[=================> ] 5.26G 42.8MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 93%[=================> ] 5.27G 43.3MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 93%[=================> ] 5.28G 43.9MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 93%[=================> ] 5.29G 43.5MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 93%[=================> ] 5.30G 42.6MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 93%[=================> ] 5.30G 39.5MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 94%[=================> ] 5.32G 41.6MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 94%[=================> ] 5.33G 40.0MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 94%[=================> ] 5.35G 41.7MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 95%[==================> ] 5.36G 43.6MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 95%[==================> ] 5.38G 42.7MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 95%[==================> ] 5.38G 43.0MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 95%[==================> ] 5.39G 43.0MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 95%[==================> ] 5.41G 42.4MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 96%[==================> ] 5.42G 43.4MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 96%[==================> ] 5.44G 43.4MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " E 96%[==================> ] 5.44G 44.0MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EW 96%[==================> ] 5.45G 43.9MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR 96%[==================> ] 5.47G 42.4MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR- 96%[==================> ] 5.47G 39.9MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1 97%[==================> ] 5.48G 43.2MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B 97%[==================> ] 5.50G 43.1MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5 97%[==================> ] 5.50G 42.9MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5- 97%[==================> ] 5.51G 41.6MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E 97%[==================> ] 5.53G 44.0MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0 98%[==================> ] 5.53G 42.1MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_ 98%[==================> ] 5.54G 41.1MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1 98%[==================> ] 5.54G 39.0MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1- 98%[==================> ] 5.56G 39.8MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-m 98%[==================> ] 5.57G 38.9MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-me 98%[==================> ] 5.58G 38.8MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-mem 99%[==================> ] 5.59G 36.4MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-mem- 99%[==================> ] 5.60G 39.1MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " EWR-1B5-E0_1-mem-c 99%[==================> ] 5.62G 38.1MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "EWR-1B5-E0_1-mem-ct 99%[==================> ] 5.63G 41.0MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "WR-1B5-E0_1-mem-ctx 99%[==================> ] 5.64G 40.3MB/s eta 1s \r", - "EWR-1B5-E0_1-mem-ct 100%[===================>] 5.64G 40.6MB/s in 2m 17s \r\n", - "\r\n", - "2023-09-05 20:02:49 (42.0 MB/s) - ‘EWR-1B5-E0_1-mem-ctx-8k.pth’ saved [6060483163/6060483163]\r\n", - "\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "--2023-09-05 20:02:49-- https://huggingface.co/rwkv-x-dev/rwkv-x-playground/resolve/main/experiment/rwkv-x-exp/v5-slim-memory/v5-L6-D1024-E0_1-mem-ctx-8k.pth\r\n", - "Resolving huggingface.co (huggingface.co)... 18.154.227.69, 18.154.227.87, 18.154.227.67, ...\r\n", - "Connecting to huggingface.co (huggingface.co)|18.154.227.69|:443... connected.\r\n", - "HTTP request sent, awaiting response... 302 Found\r\n", - "Location: https://cdn-lfs.huggingface.co/repos/2e/f7/2ef78555202aa92abdbdf476ce3d0fd5a8b15f7245edf0b80d4d30572355f30d/cefa72363bb7dfddb34723de3848f3cc5116c1ff15481f5562317058324b8bf0?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D1024-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D1024-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203370&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzM3MH19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy8yZS9mNy8yZWY3ODU1NTIwMmFhOTJhYmRiZGY0NzZjZTNkMGZkNWE4YjE1ZjcyNDVlZGYwYjgwZDRkMzA1NzIzNTVmMzBkL2NlZmE3MjM2M2JiN2RmZGRiMzQ3MjNkZTM4NDhmM2NjNTExNmMxZmYxNTQ4MWY1NTYyMzE3MDU4MzI0YjhiZjA%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=B66WcOta7appV-JHHd-jMXu8SQjsoaHZFUDZQKrIz-elqYAFJYJb6m1qE2l6RR8yfASI8EA1iiSMO4ht-ToSA%7Eh5w827hJ5jknceswiSmp3dsP8R%7ERv3v79%7EPhXM26Mm0s1RiOhcwWAqJtECD4bFLqx6Ejh978NbajGhvZ08YBZx8aNA2ZPkfx8lK5ozeBRIoQI1NsQivS3r5uFuoe6aEe00iBVYuhSPP6DDtRa1NbEoF6ak4YWTqF6QED3U9Vp899VrgVJZzaEjJcE%7E2Aw6xywAiyfMmRFuG-QbfQ3zD93vVIFKVBaKgXtLNLsXq9OPn2pdMRV-IUKtGvJ2s-zjKA__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", - "--2023-09-05 20:02:50-- https://cdn-lfs.huggingface.co/repos/2e/f7/2ef78555202aa92abdbdf476ce3d0fd5a8b15f7245edf0b80d4d30572355f30d/cefa72363bb7dfddb34723de3848f3cc5116c1ff15481f5562317058324b8bf0?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D1024-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D1024-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203370&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzM3MH19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy8yZS9mNy8yZWY3ODU1NTIwMmFhOTJhYmRiZGY0NzZjZTNkMGZkNWE4YjE1ZjcyNDVlZGYwYjgwZDRkMzA1NzIzNTVmMzBkL2NlZmE3MjM2M2JiN2RmZGRiMzQ3MjNkZTM4NDhmM2NjNTExNmMxZmYxNTQ4MWY1NTYyMzE3MDU4MzI0YjhiZjA%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=B66WcOta7appV-JHHd-jMXu8SQjsoaHZFUDZQKrIz-elqYAFJYJb6m1qE2l6RR8yfASI8EA1iiSMO4ht-ToSA%7Eh5w827hJ5jknceswiSmp3dsP8R%7ERv3v79%7EPhXM26Mm0s1RiOhcwWAqJtECD4bFLqx6Ejh978NbajGhvZ08YBZx8aNA2ZPkfx8lK5ozeBRIoQI1NsQivS3r5uFuoe6aEe00iBVYuhSPP6DDtRa1NbEoF6ak4YWTqF6QED3U9Vp899VrgVJZzaEjJcE%7E2Aw6xywAiyfMmRFuG-QbfQ3zD93vVIFKVBaKgXtLNLsXq9OPn2pdMRV-IUKtGvJ2s-zjKA__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", - "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.49, 108.138.64.36, 108.138.64.111, ...\r\n", - "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.49|:443... " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "connected.\r\n", - "HTTP request sent, awaiting response... " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "200 OK\r\n", - "Length: 369696005 (353M) [binary/octet-stream]\r\n", - "Saving to: ‘v5-L6-D1024-E0_1-mem-ctx-8k.pth’\r\n", - "\r\n", - "\r", - " v5-L6-D10 0%[ ] 0 --.-KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D102 4%[ ] 15.26M 46.1MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D1024 8%[> ] 30.52M 54.1MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D1024- 12%[=> ] 45.78M 56.2MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D1024-E 17%[==> ] 61.03M 57.1MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D1024-E0 21%[===> ] 76.29M 55.7MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D1024-E0_ 25%[====> ] 91.55M 54.7MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D1024-E0_1 30%[=====> ] 106.81M 55.6MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D1024-E0_1- 34%[=====> ] 121.56M 55.5MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D1024-E0_1-m 38%[======> ] 135.50M 53.9MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-L6-D1024-E0_1-me 42%[=======> ] 151.33M 55.8MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-L6-D1024-E0_1-mem 43%[=======> ] 152.59M 50.9MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D1024-E0_1-mem- 47%[========> ] 167.85M 52.2MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D1024-E0_1-mem-c 50%[=========> ] 178.41M 52.2MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D1024-E0_1-mem-ct 56%[==========> ] 197.85M 52.5MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D1024-E0_1-mem-ctx 60%[===========> ] 211.79M 51.6MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D1024-E0_1-mem-ctx- 64%[===========> ] 228.36M 51.2MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1024-E0_1-mem-ctx-8 66%[============> ] 233.06M 46.8MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "024-E0_1-mem-ctx-8k 69%[============> ] 244.13M 46.8MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "24-E0_1-mem-ctx-8k. 73%[=============> ] 259.40M 47.5MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4-E0_1-mem-ctx-8k.p 77%[==============> ] 274.14M 45.4MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 77%[==============> ] 274.66M 44.1MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 82%[===============> ] 289.40M 43.7MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 86%[================> ] 304.40M 45.0MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 86%[================> ] 305.79M 43.9MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 90%[=================> ] 320.43M 44.2MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 95%[==================> ] 335.69M 43.9MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 99%[==================> ] 350.44M 46.2MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-L6-D1024-E0_1-me 100%[===================>] 352.57M 45.4MB/s in 7.4s \r\n", - "\r\n", - "2023-09-05 20:02:57 (47.6 MB/s) - ‘v5-L6-D1024-E0_1-mem-ctx-8k.pth’ saved [369696005/369696005]\r\n", - "\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "--2023-09-05 20:02:57-- https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/v5-L6-D2048-E0_1-mem-ctx-8k.pth\r\n", - "Resolving huggingface.co (huggingface.co)... 18.154.227.7, 18.154.227.67, 18.154.227.87, ...\r\n", - "Connecting to huggingface.co (huggingface.co)|18.154.227.7|:443... connected.\r\n", - "HTTP request sent, awaiting response... 302 Found\r\n", - "Location: https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/87b64f45529c2049a8b044b7e7c0338a9ede8ba8259d17d987d8e73f8a34fd75?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D2048-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D2048-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203377&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzM3N319LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwLzg3YjY0ZjQ1NTI5YzIwNDlhOGIwNDRiN2U3YzAzMzhhOWVkZThiYTgyNTlkMTdkOTg3ZDhlNzNmOGEzNGZkNzU%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=VBYbW8z%7E9JBNguL51PviRfIlJ54YdlKEx91Ga02bS1bpaMTycJmWk-xv5BrCaiZzsDoosmbz7lPmOAAXRwEaLLn%7EpoS9cb5XHy3KTfp8ndxX7bqjKg3SYSf9P9po2RrS-50MBgszD2UFbjP7RWDf6GDRX7NHvHRXrKQ9DajMDZXByKypfrrMreWxQcsgaqJGEzco-tJYdyQO1JsjD8tTHFTQQd2R3DeHLlV1k8vAoxSg%7EkHse1nL4%7Ej68Z84lamLLL4rrO6qn2Lmh5KwDlTa76KCe5nID22ULDapKaGQr2grYb7qVEYGfXbHjoOxT63Ma82a6NWGRLMTR24M89v9Hg__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", - "--2023-09-05 20:02:57-- https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/87b64f45529c2049a8b044b7e7c0338a9ede8ba8259d17d987d8e73f8a34fd75?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D2048-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D2048-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203377&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzM3N319LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwLzg3YjY0ZjQ1NTI5YzIwNDlhOGIwNDRiN2U3YzAzMzhhOWVkZThiYTgyNTlkMTdkOTg3ZDhlNzNmOGEzNGZkNzU%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=VBYbW8z%7E9JBNguL51PviRfIlJ54YdlKEx91Ga02bS1bpaMTycJmWk-xv5BrCaiZzsDoosmbz7lPmOAAXRwEaLLn%7EpoS9cb5XHy3KTfp8ndxX7bqjKg3SYSf9P9po2RrS-50MBgszD2UFbjP7RWDf6GDRX7NHvHRXrKQ9DajMDZXByKypfrrMreWxQcsgaqJGEzco-tJYdyQO1JsjD8tTHFTQQd2R3DeHLlV1k8vAoxSg%7EkHse1nL4%7Ej68Z84lamLLL4rrO6qn2Lmh5KwDlTa76KCe5nID22ULDapKaGQr2grYb7qVEYGfXbHjoOxT63Ma82a6NWGRLMTR24M89v9Hg__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", - "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.121, 108.138.64.111, 108.138.64.49, ...\r\n", - "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.121|:443... connected.\r\n", - "HTTP request sent, awaiting response... " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "200 OK\r\n", - "Length: 1066508293 (1017M) [binary/octet-stream]\r\n", - "Saving to: ‘v5-L6-D2048-E0_1-mem-ctx-8k.pth’\r\n", - "\r\n", - "\r", - " v5-L6-D20 0%[ ] 0 --.-KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D204 1%[ ] 13.43M 64.2MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048 2%[ ] 25.33M 61.9MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048- 3%[ ] 30.52M 44.1MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048-E 4%[ ] 45.78M 44.3MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048-E0 5%[> ] 60.75M 49.3MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048-E0_ 6%[> ] 61.03M 42.1MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048-E0_1 7%[> ] 76.29M 43.8MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048-E0_1- 8%[> ] 89.73M 42.1MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048-E0_1-m 10%[=> ] 101.80M 43.4MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-L6-D2048-E0_1-me 10%[=> ] 107.72M 42.3MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-L6-D2048-E0_1-mem 11%[=> ] 121.56M 43.4MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D2048-E0_1-mem- 12%[=> ] 122.16M 40.7MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D2048-E0_1-mem-c 13%[=> ] 136.81M 41.9MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D2048-E0_1-mem-ct 14%[=> ] 150.76M 40.9MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D2048-E0_1-mem-ctx 16%[==> ] 165.33M 42.5MB/s eta 22s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D2048-E0_1-mem-ctx- 16%[==> ] 167.85M 39.9MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2048-E0_1-mem-ctx-8 18%[==> ] 183.10M 39.5MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "048-E0_1-mem-ctx-8k 19%[==> ] 198.36M 39.8MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "48-E0_1-mem-ctx-8k. 20%[===> ] 213.11M 42.3MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8-E0_1-mem-ctx-8k.p 21%[===> ] 219.93M 40.2MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 23%[===> ] 241.44M 44.2MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 24%[===> ] 244.13M 41.1MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 25%[====> ] 259.40M 43.1MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 27%[====> ] 274.66M 44.2MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 28%[====> ] 289.40M 44.4MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 28%[====> ] 289.92M 41.9MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 29%[====> ] 304.66M 44.7MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 30%[=====> ] 305.30M 41.8MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 31%[=====> ] 320.43M 42.4MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 32%[=====> ] 335.18M 42.2MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 33%[=====> ] 341.75M 43.2MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 34%[=====> ] 350.95M 40.9MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 36%[======> ] 366.20M 41.3MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 37%[======> ] 380.96M 41.4MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 38%[======> ] 394.91M 41.0MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 40%[=======> ] 410.16M 40.6MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 40%[=======> ] 411.99M 37.7MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 41%[=======> ] 426.73M 40.1MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 42%[=======> ] 429.87M 36.9MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 43%[=======> ] 441.98M 37.4MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 44%[=======> ] 451.07M 39.7MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 45%[========> ] 457.76M 37.2MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 46%[========> ] 473.02M 40.3MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 48%[========> ] 488.28M 41.4MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L 49%[========> ] 503.03M 41.6MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6 50%[=========> ] 516.97M 43.5MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6- 52%[=========> ] 533.54M 44.0MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D 53%[=========> ] 548.80M 44.6MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2 55%[==========> ] 559.55M 43.8MB/s eta 12s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D20 55%[==========> ] 564.58M 42.1MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D204 57%[==========> ] 579.83M 42.9MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048 57%[==========> ] 585.02M 41.6MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048- 58%[==========> ] 595.09M 42.7MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048-E 60%[===========> ] 610.35M 42.0MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048-E0 61%[===========> ] 625.61M 45.2MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048-E0_ 63%[===========> ] 640.87M 45.4MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048-E0_1 63%[===========> ] 647.18M 46.0MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048-E0_1- 64%[===========> ] 655.62M 43.9MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D2048-E0_1-m 64%[===========> ] 656.34M 41.0MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-L6-D2048-E0_1-me 65%[============> ] 669.55M 43.4MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-L6-D2048-E0_1-mem 67%[============> ] 684.58M 44.3MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D2048-E0_1-mem- 67%[============> ] 686.77M 41.8MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D2048-E0_1-mem-c 69%[============> ] 701.90M 42.6MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D2048-E0_1-mem-ct 70%[=============> ] 717.16M 43.7MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D2048-E0_1-mem-ctx 72%[=============> ] 732.42M 44.5MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D2048-E0_1-mem-ctx- 73%[=============> ] 747.69M 42.8MB/s eta 8s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "2048-E0_1-mem-ctx-8 74%[=============> ] 762.42M 44.6MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "048-E0_1-mem-ctx-8k 76%[==============> ] 774.55M 44.9MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "48-E0_1-mem-ctx-8k. 76%[==============> ] 778.20M 43.6MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8-E0_1-mem-ctx-8k.p 78%[==============> ] 793.46M 43.0MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 79%[==============> ] 808.71M 45.2MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 80%[===============> ] 823.46M 43.2MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 81%[===============> ] 824.22M 40.6MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 82%[===============> ] 839.23M 41.4MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 84%[===============> ] 854.49M 42.6MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 85%[================> ] 869.75M 45.3MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 87%[================> ] 885.01M 44.5MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 87%[================> ] 892.69M 43.8MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 88%[================> ] 900.27M 42.5MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 90%[=================> ] 915.53M 42.7MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 91%[=================> ] 930.78M 42.2MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 93%[=================> ] 946.04M 43.3MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 94%[=================> ] 961.30M 43.7MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 96%[==================> ] 976.55M 45.9MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 97%[==================> ] 991.31M 44.9MB/s eta 2s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 97%[==================> ] 993.88M 43.3MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 99%[==================> ] 1007M 43.3MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 99%[==================> ] 1016M 42.5MB/s eta 1s \r", - "v5-L6-D2048-E0_1-me 100%[===================>] 1017M 42.8MB/s in 24s \r\n", - "\r\n", - "2023-09-05 20:03:21 (42.8 MB/s) - ‘v5-L6-D2048-E0_1-mem-ctx-8k.pth’ saved [1066508293/1066508293]\r\n", - "\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "--2023-09-05 20:03:22-- https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/v5-L6-D4096-E0_1-mem-ctx-8k.pth\r\n", - "Resolving huggingface.co (huggingface.co)... 18.154.227.69, 18.154.227.7, 18.154.227.67, ...\r\n", - "Connecting to huggingface.co (huggingface.co)|18.154.227.69|:443... connected.\r\n", - "HTTP request sent, awaiting response... 302 Found\r\n", - "Location: https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/5f93b1f6f6f7fb2193130a3a51f8ed41a0541b1b5eab100ca9318c8218d481fa?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D4096-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D4096-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203402&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzQwMn19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwLzVmOTNiMWY2ZjZmN2ZiMjE5MzEzMGEzYTUxZjhlZDQxYTA1NDFiMWI1ZWFiMTAwY2E5MzE4YzgyMThkNDgxZmE%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=kCsh5tzkI71pVRmfZsPhC0oiMlNdvC32eUOBVomz04o7staDhD2mIy6e9QqNHRsXMGyb1w1x8zQwRSuXSfWfo1LvvIkiIevIPEm6FGcRQhtkf9erytEqdKZatuYT-PBOlLBy%7EDrXG96JnUuXbDo9CTezywZTuYWQImQgZL2u5J3qHyUHcUbMiM8UwyVky4zy8XyGHBFFSvmIh3OygZOTofjkBuVZU78x0lbd-5xkf-UGRfm9bQLyHilkPWhulkTXE2M8XUYTbfJEfrwUyZi94%7EqXEqn7kX37bkywoVTOgmO-yBTF0R6uFjbm3r8lz7fM7Ww5wrblit2Clim6TTprww__&Key-Pair-Id=KVTP0A1DKRTAX [following]\r\n", - "--2023-09-05 20:03:22-- https://cdn-lfs.huggingface.co/repos/69/e5/69e55a6299441d3070ee1690632f8d12440ea004de9c6a51b873ccd49ea78ea0/5f93b1f6f6f7fb2193130a3a51f8ed41a0541b1b5eab100ca9318c8218d481fa?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27v5-L6-D4096-E0_1-mem-ctx-8k.pth%3B+filename%3D%22v5-L6-D4096-E0_1-mem-ctx-8k.pth%22%3B&Expires=1694203402&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NDIwMzQwMn19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy82OS9lNS82OWU1NWE2Mjk5NDQxZDMwNzBlZTE2OTA2MzJmOGQxMjQ0MGVhMDA0ZGU5YzZhNTFiODczY2NkNDllYTc4ZWEwLzVmOTNiMWY2ZjZmN2ZiMjE5MzEzMGEzYTUxZjhlZDQxYTA1NDFiMWI1ZWFiMTAwY2E5MzE4YzgyMThkNDgxZmE%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=kCsh5tzkI71pVRmfZsPhC0oiMlNdvC32eUOBVomz04o7staDhD2mIy6e9QqNHRsXMGyb1w1x8zQwRSuXSfWfo1LvvIkiIevIPEm6FGcRQhtkf9erytEqdKZatuYT-PBOlLBy%7EDrXG96JnUuXbDo9CTezywZTuYWQImQgZL2u5J3qHyUHcUbMiM8UwyVky4zy8XyGHBFFSvmIh3OygZOTofjkBuVZU78x0lbd-5xkf-UGRfm9bQLyHilkPWhulkTXE2M8XUYTbfJEfrwUyZi94%7EqXEqn7kX37bkywoVTOgmO-yBTF0R6uFjbm3r8lz7fM7Ww5wrblit2Clim6TTprww__&Key-Pair-Id=KVTP0A1DKRTAX\r\n", - "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.138.64.36, 108.138.64.49, 108.138.64.111, ...\r\n", - "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.138.64.36|:443... connected.\r\n", - "HTTP request sent, awaiting response... " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "200 OK\r\n", - "Length: 3441599237 (3.2G) [binary/octet-stream]\r\n", - "Saving to: ‘v5-L6-D4096-E0_1-mem-ctx-8k.pth’\r\n", - "\r\n", - "\r", - " v5-L6-D40 0%[ ] 0 --.-KB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D409 0%[ ] 13.43M 62.3MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096 0%[ ] 28.00M 67.3MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096- 0%[ ] 30.52M 42.9MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E 1%[ ] 45.78M 43.6MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0 1%[ ] 61.03M 43.9MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_ 2%[ ] 71.57M 45.0MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1 2%[ ] 85.74M 47.9MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1- 2%[ ] 91.55M 44.8MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1-m 3%[ ] 106.77M 47.6MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-L6-D4096-E0_1-me 3%[ ] 115.21M 47.2MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-L6-D4096-E0_1-mem 3%[ ] 120.25M 44.1MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 3%[ ] 129.42M 44.2MB/s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 4%[ ] 137.33M 41.8MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 4%[ ] 152.59M 42.4MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 5%[> ] 167.33M 43.6MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 5%[> ] 174.16M 42.9MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 5%[> ] 182.59M 42.8MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 5%[> ] 185.73M 41.5MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 6%[> ] 198.36M 40.7MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 6%[> ] 213.62M 41.7MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 6%[> ] 228.87M 42.3MB/s eta 75s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 7%[> ] 243.63M 43.6MB/s eta 70s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 7%[> ] 258.62M 46.3MB/s eta 70s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 7%[> ] 259.40M 41.1MB/s eta 70s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 8%[> ] 274.66M 40.4MB/s eta 70s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 8%[> ] 289.92M 42.5MB/s eta 69s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 9%[> ] 305.18M 43.4MB/s eta 69s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 9%[> ] 320.43M 43.6MB/s eta 69s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 10%[=> ] 335.69M 44.6MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 10%[=> ] 350.44M 43.4MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 10%[=> ] 359.99M 42.6MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 11%[=> ] 366.20M 42.2MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 11%[=> ] 381.47M 42.4MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 12%[=> ] 396.22M 43.9MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 12%[=> ] 396.73M 40.1MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 12%[=> ] 410.16M 42.8MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 13%[=> ] 426.73M 43.4MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 13%[=> ] 427.25M 40.1MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 13%[=> ] 441.98M 42.4MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 13%[=> ] 442.51M 39.2MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 13%[=> ] 457.24M 42.1MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 14%[=> ] 465.94M 41.5MB/s eta 68s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 14%[=> ] 482.89M 42.7MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 14%[=> ] 488.28M 38.8MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L 15%[==> ] 503.54M 41.0MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6 15%[==> ] 518.80M 41.1MB/s eta 65s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6- 16%[==> ] 534.05M 42.8MB/s eta 64s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D 16%[==> ] 548.80M 45.4MB/s eta 64s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4 16%[==> ] 557.75M 43.5MB/s eta 64s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D40 17%[==> ] 564.58M 43.4MB/s eta 64s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D409 17%[==> ] 579.31M 44.7MB/s eta 64s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096 17%[==> ] 582.81M 43.2MB/s eta 63s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096- 18%[==> ] 594.57M 44.6MB/s eta 63s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E 18%[==> ] 597.15M 41.9MB/s eta 63s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0 18%[==> ] 609.84M 41.8MB/s eta 63s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_ 18%[==> ] 615.55M 42.3MB/s eta 63s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1 19%[==> ] 625.61M 40.8MB/s eta 63s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1- 19%[==> ] 640.87M 42.8MB/s eta 63s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1-m 19%[==> ] 656.13M 39.5MB/s eta 62s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-L6-D4096-E0_1-me 20%[===> ] 670.87M 42.4MB/s eta 62s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-L6-D4096-E0_1-mem 20%[===> ] 671.38M 38.6MB/s eta 62s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 20%[===> ] 686.13M 39.8MB/s eta 62s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 21%[===> ] 700.08M 40.0MB/s eta 62s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 21%[===> ] 708.71M 38.7MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 21%[===> ] 717.16M 37.1MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 22%[===> ] 732.42M 37.2MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 22%[===> ] 747.69M 38.9MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 23%[===> ] 764.04M 40.8MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 23%[===> ] 777.68M 43.5MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 23%[===> ] 784.89M 41.8MB/s eta 61s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 24%[===> ] 793.46M 40.1MB/s eta 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 24%[===> ] 808.71M 42.5MB/s eta 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 25%[====> ] 823.97M 41.8MB/s eta 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 25%[====> ] 839.23M 45.2MB/s eta 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 26%[====> ] 854.49M 46.2MB/s eta 59s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 26%[====> ] 869.75M 48.8MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 26%[====> ] 885.47M 49.5MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 27%[====> ] 899.75M 48.8MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 27%[====> ] 900.27M 46.6MB/s eta 56s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 27%[====> ] 915.53M 47.1MB/s eta 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 28%[====> ] 930.78M 45.8MB/s eta 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 28%[====> ] 946.04M 48.0MB/s eta 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 29%[====> ] 961.30M 48.8MB/s eta 55s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 29%[====> ] 975.91M 48.0MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 29%[====> ] 976.05M 46.0MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 29%[====> ] 983.00M 46.1MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 30%[=====> ] 993.36M 48.3MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 30%[=====> ] 1007M 45.6MB/s eta 53s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 31%[=====> ] 1022M 44.8MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 31%[=====> ] 1.00G 43.5MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 31%[=====> ] 1.01G 40.3MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 32%[=====> ] 1.03G 42.6MB/s eta 52s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 32%[=====> ] 1.04G 41.7MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 32%[=====> ] 1.06G 42.3MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L 33%[=====> ] 1.07G 45.0MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6 33%[=====> ] 1.08G 43.0MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6- 33%[=====> ] 1.08G 43.7MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D 33%[=====> ] 1.09G 41.8MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4 33%[=====> ] 1.09G 37.4MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D40 34%[=====> ] 1.09G 36.0MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D409 34%[=====> ] 1.10G 37.4MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096 34%[=====> ] 1.11G 37.0MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096- 34%[=====> ] 1.12G 37.6MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E 35%[======> ] 1.12G 38.8MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0 35%[======> ] 1.13G 36.8MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_ 35%[======> ] 1.15G 36.2MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1 35%[======> ] 1.15G 35.6MB/s eta 51s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1- 36%[======> ] 1.16G 35.8MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1-m 36%[======> ] 1.18G 35.6MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-L6-D4096-E0_1-me 37%[======> ] 1.19G 36.5MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-L6-D4096-E0_1-mem 37%[======> ] 1.20G 34.6MB/s eta 50s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 37%[======> ] 1.20G 32.8MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 37%[======> ] 1.21G 31.2MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 37%[======> ] 1.21G 30.9MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 38%[======> ] 1.22G 32.1MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 38%[======> ] 1.24G 35.1MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 39%[======> ] 1.25G 36.4MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 39%[======> ] 1.26G 36.2MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 39%[======> ] 1.27G 34.4MB/s eta 49s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 39%[======> ] 1.28G 35.1MB/s eta 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 40%[=======> ] 1.30G 36.5MB/s eta 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 40%[=======> ] 1.31G 36.8MB/s eta 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 41%[=======> ] 1.33G 37.7MB/s eta 48s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 41%[=======> ] 1.34G 40.4MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 41%[=======> ] 1.34G 38.4MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 42%[=======> ] 1.36G 38.0MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 42%[=======> ] 1.37G 40.6MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 43%[=======> ] 1.38G 41.0MB/s eta 46s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 43%[=======> ] 1.38G 40.6MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 43%[=======> ] 1.39G 39.5MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 43%[=======> ] 1.40G 39.8MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 44%[=======> ] 1.41G 41.9MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 44%[=======> ] 1.42G 40.2MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 44%[=======> ] 1.43G 41.6MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 45%[========> ] 1.44G 42.3MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 45%[========> ] 1.45G 43.1MB/s eta 45s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 45%[========> ] 1.46G 42.1MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 46%[========> ] 1.47G 40.9MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 46%[========> ] 1.49G 41.6MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 46%[========> ] 1.50G 44.1MB/s eta 43s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 47%[========> ] 1.52G 44.3MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 47%[========> ] 1.52G 41.0MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 47%[========> ] 1.53G 38.9MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 48%[========> ] 1.55G 40.5MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L 48%[========> ] 1.55G 40.3MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6 48%[========> ] 1.56G 40.4MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6- 49%[========> ] 1.57G 42.1MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D 49%[========> ] 1.58G 39.5MB/s eta 41s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4 49%[========> ] 1.59G 41.8MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D40 50%[=========> ] 1.61G 41.3MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D409 50%[=========> ] 1.62G 43.3MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096 50%[=========> ] 1.62G 41.8MB/s eta 40s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096- 51%[=========> ] 1.64G 41.1MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E 51%[=========> ] 1.65G 40.7MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0 51%[=========> ] 1.65G 40.6MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_ 51%[=========> ] 1.66G 40.7MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1 52%[=========> ] 1.67G 39.4MB/s eta 39s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1- 52%[=========> ] 1.69G 41.3MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1-m 52%[=========> ] 1.70G 38.2MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-L6-D4096-E0_1-me 53%[=========> ] 1.71G 41.2MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-L6-D4096-E0_1-mem 53%[=========> ] 1.73G 39.5MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 54%[=========> ] 1.74G 41.7MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 54%[=========> ] 1.76G 42.1MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 55%[==========> ] 1.77G 44.3MB/s eta 37s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 55%[==========> ] 1.79G 45.5MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 56%[==========> ] 1.80G 46.7MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 56%[==========> ] 1.80G 44.7MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 56%[==========> ] 1.82G 44.8MB/s eta 35s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 57%[==========> ] 1.83G 45.5MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 57%[==========> ] 1.85G 47.3MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 58%[==========> ] 1.86G 47.2MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 58%[==========> ] 1.88G 47.7MB/s eta 34s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 58%[==========> ] 1.88G 48.2MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 59%[==========> ] 1.89G 47.2MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 59%[==========> ] 1.90G 47.3MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 59%[==========> ] 1.91G 45.4MB/s eta 33s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 59%[==========> ] 1.92G 46.5MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 60%[===========> ] 1.94G 45.2MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 60%[===========> ] 1.95G 44.7MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 61%[===========> ] 1.96G 45.6MB/s eta 31s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 61%[===========> ] 1.97G 43.7MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 61%[===========> ] 1.98G 42.8MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 62%[===========> ] 2.00G 45.3MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 62%[===========> ] 2.01G 45.1MB/s eta 30s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 62%[===========> ] 2.01G 43.6MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 63%[===========> ] 2.03G 45.2MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 63%[===========> ] 2.04G 43.8MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 63%[===========> ] 2.04G 43.4MB/s eta 29s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 64%[===========> ] 2.06G 43.6MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 64%[===========> ] 2.06G 40.5MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 64%[===========> ] 2.07G 40.8MB/s eta 28s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 65%[============> ] 2.09G 42.1MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 65%[============> ] 2.10G 43.8MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 65%[============> ] 2.11G 43.3MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L 66%[============> ] 2.12G 41.7MB/s eta 27s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6 66%[============> ] 2.13G 39.8MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6- 66%[============> ] 2.15G 41.2MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D 67%[============> ] 2.16G 41.3MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4 67%[============> ] 2.16G 38.0MB/s eta 26s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D40 67%[============> ] 2.17G 39.9MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D409 67%[============> ] 2.17G 37.1MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096 68%[============> ] 2.19G 40.4MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096- 68%[============> ] 2.20G 39.8MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E 68%[============> ] 2.21G 38.9MB/s eta 25s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0 69%[============> ] 2.21G 37.6MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_ 69%[============> ] 2.22G 38.7MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1 69%[============> ] 2.23G 39.7MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1- 70%[=============> ] 2.25G 39.6MB/s eta 24s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1-m 70%[=============> ] 2.26G 41.4MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-L6-D4096-E0_1-me 70%[=============> ] 2.27G 38.7MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-L6-D4096-E0_1-mem 70%[=============> ] 2.27G 39.1MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 70%[=============> ] 2.27G 36.0MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 71%[=============> ] 2.28G 34.9MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 71%[=============> ] 2.28G 35.7MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 71%[=============> ] 2.29G 35.5MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 72%[=============> ] 2.31G 35.1MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 72%[=============> ] 2.32G 37.5MB/s eta 23s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 72%[=============> ] 2.34G 38.4MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 73%[=============> ] 2.35G 37.5MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 73%[=============> ] 2.35G 34.7MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 73%[=============> ] 2.37G 37.5MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 73%[=============> ] 2.37G 36.1MB/s eta 21s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 74%[=============> ] 2.38G 37.7MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 74%[=============> ] 2.38G 37.2MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 74%[=============> ] 2.39G 36.3MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 74%[=============> ] 2.40G 35.1MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 75%[==============> ] 2.41G 33.7MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 75%[==============> ] 2.41G 33.1MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 76%[==============> ] 2.44G 37.2MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 76%[==============> ] 2.46G 39.9MB/s eta 20s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 76%[==============> ] 2.46G 40.2MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 77%[==============> ] 2.47G 39.3MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 77%[==============> ] 2.49G 39.9MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 77%[==============> ] 2.49G 38.9MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 77%[==============> ] 2.50G 35.8MB/s eta 19s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 78%[==============> ] 2.50G 37.2MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 78%[==============> ] 2.51G 38.4MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 78%[==============> ] 2.52G 36.4MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 78%[==============> ] 2.53G 39.8MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 79%[==============> ] 2.53G 37.3MB/s eta 17s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 79%[==============> ] 2.55G 41.2MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 79%[==============> ] 2.56G 42.5MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 80%[===============> ] 2.58G 42.3MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 80%[===============> ] 2.59G 44.0MB/s eta 16s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L 80%[===============> ] 2.59G 44.4MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6 81%[===============> ] 2.60G 42.2MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6- 81%[===============> ] 2.61G 40.7MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D 81%[===============> ] 2.62G 40.1MB/s eta 15s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4 82%[===============> ] 2.64G 42.8MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D40 82%[===============> ] 2.65G 44.0MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D409 83%[===============> ] 2.67G 45.4MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096 83%[===============> ] 2.68G 46.1MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096- 84%[===============> ] 2.70G 47.0MB/s eta 14s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E 84%[===============> ] 2.70G 45.7MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0 84%[===============> ] 2.71G 47.0MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_ 85%[================> ] 2.72G 48.7MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1 85%[================> ] 2.73G 47.7MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1- 85%[================> ] 2.74G 47.2MB/s eta 13s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D4096-E0_1-m 85%[================> ] 2.76G 47.5MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-L6-D4096-E0_1-me 86%[================> ] 2.77G 47.3MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "5-L6-D4096-E0_1-mem 86%[================> ] 2.79G 48.7MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-L6-D4096-E0_1-mem- 87%[================> ] 2.80G 48.9MB/s eta 11s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "L6-D4096-E0_1-mem-c 87%[================> ] 2.80G 47.7MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-D4096-E0_1-mem-ct 87%[================> ] 2.82G 48.5MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-D4096-E0_1-mem-ctx 88%[================> ] 2.83G 49.5MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "D4096-E0_1-mem-ctx- 88%[================> ] 2.84G 48.0MB/s eta 10s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "4096-E0_1-mem-ctx-8 89%[================> ] 2.86G 44.8MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "096-E0_1-mem-ctx-8k 89%[================> ] 2.86G 44.1MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "96-E0_1-mem-ctx-8k. 89%[================> ] 2.88G 44.7MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "6-E0_1-mem-ctx-8k.p 90%[=================> ] 2.89G 44.2MB/s eta 9s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-E0_1-mem-ctx-8k.pt 90%[=================> ] 2.91G 45.9MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "E0_1-mem-ctx-8k.pth 91%[=================> ] 2.92G 47.9MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "0_1-mem-ctx-8k.pth 91%[=================> ] 2.93G 48.7MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "_1-mem-ctx-8k.pth 91%[=================> ] 2.95G 48.0MB/s eta 7s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "1-mem-ctx-8k.pth 92%[=================> ] 2.95G 41.6MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-mem-ctx-8k.pth 92%[=================> ] 2.96G 43.9MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "mem-ctx-8k.pth 92%[=================> ] 2.98G 45.1MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "em-ctx-8k.pth 92%[=================> ] 2.98G 40.2MB/s eta 6s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "m-ctx-8k.pth 93%[=================> ] 2.99G 41.2MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-ctx-8k.pth 93%[=================> ] 3.00G 40.6MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "ctx-8k.pth 93%[=================> ] 3.01G 39.8MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "tx-8k.pth 94%[=================> ] 3.02G 42.2MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "x-8k.pth 94%[=================> ] 3.03G 41.7MB/s eta 5s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "-8k.pth 95%[==================> ] 3.05G 45.1MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "8k.pth 95%[==================> ] 3.05G 43.7MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "k.pth 95%[==================> ] 3.07G 43.3MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - ".pth 96%[==================> ] 3.08G 44.7MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "pth 96%[==================> ] 3.09G 43.9MB/s eta 4s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "th 96%[==================> ] 3.10G 44.3MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "h 97%[==================> ] 3.11G 42.7MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " 97%[==================> ] 3.13G 42.3MB/s eta 3s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v 98%[==================> ] 3.14G 42.7MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5 98%[==================> ] 3.16G 45.0MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5- 98%[==================> ] 3.16G 42.3MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L 99%[==================> ] 3.17G 46.3MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6 99%[==================> ] 3.18G 44.5MB/s eta 1s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6- 99%[==================> ] 3.19G 44.6MB/s eta 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - " v5-L6-D 99%[==================> ] 3.20G 46.1MB/s eta 0s " - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\r", - "v5-L6-D4096-E0_1-me 100%[===================>] 3.21G 45.1MB/s in 78s \r\n", - "\r\n", - "2023-09-05 20:04:40 (41.9 MB/s) - ‘v5-L6-D4096-E0_1-mem-ctx-8k.pth’ saved [3441599237/3441599237]\r\n", - "\r\n" - ] - } - ], - "source": [ - "# Lets download the custom models\n", - "!mkdir -p ../../../model/\n", - "!cd ../../../model/ && wget -nc \"https://huggingface.co/picocreator/memory-size-experiment-for-rwkv/resolve/main/RWKV-v5-baseline/BaseV5-C-Tune5.pth\"\n", - "!cd ../../../model/ && wget -nc \"https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/EWR-1B5-E0_1-mem-ctx-8k.pth\"\n", - "!cd ../../../model/ && wget -nc \"https://huggingface.co/rwkv-x-dev/rwkv-x-playground/resolve/main/experiment/rwkv-x-exp/v5-slim-memory/v5-L6-D1024-E0_1-mem-ctx-8k.pth\"\n", - "!cd ../../../model/ && wget -nc \"https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/v5-L6-D2048-E0_1-mem-ctx-8k.pth\"\n", - "!cd ../../../model/ && wget -nc \"https://huggingface.co/picocreator/RWKV-x-playground/resolve/main/V5-16k/v5-L6-D4096-E0_1-mem-ctx-8k.pth\"" - ] - }, - { - "cell_type": "code", - "execution_count": 2, - "id": "c1d4920e", - "metadata": { - "execution": { - "iopub.execute_input": "2023-09-05T20:04:41.200276Z", - "iopub.status.busy": "2023-09-05T20:04:41.199672Z", - "iopub.status.idle": "2023-09-05T20:04:41.455126Z", - "shell.execute_reply": "2023-09-05T20:04:41.454090Z" - }, - "papermill": { - "duration": 0.340242, - "end_time": "2023-09-05T20:04:41.457583", - "exception": false, - "start_time": "2023-09-05T20:04:41.117341", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "total 16G\r\n", - "-rw-r--r-- 1 root root 5.7G Aug 11 12:48 BaseV5-C-Tune5.pth\r\n", - "-rw-r--r-- 1 root root 5.7G Aug 17 14:38 EWR-1B5-E0_1-mem-ctx-8k.pth\r\n", - "-rw-r--r-- 1 root root 353M Sep 5 14:40 v5-L6-D1024-E0_1-mem-ctx-8k.pth\r\n", - "-rw-r--r-- 1 root root 1018M Aug 19 08:33 v5-L6-D2048-E0_1-mem-ctx-8k.pth\r\n", - "-rw-r--r-- 1 root root 3.3G Aug 20 14:58 v5-L6-D4096-E0_1-mem-ctx-8k.pth\r\n" - ] - } - ], - "source": [ - "!ls -lh ../../../model/" - ] - }, - { - "cell_type": "code", - "execution_count": 3, - "id": "836e432a", - "metadata": { - "execution": { - "iopub.execute_input": "2023-09-05T20:04:41.617951Z", - "iopub.status.busy": "2023-09-05T20:04:41.617377Z", - "iopub.status.idle": "2023-09-05T20:04:44.887019Z", - "shell.execute_reply": "2023-09-05T20:04:44.885854Z" - }, - "papermill": { - "duration": 3.352332, - "end_time": "2023-09-05T20:04:44.889387", - "exception": false, - "start_time": "2023-09-05T20:04:41.537055", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Requirement already satisfied: aiocsv in /usr/local/lib/python3.10/dist-packages (1.2.4)\r\n", - "Requirement already satisfied: aiofiles in /usr/local/lib/python3.10/dist-packages (23.2.1)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\u001b[33mWARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\u001b[0m\u001b[33m\r\n", - "\u001b[0m" - ] - } - ], - "source": [ - "!python3 -m pip install aiocsv aiofiles" - ] - }, - { - "cell_type": "markdown", - "id": "2e58126b", - "metadata": { - "papermill": { - "duration": 0.079405, - "end_time": "2023-09-05T20:04:45.048270", - "exception": false, - "start_time": "2023-09-05T20:04:44.968865", - "status": "completed" - }, - "tags": [] - }, - "source": [ - "# 1B5 V5 benchmark" - ] - }, - { - "cell_type": "code", - "execution_count": 4, - "id": "ac23fcab", - "metadata": { - "execution": { - "iopub.execute_input": "2023-09-05T20:04:45.210262Z", - "iopub.status.busy": "2023-09-05T20:04:45.209384Z", - "iopub.status.idle": "2023-09-05T20:06:04.241980Z", - "shell.execute_reply": "2023-09-05T20:06:04.240702Z" - }, - "papermill": { - "duration": 79.11701, - "end_time": "2023-09-05T20:06:04.244895", - "exception": false, - "start_time": "2023-09-05T20:04:45.127885", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-09-05 20:04:49,621] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation start ###\r\n", - "###\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5 tokens : 100.0% similarity, with 5 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10 tokens : 100.0% similarity, with 10 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15 tokens : 100.0% similarity, with 15 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 20 tokens : 100.0% similarity, with 20 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 25 tokens : 100.0% similarity, with 25 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 30 tokens : 100.0% similarity, with 30 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 35 tokens : 100.0% similarity, with 35 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 40 tokens : 100.0% similarity, with 40 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 45 tokens : 100.0% similarity, with 45 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 50 tokens : 100.0% similarity, with 50 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 55 tokens : 100.0% similarity, with 55 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 60 tokens : 100.0% similarity, with 60 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 65 tokens : 100.0% similarity, with 65 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 70 tokens : 100.0% similarity, with 70 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 75 tokens : 100.0% similarity, with 75 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 80 tokens : 100.0% similarity, with 80 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 85 tokens : 100.0% similarity, with 85 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 90 tokens : 100.0% similarity, with 90 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 95 tokens : 100.0% similarity, with 95 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 100 tokens : 100.0% similarity, with 100 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 105 tokens : 100.0% similarity, with 105 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 110 tokens : 100.0% similarity, with 110 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 115 tokens : 100.0% similarity, with 115 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 120 tokens : 100.0% similarity, with 120 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 125 tokens : 100.0% similarity, with 125 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 130 tokens : 100.0% similarity, with 130 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 135 tokens : 100.0% similarity, with 135 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 140 tokens : 100.0% similarity, with 140 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 145 tokens : 100.0% similarity, with 145 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 150 tokens : 100.0% similarity, with 150 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 160 tokens : 100.0% similarity, with 160 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 170 tokens : 100.0% similarity, with 170 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 180 tokens : 100.0% similarity, with 180 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 190 tokens : 99.47368421052632% similarity, with 189 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 200 tokens : 100.0% similarity, with 200 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 210 tokens : 100.0% similarity, with 210 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 220 tokens : 100.0% similarity, with 220 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 230 tokens : 100.0% similarity, with 230 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 240 tokens : 100.0% similarity, with 240 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 250 tokens : 100.0% similarity, with 250 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 260 tokens : 100.0% similarity, with 260 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 270 tokens : 100.0% similarity, with 270 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 280 tokens : 99.64285714285714% similarity, with 279 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 290 tokens : 100.0% similarity, with 290 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 300 tokens : 99.66666666666667% similarity, with 299 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 325 tokens : 100.0% similarity, with 325 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 350 tokens : 100.0% similarity, with 350 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 375 tokens : 99.46666666666667% similarity, with 373 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 400 tokens : 99.75% similarity, with 399 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 425 tokens : 99.76470588235294% similarity, with 424 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 450 tokens : 99.55555555555556% similarity, with 448 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 475 tokens : 99.36842105263159% similarity, with 472 matched token, and 3 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 500 tokens : 99.6% similarity, with 498 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 525 tokens : 99.61904761904762% similarity, with 523 matched token, and 2 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 550 tokens : 99.27272727272727% similarity, with 546 matched token, and 4 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 575 tokens : 99.30434782608695% similarity, with 571 matched token, and 4 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 600 tokens : 99.33333333333333% similarity, with 596 matched token, and 4 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 625 tokens : 99.03999999999999% similarity, with 619 matched token, and 6 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 650 tokens : 99.07692307692308% similarity, with 644 matched token, and 6 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 675 tokens : 99.11111111111111% similarity, with 669 matched token, and 6 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 700 tokens : 99.0% similarity, with 693 matched token, and 7 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 750 tokens : 99.06666666666666% similarity, with 743 matched token, and 7 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 800 tokens : 99.0% similarity, with 792 matched token, and 8 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 850 tokens : 99.05882352941177% similarity, with 842 matched token, and 8 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 900 tokens : 99.0% similarity, with 891 matched token, and 9 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 950 tokens : 99.1578947368421% similarity, with 942 matched token, and 8 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1000 tokens : 99.2% similarity, with 992 matched token, and 8 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Finished baseline model to eval output predictive matching (aka 0 memory?), for 1000 tokens\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation end ###\r\n", - "###\r\n" - ] - } - ], - "source": [ - "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/BaseV5-C-Tune5.pth\" \"./logs/BaseV5-C-Tune5-1k.csv\"" - ] - }, - { - "cell_type": "code", - "execution_count": 5, - "id": "534dc178", - "metadata": { - "execution": { - "iopub.execute_input": "2023-09-05T20:06:04.432032Z", - "iopub.status.busy": "2023-09-05T20:06:04.431202Z", - "iopub.status.idle": "2023-09-05T20:10:29.967568Z", - "shell.execute_reply": "2023-09-05T20:10:29.966188Z" - }, - "papermill": { - "duration": 265.629775, - "end_time": "2023-09-05T20:10:29.969793", - "exception": false, - "start_time": "2023-09-05T20:06:04.340018", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-09-05 20:06:08,978] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation start ###\r\n", - "###\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1100 tokens : 98.63636363636363% similarity, with 1085 matched token, and 15 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1150 tokens : 98.52173913043478% similarity, with 1133 matched token, and 17 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1200 tokens : 98.75% similarity, with 1185 matched token, and 15 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1250 tokens : 98.72% similarity, with 1234 matched token, and 16 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1300 tokens : 98.61538461538461% similarity, with 1282 matched token, and 18 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1350 tokens : 98.44444444444444% similarity, with 1329 matched token, and 21 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1400 tokens : 98.5% similarity, with 1379 matched token, and 21 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1450 tokens : 98.20689655172414% similarity, with 1424 matched token, and 26 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1500 tokens : 97.86666666666667% similarity, with 1468 matched token, and 32 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1550 tokens : 97.67741935483872% similarity, with 1514 matched token, and 36 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1600 tokens : 97.8125% similarity, with 1565 matched token, and 35 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1650 tokens : 97.57575757575758% similarity, with 1610 matched token, and 40 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1700 tokens : 97.6470588235294% similarity, with 1660 matched token, and 40 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1750 tokens : 97.94285714285714% similarity, with 1714 matched token, and 36 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1800 tokens : 97.72222222222223% similarity, with 1759 matched token, and 41 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1850 tokens : 96.86486486486487% similarity, with 1792 matched token, and 58 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1900 tokens : 96.36842105263158% similarity, with 1831 matched token, and 69 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 1950 tokens : 95.17948717948718% similarity, with 1856 matched token, and 94 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2000 tokens : 94.75% similarity, with 1895 matched token, and 105 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2050 tokens : 93.26829268292684% similarity, with 1912 matched token, and 138 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2100 tokens : 91.33333333333333% similarity, with 1918 matched token, and 182 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2150 tokens : 90.09302325581395% similarity, with 1937 matched token, and 213 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2200 tokens : 88.77272727272727% similarity, with 1953 matched token, and 247 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2250 tokens : 86.53333333333333% similarity, with 1947 matched token, and 303 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2300 tokens : 84.78260869565217% similarity, with 1950 matched token, and 350 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2350 tokens : 82.08510638297872% similarity, with 1929 matched token, and 421 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2400 tokens : 80.625% similarity, with 1935 matched token, and 465 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2450 tokens : 78.61224489795919% similarity, with 1926 matched token, and 524 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2500 tokens : 77.08% similarity, with 1927 matched token, and 573 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2550 tokens : 75.29411764705883% similarity, with 1920 matched token, and 630 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2600 tokens : 73.88461538461539% similarity, with 1921 matched token, and 679 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2650 tokens : 72.75471698113208% similarity, with 1928 matched token, and 722 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2700 tokens : 71.4074074074074% similarity, with 1928 matched token, and 772 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2750 tokens : 70.10909090909091% similarity, with 1928 matched token, and 822 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2800 tokens : 68.85714285714286% similarity, with 1928 matched token, and 872 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2850 tokens : 67.89473684210526% similarity, with 1935 matched token, and 915 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2900 tokens : 66.6896551724138% similarity, with 1934 matched token, and 966 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 2950 tokens : 65.5593220338983% similarity, with 1934 matched token, and 1016 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3000 tokens : 64.36666666666667% similarity, with 1931 matched token, and 1069 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3050 tokens : 63.278688524590166% similarity, with 1930 matched token, and 1120 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3100 tokens : 62.096774193548384% similarity, with 1925 matched token, and 1175 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3150 tokens : 61.17460317460317% similarity, with 1927 matched token, and 1223 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3200 tokens : 60.21875% similarity, with 1927 matched token, and 1273 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3250 tokens : 59.199999999999996% similarity, with 1924 matched token, and 1326 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3300 tokens : 58.151515151515156% similarity, with 1919 matched token, and 1381 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3350 tokens : 57.16417910447761% similarity, with 1915 matched token, and 1435 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3400 tokens : 56.294117647058826% similarity, with 1914 matched token, and 1486 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3450 tokens : 55.362318840579704% similarity, with 1910 matched token, and 1540 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3500 tokens : 54.400000000000006% similarity, with 1904 matched token, and 1596 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3550 tokens : 53.5774647887324% similarity, with 1902 matched token, and 1648 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3600 tokens : 52.77777777777778% similarity, with 1900 matched token, and 1700 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3650 tokens : 51.89041095890411% similarity, with 1894 matched token, and 1756 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3700 tokens : 51.08108108108108% similarity, with 1890 matched token, and 1810 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3750 tokens : 50.160000000000004% similarity, with 1881 matched token, and 1869 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3800 tokens : 49.34210526315789% similarity, with 1875 matched token, and 1925 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3850 tokens : 48.51948051948052% similarity, with 1868 matched token, and 1982 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3900 tokens : 47.51282051282051% similarity, with 1853 matched token, and 2047 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 3950 tokens : 46.607594936708864% similarity, with 1841 matched token, and 2109 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4000 tokens : 45.574999999999996% similarity, with 1823 matched token, and 2177 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation end ###\r\n", - "###\r\n" - ] - } - ], - "source": [ - "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/BaseV5-C-Tune5.pth\" \"./logs/BaseV5-C-Tune5-4k.csv\" 1100 4000" - ] - }, - { - "cell_type": "code", - "execution_count": 6, - "id": "99f322eb", - "metadata": { - "execution": { - "iopub.execute_input": "2023-09-05T20:10:30.144675Z", - "iopub.status.busy": "2023-09-05T20:10:30.144153Z", - "iopub.status.idle": "2023-09-05T21:13:05.936146Z", - "shell.execute_reply": "2023-09-05T21:13:05.934942Z" - }, - "papermill": { - "duration": 3755.883001, - "end_time": "2023-09-05T21:13:05.938991", - "exception": false, - "start_time": "2023-09-05T20:10:30.055990", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-09-05 20:10:34,716] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation start ###\r\n", - "###\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4100 tokens : 44.0% similarity, with 1804 matched token, and 2296 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4200 tokens : 42.11904761904762% similarity, with 1769 matched token, and 2431 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4300 tokens : 40.27906976744186% similarity, with 1732 matched token, and 2568 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4400 tokens : 38.27272727272727% similarity, with 1684 matched token, and 2716 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4500 tokens : 35.8% similarity, with 1611 matched token, and 2889 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4600 tokens : 33.73913043478261% similarity, with 1552 matched token, and 3048 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4700 tokens : 31.06382978723404% similarity, with 1460 matched token, and 3240 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4800 tokens : 28.3125% similarity, with 1359 matched token, and 3441 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 4900 tokens : 25.857142857142858% similarity, with 1267 matched token, and 3633 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5000 tokens : 23.04% similarity, with 1152 matched token, and 3848 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5100 tokens : 20.764705882352942% similarity, with 1059 matched token, and 4041 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5200 tokens : 18.5% similarity, with 962 matched token, and 4238 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5300 tokens : 16.88679245283019% similarity, with 895 matched token, and 4405 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5400 tokens : 15.222222222222223% similarity, with 822 matched token, and 4578 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5500 tokens : 13.418181818181818% similarity, with 738 matched token, and 4762 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5600 tokens : 11.625% similarity, with 651 matched token, and 4949 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5700 tokens : 10.421052631578947% similarity, with 594 matched token, and 5106 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5800 tokens : 9.344827586206897% similarity, with 542 matched token, and 5258 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5900 tokens : 8.305084745762711% similarity, with 490 matched token, and 5410 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6000 tokens : 7.449999999999999% similarity, with 447 matched token, and 5553 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6100 tokens : 6.655737704918033% similarity, with 406 matched token, and 5694 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6200 tokens : 6.064516129032258% similarity, with 376 matched token, and 5824 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6300 tokens : 5.65079365079365% similarity, with 356 matched token, and 5944 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6400 tokens : 5.328125% similarity, with 341 matched token, and 6059 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6500 tokens : 4.984615384615385% similarity, with 324 matched token, and 6176 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6600 tokens : 4.6818181818181825% similarity, with 309 matched token, and 6291 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6700 tokens : 4.432835820895523% similarity, with 297 matched token, and 6403 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6800 tokens : 4.25% similarity, with 289 matched token, and 6511 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 6900 tokens : 4.08695652173913% similarity, with 282 matched token, and 6618 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7000 tokens : 4.0% similarity, with 280 matched token, and 6720 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7100 tokens : 3.943661971830986% similarity, with 280 matched token, and 6820 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7200 tokens : 3.75% similarity, with 270 matched token, and 6930 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7300 tokens : 3.767123287671233% similarity, with 275 matched token, and 7025 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7400 tokens : 3.689189189189189% similarity, with 273 matched token, and 7127 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7500 tokens : 3.64% similarity, with 273 matched token, and 7227 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7600 tokens : 3.578947368421052% similarity, with 272 matched token, and 7328 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7700 tokens : 3.5844155844155843% similarity, with 276 matched token, and 7424 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7800 tokens : 3.5641025641025643% similarity, with 278 matched token, and 7522 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 7900 tokens : 3.468354430379747% similarity, with 274 matched token, and 7626 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8000 tokens : 3.4250000000000003% similarity, with 274 matched token, and 7726 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8100 tokens : 3.432098765432099% similarity, with 278 matched token, and 7822 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8200 tokens : 3.414634146341464% similarity, with 280 matched token, and 7920 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8300 tokens : 3.36144578313253% similarity, with 279 matched token, and 8021 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8400 tokens : 3.3690476190476186% similarity, with 283 matched token, and 8117 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8500 tokens : 3.3411764705882354% similarity, with 284 matched token, and 8216 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8600 tokens : 3.3488372093023258% similarity, with 288 matched token, and 8312 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8700 tokens : 3.3678160919540225% similarity, with 293 matched token, and 8407 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8800 tokens : 3.3295454545454546% similarity, with 293 matched token, and 8507 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 8900 tokens : 3.348314606741573% similarity, with 298 matched token, and 8602 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9000 tokens : 3.3333333333333335% similarity, with 300 matched token, and 8700 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9100 tokens : 3.3406593406593412% similarity, with 304 matched token, and 8796 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9200 tokens : 3.3260869565217392% similarity, with 306 matched token, and 8894 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9300 tokens : 3.3010752688172045% similarity, with 307 matched token, and 8993 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9400 tokens : 3.2978723404255317% similarity, with 310 matched token, and 9090 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9500 tokens : 3.3157894736842106% similarity, with 315 matched token, and 9185 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9600 tokens : 3.3229166666666665% similarity, with 319 matched token, and 9281 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9700 tokens : 3.3195876288659796% similarity, with 322 matched token, and 9378 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9800 tokens : 3.316326530612245% similarity, with 325 matched token, and 9475 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 9900 tokens : 3.3333333333333335% similarity, with 330 matched token, and 9570 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10000 tokens : 3.37% similarity, with 337 matched token, and 9663 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10100 tokens : 3.3861386138613865% similarity, with 342 matched token, and 9758 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10200 tokens : 3.3725490196078427% similarity, with 344 matched token, and 9856 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10300 tokens : 3.349514563106796% similarity, with 345 matched token, and 9955 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10400 tokens : 3.355769230769231% similarity, with 349 matched token, and 10051 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10500 tokens : 3.371428571428572% similarity, with 354 matched token, and 10146 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10600 tokens : 3.3584905660377355% similarity, with 356 matched token, and 10244 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10700 tokens : 3.392523364485981% similarity, with 363 matched token, and 10337 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10800 tokens : 3.4074074074074074% similarity, with 368 matched token, and 10432 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10900 tokens : 3.3853211009174315% similarity, with 369 matched token, and 10531 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11000 tokens : 3.390909090909091% similarity, with 373 matched token, and 10627 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11100 tokens : 3.3963963963963963% similarity, with 377 matched token, and 10723 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11200 tokens : 3.3839285714285716% similarity, with 379 matched token, and 10821 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11300 tokens : 3.4070796460176993% similarity, with 385 matched token, and 10915 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11400 tokens : 3.43859649122807% similarity, with 392 matched token, and 11008 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11500 tokens : 3.4434782608695653% similarity, with 396 matched token, and 11104 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11600 tokens : 3.4568965517241383% similarity, with 401 matched token, and 11199 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11700 tokens : 3.4444444444444446% similarity, with 403 matched token, and 11297 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11800 tokens : 3.457627118644068% similarity, with 408 matched token, and 11392 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 11900 tokens : 3.46218487394958% similarity, with 412 matched token, and 11488 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12000 tokens : 3.4750000000000005% similarity, with 417 matched token, and 11583 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12100 tokens : 3.487603305785124% similarity, with 422 matched token, and 11678 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12200 tokens : 3.475409836065574% similarity, with 424 matched token, and 11776 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12300 tokens : 3.487804878048781% similarity, with 429 matched token, and 11871 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12400 tokens : 3.491935483870968% similarity, with 433 matched token, and 11967 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12500 tokens : 3.488% similarity, with 436 matched token, and 12064 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12600 tokens : 3.484126984126984% similarity, with 439 matched token, and 12161 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12700 tokens : 3.4881889763779523% similarity, with 443 matched token, and 12257 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12800 tokens : 3.484375% similarity, with 446 matched token, and 12354 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 12900 tokens : 3.488372093023256% similarity, with 450 matched token, and 12450 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13000 tokens : 3.5000000000000004% similarity, with 455 matched token, and 12545 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13100 tokens : 3.5038167938931295% similarity, with 459 matched token, and 12641 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13200 tokens : 3.5000000000000004% similarity, with 462 matched token, and 12738 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13300 tokens : 3.488721804511278% similarity, with 464 matched token, and 12836 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13400 tokens : 3.514925373134328% similarity, with 471 matched token, and 12929 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13500 tokens : 3.503703703703704% similarity, with 473 matched token, and 13027 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13600 tokens : 3.514705882352941% similarity, with 478 matched token, and 13122 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13700 tokens : 3.510948905109489% similarity, with 481 matched token, and 13219 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13800 tokens : 3.5144927536231885% similarity, with 485 matched token, and 13315 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 13900 tokens : 3.5251798561151078% similarity, with 490 matched token, and 13410 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14000 tokens : 3.55% similarity, with 497 matched token, and 13503 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14100 tokens : 3.546099290780142% similarity, with 500 matched token, and 13600 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14200 tokens : 3.535211267605634% similarity, with 502 matched token, and 13698 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14300 tokens : 3.5454545454545454% similarity, with 507 matched token, and 13793 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14400 tokens : 3.5555555555555554% similarity, with 512 matched token, and 13888 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14500 tokens : 3.537931034482759% similarity, with 513 matched token, and 13987 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14600 tokens : 3.5273972602739727% similarity, with 515 matched token, and 14085 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14700 tokens : 3.5646258503401365% similarity, with 524 matched token, and 14176 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14800 tokens : 3.5472972972972974% similarity, with 525 matched token, and 14275 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 14900 tokens : 3.550335570469799% similarity, with 529 matched token, and 14371 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15000 tokens : 3.5533333333333332% similarity, with 533 matched token, and 14467 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15100 tokens : 3.576158940397351% similarity, with 540 matched token, and 14560 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15200 tokens : 3.56578947368421% similarity, with 542 matched token, and 14658 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15300 tokens : 3.5490196078431375% similarity, with 543 matched token, and 14757 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15400 tokens : 3.551948051948052% similarity, with 547 matched token, and 14853 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15500 tokens : 3.5483870967741935% similarity, with 550 matched token, and 14950 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15600 tokens : 3.5448717948717947% similarity, with 553 matched token, and 15047 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15700 tokens : 3.5605095541401273% similarity, with 559 matched token, and 15141 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15800 tokens : 3.5506329113924053% similarity, with 561 matched token, and 15239 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15900 tokens : 3.547169811320755% similarity, with 564 matched token, and 15336 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 16000 tokens : 3.5437499999999997% similarity, with 567 matched token, and 15433 token mismatch\r\n", - "###\r\n", - "### Model validation end ###\r\n", - "###\r\n" - ] - } - ], - "source": [ - "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/BaseV5-C-Tune5.pth\" \"./logs/BaseV5-C-Tune5-16k.csv\" 4100 16000" - ] - }, - { - "cell_type": "markdown", - "id": "a74e51c9", - "metadata": { - "papermill": { - "duration": 0.09516, - "end_time": "2023-09-05T21:13:06.131143", - "exception": false, - "start_time": "2023-09-05T21:13:06.035983", - "status": "completed" - }, - "tags": [] - }, - "source": [ - "# EWR V5 benchmark" - ] - }, - { - "cell_type": "code", - "execution_count": 7, - "id": "9d25dfe2", - "metadata": { - "execution": { - "iopub.execute_input": "2023-09-05T21:13:06.323309Z", - "iopub.status.busy": "2023-09-05T21:13:06.322372Z", - "iopub.status.idle": "2023-09-05T21:13:12.951333Z", - "shell.execute_reply": "2023-09-05T21:13:12.950224Z" - }, - "papermill": { - "duration": 6.72745, - "end_time": "2023-09-05T21:13:12.953705", - "exception": false, - "start_time": "2023-09-05T21:13:06.226255", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-09-05 21:13:10,829] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Traceback (most recent call last):\r\n", - " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 366, in \r\n", - " asyncio.run(main_function())\r\n", - " File \"/usr/lib/python3.10/asyncio/runners.py\", line 44, in run\r\n", - " return loop.run_until_complete(main)\r\n", - " File \"/usr/lib/python3.10/asyncio/base_events.py\", line 649, in run_until_complete\r\n", - " return future.result()\r\n", - " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 58, in main_function\r\n", - " model = SimpleRWKV(model_path, device=\"cuda\")\r\n", - " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 1378, in __init__\r\n", - " self.model = RWKV(**model_config)\r\n", - " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 553, in __init__\r\n", - " raise ValueError(f\"load_model file '{load_model}' does not exist\")\r\n", - "ValueError: load_model file '../../../model/EWR-1B5-E0_1.pth' does not exist\r\n" - ] - } - ], - "source": [ - "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/EWR-1B5-E0_1.pth\" \"./logs/v5-EWR-1B5-E0_1-1k.csv\"" - ] - }, - { - "cell_type": "code", - "execution_count": 8, - "id": "3fcf3d9c", - "metadata": { - "execution": { - "iopub.execute_input": "2023-09-05T21:13:13.146654Z", - "iopub.status.busy": "2023-09-05T21:13:13.146064Z", - "iopub.status.idle": "2023-09-05T21:13:19.792768Z", - "shell.execute_reply": "2023-09-05T21:13:19.791667Z" - }, - "papermill": { - "duration": 6.745739, - "end_time": "2023-09-05T21:13:19.795146", - "exception": false, - "start_time": "2023-09-05T21:13:13.049407", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-09-05 21:13:17,653] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n", - "Traceback (most recent call last):\r\n", - " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 366, in \r\n", - " asyncio.run(main_function())\r\n", - " File \"/usr/lib/python3.10/asyncio/runners.py\", line 44, in run\r\n", - " return loop.run_until_complete(main)\r\n", - " File \"/usr/lib/python3.10/asyncio/base_events.py\", line 649, in run_until_complete\r\n", - " return future.result()\r\n", - " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 58, in main_function\r\n", - " model = SimpleRWKV(model_path, device=\"cuda\")\r\n", - " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 1378, in __init__\r\n", - " self.model = RWKV(**model_config)\r\n", - " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 553, in __init__\r\n", - " raise ValueError(f\"load_model file '{load_model}' does not exist\")\r\n", - "ValueError: load_model file '../../../model/EWR-1B5-E0_1.pth' does not exist\r\n" - ] - } - ], - "source": [ - "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/EWR-1B5-E0_1.pth\" \"./logs/v5-EWR-1B5-E0_1-4k.csv\" 1100 4000" - ] - }, - { - "cell_type": "code", - "execution_count": 9, - "id": "b6a68042", - "metadata": { - "execution": { - "iopub.execute_input": "2023-09-05T21:13:19.986694Z", - "iopub.status.busy": "2023-09-05T21:13:19.986046Z", - "iopub.status.idle": "2023-09-05T21:13:26.675895Z", - "shell.execute_reply": "2023-09-05T21:13:26.674749Z" - }, - "papermill": { - "duration": 6.789014, - "end_time": "2023-09-05T21:13:26.678244", - "exception": false, - "start_time": "2023-09-05T21:13:19.889230", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-09-05 21:13:24,542] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Traceback (most recent call last):\r\n", - " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 366, in \r\n", - " asyncio.run(main_function())\r\n", - " File \"/usr/lib/python3.10/asyncio/runners.py\", line 44, in run\r\n", - " return loop.run_until_complete(main)\r\n", - " File \"/usr/lib/python3.10/asyncio/base_events.py\", line 649, in run_until_complete\r\n", - " return future.result()\r\n", - " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 58, in main_function\r\n", - " model = SimpleRWKV(model_path, device=\"cuda\")\r\n", - " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 1378, in __init__\r\n", - " self.model = RWKV(**model_config)\r\n", - " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 553, in __init__\r\n", - " raise ValueError(f\"load_model file '{load_model}' does not exist\")\r\n", - "ValueError: load_model file '../../../model/EWR-1B5-E0_1.pth' does not exist\r\n" - ] - } - ], - "source": [ - "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/EWR-1B5-E0_1.pth\" \"./logs/v5-EWR-1B5-E0_1-16k.csv\" 4100 16000" - ] - }, - { - "cell_type": "markdown", - "id": "6ecfc74c", - "metadata": { - "papermill": { - "duration": 0.093639, - "end_time": "2023-09-05T21:13:26.866949", - "exception": false, - "start_time": "2023-09-05T21:13:26.773310", - "status": "completed" - }, - "tags": [] - }, - "source": [ - "# v5-L6-D1024-E0_1-mem-ctx-8k.pth" - ] - }, - { - "cell_type": "code", - "execution_count": 10, - "id": "d480f218", - "metadata": { - "execution": { - "iopub.execute_input": "2023-09-05T21:13:27.058397Z", - "iopub.status.busy": "2023-09-05T21:13:27.057750Z", - "iopub.status.idle": "2023-09-05T21:14:20.632357Z", - "shell.execute_reply": "2023-09-05T21:14:20.631176Z" - }, - "papermill": { - "duration": 53.673513, - "end_time": "2023-09-05T21:14:20.634750", - "exception": false, - "start_time": "2023-09-05T21:13:26.961237", - "status": "completed" - }, - "tags": [] - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[2023-09-05 21:13:31,592] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "###\r\n", - "### Model validation start ###\r\n", - "###\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 5 tokens : 100.0% similarity, with 5 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 10 tokens : 100.0% similarity, with 10 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15 tokens : 100.0% similarity, with 15 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 20 tokens : 100.0% similarity, with 20 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 25 tokens : 100.0% similarity, with 25 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 30 tokens : 100.0% similarity, with 30 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 35 tokens : 100.0% similarity, with 35 matched token, and 0 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 40 tokens : 97.5% similarity, with 39 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 45 tokens : 97.77777777777777% similarity, with 44 matched token, and 1 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 50 tokens : 94.0% similarity, with 47 matched token, and 3 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 55 tokens : 85.45454545454545% similarity, with 47 matched token, and 8 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 60 tokens : 83.33333333333334% similarity, with 50 matched token, and 10 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 65 tokens : 81.53846153846153% similarity, with 53 matched token, and 12 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 70 tokens : 72.85714285714285% similarity, with 51 matched token, and 19 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 75 tokens : 68.0% similarity, with 51 matched token, and 24 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 80 tokens : 63.74999999999999% similarity, with 51 matched token, and 29 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 85 tokens : 57.647058823529406% similarity, with 49 matched token, and 36 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 90 tokens : 58.88888888888889% similarity, with 53 matched token, and 37 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 95 tokens : 54.736842105263165% similarity, with 52 matched token, and 43 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 100 tokens : 55.00000000000001% similarity, with 55 matched token, and 45 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 105 tokens : 56.19047619047619% similarity, with 59 matched token, and 46 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 110 tokens : 55.45454545454545% similarity, with 61 matched token, and 49 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 115 tokens : 53.04347826086957% similarity, with 61 matched token, and 54 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 120 tokens : 48.333333333333336% similarity, with 58 matched token, and 62 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 125 tokens : 46.400000000000006% similarity, with 58 matched token, and 67 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 130 tokens : 45.38461538461539% similarity, with 59 matched token, and 71 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 135 tokens : 44.44444444444444% similarity, with 60 matched token, and 75 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 140 tokens : 42.142857142857146% similarity, with 59 matched token, and 81 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 145 tokens : 42.758620689655174% similarity, with 62 matched token, and 83 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 150 tokens : 41.333333333333336% similarity, with 62 matched token, and 88 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 160 tokens : 35.0% similarity, with 56 matched token, and 104 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 170 tokens : 33.52941176470588% similarity, with 57 matched token, and 113 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 180 tokens : 32.77777777777778% similarity, with 59 matched token, and 121 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 190 tokens : 32.631578947368425% similarity, with 62 matched token, and 128 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 200 tokens : 33.0% similarity, with 66 matched token, and 134 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 210 tokens : 32.38095238095238% similarity, with 68 matched token, and 142 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 220 tokens : 29.09090909090909% similarity, with 64 matched token, and 156 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 230 tokens : 28.695652173913043% similarity, with 66 matched token, and 164 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 240 tokens : 30.833333333333336% similarity, with 74 matched token, and 166 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 250 tokens : 30.8% similarity, with 77 matched token, and 173 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 260 tokens : 31.153846153846153% similarity, with 81 matched token, and 179 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 270 tokens : 28.51851851851852% similarity, with 77 matched token, and 193 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 280 tokens : 30.0% similarity, with 84 matched token, and 196 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 290 tokens : 27.586206896551722% similarity, with 80 matched token, and 210 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 300 tokens : 28.000000000000004% similarity, with 84 matched token, and 216 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 325 tokens : 26.153846153846157% similarity, with 85 matched token, and 240 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 350 tokens : 25.142857142857146% similarity, with 88 matched token, and 262 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 375 tokens : 22.933333333333334% similarity, with 86 matched token, and 289 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 400 tokens : 22.75% similarity, with 91 matched token, and 309 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 425 tokens : 22.58823529411765% similarity, with 96 matched token, and 329 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 450 tokens : 20.88888888888889% similarity, with 94 matched token, and 356 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 475 tokens : 19.789473684210527% similarity, with 94 matched token, and 381 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 500 tokens : 18.8% similarity, with 94 matched token, and 406 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 525 tokens : 18.285714285714285% similarity, with 96 matched token, and 429 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 550 tokens : 17.636363636363637% similarity, with 97 matched token, and 453 token mismatch\r\n" + "## Model validation for 525 tokens : 99.61904761904762% similarity, with 523 matched token, and 2 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 575 tokens : 18.086956521739133% similarity, with 104 matched token, and 471 token mismatch\r\n" + "## Model validation for 550 tokens : 99.27272727272727% similarity, with 546 matched token, and 4 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 600 tokens : 17.0% similarity, with 102 matched token, and 498 token mismatch\r\n" + "## Model validation for 575 tokens : 99.30434782608695% similarity, with 571 matched token, and 4 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 625 tokens : 16.96% similarity, with 106 matched token, and 519 token mismatch\r\n" + "## Model validation for 600 tokens : 99.33333333333333% similarity, with 596 matched token, and 4 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 650 tokens : 15.384615384615385% similarity, with 100 matched token, and 550 token mismatch\r\n" + "## Model validation for 625 tokens : 99.03999999999999% similarity, with 619 matched token, and 6 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 675 tokens : 15.851851851851853% similarity, with 107 matched token, and 568 token mismatch\r\n" + "## Model validation for 650 tokens : 99.07692307692308% similarity, with 644 matched token, and 6 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 700 tokens : 14.285714285714285% similarity, with 100 matched token, and 600 token mismatch\r\n" + "## Model validation for 675 tokens : 99.11111111111111% similarity, with 669 matched token, and 6 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 750 tokens : 14.266666666666666% similarity, with 107 matched token, and 643 token mismatch\r\n" + "## Model validation for 700 tokens : 99.0% similarity, with 693 matched token, and 7 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 800 tokens : 13.375% similarity, with 107 matched token, and 693 token mismatch\r\n" + "## Model validation for 750 tokens : 99.06666666666666% similarity, with 743 matched token, and 7 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 850 tokens : 13.529411764705882% similarity, with 115 matched token, and 735 token mismatch\r\n" + "## Model validation for 800 tokens : 99.0% similarity, with 792 matched token, and 8 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 900 tokens : 13.0% similarity, with 117 matched token, and 783 token mismatch\r\n" + "## Model validation for 850 tokens : 99.05882352941177% similarity, with 842 matched token, and 8 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 950 tokens : 12.0% similarity, with 114 matched token, and 836 token mismatch\r\n" + "## Model validation for 900 tokens : 99.0% similarity, with 891 matched token, and 9 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1000 tokens : 11.1% similarity, with 111 matched token, and 889 token mismatch\r\n" + "## Model validation for 950 tokens : 99.1578947368421% similarity, with 942 matched token, and 8 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Finished baseline model to eval output predictive matching (aka 0 memory?), for 1000 tokens\r\n" + "## Model validation for 1000 tokens : 99.2% similarity, with 992 matched token, and 8 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ + "## Finished baseline model to eval output predictive matching (aka 0 memory?), for 1000 tokens\r\n", "###\r\n", "### Model validation end ###\r\n", "###\r\n" @@ -14293,25 +7260,25 @@ } ], "source": [ - "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/v5-L6-D1024-E0_1-mem-ctx-8k.pth\" \"./logs/v5-L6-D1024-E0_1-1k.csv\"" + "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/BaseV5-C-Tune5.pth\" \"./logs/BaseV5-C-Tune5-1k.csv\"" ] }, { "cell_type": "code", - "execution_count": 11, - "id": "50bc6985", + "execution_count": 5, + "id": "633f1f79", "metadata": { "execution": { - "iopub.execute_input": "2023-09-05T21:14:20.832876Z", - "iopub.status.busy": "2023-09-05T21:14:20.832220Z", - "iopub.status.idle": "2023-09-05T21:17:59.733915Z", - "shell.execute_reply": "2023-09-05T21:17:59.732622Z" + "iopub.execute_input": "2023-08-26T13:31:50.161177Z", + "iopub.status.busy": "2023-08-26T13:31:50.160355Z", + "iopub.status.idle": "2023-08-26T13:36:16.812262Z", + "shell.execute_reply": "2023-08-26T13:36:16.811318Z" }, "papermill": { - "duration": 219.003796, - "end_time": "2023-09-05T21:17:59.736377", + "duration": 266.706426, + "end_time": "2023-08-26T13:36:16.814332", "exception": false, - "start_time": "2023-09-05T21:14:20.732581", + "start_time": "2023-08-26T13:31:50.107906", "status": "completed" }, "tags": [] @@ -14321,7 +7288,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "[2023-09-05 21:14:25,362] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" + "[2023-08-26 13:31:54,664] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { @@ -14344,413 +7311,413 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1100 tokens : 10.363636363636363% similarity, with 114 matched token, and 986 token mismatch\r\n" + "## Model validation for 1100 tokens : 98.63636363636363% similarity, with 1085 matched token, and 15 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1150 tokens : 9.826086956521738% similarity, with 113 matched token, and 1037 token mismatch\r\n" + "## Model validation for 1150 tokens : 98.52173913043478% similarity, with 1133 matched token, and 17 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1200 tokens : 9.75% similarity, with 117 matched token, and 1083 token mismatch\r\n" + "## Model validation for 1200 tokens : 98.75% similarity, with 1185 matched token, and 15 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1250 tokens : 9.6% similarity, with 120 matched token, and 1130 token mismatch\r\n" + "## Model validation for 1250 tokens : 98.72% similarity, with 1234 matched token, and 16 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1300 tokens : 9.230769230769232% similarity, with 120 matched token, and 1180 token mismatch\r\n" + "## Model validation for 1300 tokens : 98.61538461538461% similarity, with 1282 matched token, and 18 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1350 tokens : 8.592592592592592% similarity, with 116 matched token, and 1234 token mismatch\r\n" + "## Model validation for 1350 tokens : 98.44444444444444% similarity, with 1329 matched token, and 21 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1400 tokens : 9.071428571428571% similarity, with 127 matched token, and 1273 token mismatch\r\n" + "## Model validation for 1400 tokens : 98.5% similarity, with 1379 matched token, and 21 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1450 tokens : 8.827586206896552% similarity, with 128 matched token, and 1322 token mismatch\r\n" + "## Model validation for 1450 tokens : 98.20689655172414% similarity, with 1424 matched token, and 26 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1500 tokens : 7.933333333333334% similarity, with 119 matched token, and 1381 token mismatch\r\n" + "## Model validation for 1500 tokens : 97.86666666666667% similarity, with 1468 matched token, and 32 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1550 tokens : 7.677419354838709% similarity, with 119 matched token, and 1431 token mismatch\r\n" + "## Model validation for 1550 tokens : 97.67741935483872% similarity, with 1514 matched token, and 36 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1600 tokens : 7.9375% similarity, with 127 matched token, and 1473 token mismatch\r\n" + "## Model validation for 1600 tokens : 97.8125% similarity, with 1565 matched token, and 35 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1650 tokens : 7.212121212121213% similarity, with 119 matched token, and 1531 token mismatch\r\n" + "## Model validation for 1650 tokens : 97.57575757575758% similarity, with 1610 matched token, and 40 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1700 tokens : 6.88235294117647% similarity, with 117 matched token, and 1583 token mismatch\r\n" + "## Model validation for 1700 tokens : 97.6470588235294% similarity, with 1660 matched token, and 40 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1750 tokens : 6.800000000000001% similarity, with 119 matched token, and 1631 token mismatch\r\n" + "## Model validation for 1750 tokens : 97.94285714285714% similarity, with 1714 matched token, and 36 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1800 tokens : 6.888888888888889% similarity, with 124 matched token, and 1676 token mismatch\r\n" + "## Model validation for 1800 tokens : 97.72222222222223% similarity, with 1759 matched token, and 41 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1850 tokens : 6.594594594594596% similarity, with 122 matched token, and 1728 token mismatch\r\n" + "## Model validation for 1850 tokens : 96.86486486486487% similarity, with 1792 matched token, and 58 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1900 tokens : 6.368421052631579% similarity, with 121 matched token, and 1779 token mismatch\r\n" + "## Model validation for 1900 tokens : 96.36842105263158% similarity, with 1831 matched token, and 69 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1950 tokens : 6.102564102564102% similarity, with 119 matched token, and 1831 token mismatch\r\n" + "## Model validation for 1950 tokens : 95.23076923076923% similarity, with 1857 matched token, and 93 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2000 tokens : 6.0% similarity, with 120 matched token, and 1880 token mismatch\r\n" + "## Model validation for 2000 tokens : 94.75% similarity, with 1895 matched token, and 105 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2050 tokens : 5.951219512195122% similarity, with 122 matched token, and 1928 token mismatch\r\n" + "## Model validation for 2050 tokens : 93.26829268292684% similarity, with 1912 matched token, and 138 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2100 tokens : 5.714285714285714% similarity, with 120 matched token, and 1980 token mismatch\r\n" + "## Model validation for 2100 tokens : 91.33333333333333% similarity, with 1918 matched token, and 182 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2150 tokens : 5.627906976744186% similarity, with 121 matched token, and 2029 token mismatch\r\n" + "## Model validation for 2150 tokens : 90.13953488372093% similarity, with 1938 matched token, and 212 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2200 tokens : 5.227272727272727% similarity, with 115 matched token, and 2085 token mismatch\r\n" + "## Model validation for 2200 tokens : 88.81818181818181% similarity, with 1954 matched token, and 246 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2250 tokens : 5.066666666666666% similarity, with 114 matched token, and 2136 token mismatch\r\n" + "## Model validation for 2250 tokens : 86.62222222222222% similarity, with 1949 matched token, and 301 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2300 tokens : 5.043478260869565% similarity, with 116 matched token, and 2184 token mismatch\r\n" + "## Model validation for 2300 tokens : 84.82608695652173% similarity, with 1951 matched token, and 349 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2350 tokens : 4.808510638297872% similarity, with 113 matched token, and 2237 token mismatch\r\n" + "## Model validation for 2350 tokens : 82.08510638297872% similarity, with 1929 matched token, and 421 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2400 tokens : 4.75% similarity, with 114 matched token, and 2286 token mismatch\r\n" + "## Model validation for 2400 tokens : 80.625% similarity, with 1935 matched token, and 465 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2450 tokens : 4.775510204081632% similarity, with 117 matched token, and 2333 token mismatch\r\n" + "## Model validation for 2450 tokens : 78.61224489795919% similarity, with 1926 matched token, and 524 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2500 tokens : 4.68% similarity, with 117 matched token, and 2383 token mismatch\r\n" + "## Model validation for 2500 tokens : 77.08% similarity, with 1927 matched token, and 573 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2550 tokens : 4.627450980392156% similarity, with 118 matched token, and 2432 token mismatch\r\n" + "## Model validation for 2550 tokens : 75.25490196078431% similarity, with 1919 matched token, and 631 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2600 tokens : 4.576923076923077% similarity, with 119 matched token, and 2481 token mismatch\r\n" + "## Model validation for 2600 tokens : 73.88461538461539% similarity, with 1921 matched token, and 679 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2650 tokens : 4.60377358490566% similarity, with 122 matched token, and 2528 token mismatch\r\n" + "## Model validation for 2650 tokens : 72.71698113207547% similarity, with 1927 matched token, and 723 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2700 tokens : 4.62962962962963% similarity, with 125 matched token, and 2575 token mismatch\r\n" + "## Model validation for 2700 tokens : 71.4074074074074% similarity, with 1928 matched token, and 772 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2750 tokens : 4.618181818181818% similarity, with 127 matched token, and 2623 token mismatch\r\n" + "## Model validation for 2750 tokens : 70.10909090909091% similarity, with 1928 matched token, and 822 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2800 tokens : 4.5% similarity, with 126 matched token, and 2674 token mismatch\r\n" + "## Model validation for 2800 tokens : 68.85714285714286% similarity, with 1928 matched token, and 872 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2850 tokens : 4.456140350877193% similarity, with 127 matched token, and 2723 token mismatch\r\n" + "## Model validation for 2850 tokens : 67.89473684210526% similarity, with 1935 matched token, and 915 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2900 tokens : 4.344827586206897% similarity, with 126 matched token, and 2774 token mismatch\r\n" + "## Model validation for 2900 tokens : 66.6896551724138% similarity, with 1934 matched token, and 966 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2950 tokens : 4.372881355932203% similarity, with 129 matched token, and 2821 token mismatch\r\n" + "## Model validation for 2950 tokens : 65.62711864406779% similarity, with 1936 matched token, and 1014 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3000 tokens : 4.233333333333333% similarity, with 127 matched token, and 2873 token mismatch\r\n" + "## Model validation for 3000 tokens : 64.4% similarity, with 1932 matched token, and 1068 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3050 tokens : 4.19672131147541% similarity, with 128 matched token, and 2922 token mismatch\r\n" + "## Model validation for 3050 tokens : 63.31147540983607% similarity, with 1931 matched token, and 1119 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3100 tokens : 4.161290322580645% similarity, with 129 matched token, and 2971 token mismatch\r\n" + "## Model validation for 3100 tokens : 62.096774193548384% similarity, with 1925 matched token, and 1175 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3150 tokens : 4.1269841269841265% similarity, with 130 matched token, and 3020 token mismatch\r\n" + "## Model validation for 3150 tokens : 61.17460317460317% similarity, with 1927 matched token, and 1223 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3200 tokens : 4.125% similarity, with 132 matched token, and 3068 token mismatch\r\n" + "## Model validation for 3200 tokens : 60.21875% similarity, with 1927 matched token, and 1273 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3250 tokens : 4.153846153846154% similarity, with 135 matched token, and 3115 token mismatch\r\n" + "## Model validation for 3250 tokens : 59.199999999999996% similarity, with 1924 matched token, and 1326 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3300 tokens : 4.121212121212121% similarity, with 136 matched token, and 3164 token mismatch\r\n" + "## Model validation for 3300 tokens : 58.18181818181818% similarity, with 1920 matched token, and 1380 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3350 tokens : 3.940298507462687% similarity, with 132 matched token, and 3218 token mismatch\r\n" + "## Model validation for 3350 tokens : 57.134328358208954% similarity, with 1914 matched token, and 1436 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3400 tokens : 3.9411764705882355% similarity, with 134 matched token, and 3266 token mismatch\r\n" + "## Model validation for 3400 tokens : 56.294117647058826% similarity, with 1914 matched token, and 1486 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3450 tokens : 3.91304347826087% similarity, with 135 matched token, and 3315 token mismatch\r\n" + "## Model validation for 3450 tokens : 55.362318840579704% similarity, with 1910 matched token, and 1540 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3500 tokens : 3.9142857142857146% similarity, with 137 matched token, and 3363 token mismatch\r\n" + "## Model validation for 3500 tokens : 54.400000000000006% similarity, with 1904 matched token, and 1596 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3550 tokens : 3.859154929577465% similarity, with 137 matched token, and 3413 token mismatch\r\n" + "## Model validation for 3550 tokens : 53.54929577464789% similarity, with 1901 matched token, and 1649 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3600 tokens : 3.888888888888889% similarity, with 140 matched token, and 3460 token mismatch\r\n" + "## Model validation for 3600 tokens : 52.77777777777778% similarity, with 1900 matched token, and 1700 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3650 tokens : 3.863013698630137% similarity, with 141 matched token, and 3509 token mismatch\r\n" + "## Model validation for 3650 tokens : 51.89041095890411% similarity, with 1894 matched token, and 1756 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3700 tokens : 3.8108108108108105% similarity, with 141 matched token, and 3559 token mismatch\r\n" + "## Model validation for 3700 tokens : 51.054054054054056% similarity, with 1889 matched token, and 1811 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3750 tokens : 3.7600000000000002% similarity, with 141 matched token, and 3609 token mismatch\r\n" + "## Model validation for 3750 tokens : 50.18666666666667% similarity, with 1882 matched token, and 1868 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3800 tokens : 3.763157894736842% similarity, with 143 matched token, and 3657 token mismatch\r\n" + "## Model validation for 3800 tokens : 49.31578947368421% similarity, with 1874 matched token, and 1926 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3850 tokens : 3.766233766233766% similarity, with 145 matched token, and 3705 token mismatch\r\n" + "## Model validation for 3850 tokens : 48.51948051948052% similarity, with 1868 matched token, and 1982 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3900 tokens : 3.717948717948718% similarity, with 145 matched token, and 3755 token mismatch\r\n" + "## Model validation for 3900 tokens : 47.53846153846154% similarity, with 1854 matched token, and 2046 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3950 tokens : 3.645569620253165% similarity, with 144 matched token, and 3806 token mismatch\r\n" + "## Model validation for 3950 tokens : 46.607594936708864% similarity, with 1841 matched token, and 2109 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4000 tokens : 3.6249999999999996% similarity, with 145 matched token, and 3855 token mismatch\r\n", + "## Model validation for 4000 tokens : 45.574999999999996% similarity, with 1823 matched token, and 2177 token mismatch\r\n", "###\r\n", "### Model validation end ###\r\n", "###\r\n" @@ -14758,916 +7725,1095 @@ } ], "source": [ - "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/v5-L6-D1024-E0_1-mem-ctx-8k.pth\" \"./logs/v5-L6-D1024-E0_1-4k.csv\" 1100 4000" + "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/BaseV5-C-Tune5.pth\" \"./logs/BaseV5-C-Tune5-4k.csv\" 1100 4000" ] }, { "cell_type": "code", - "execution_count": 12, - "id": "488296d3", + "execution_count": 6, + "id": "f78a7cce", "metadata": { "execution": { - "iopub.execute_input": "2023-09-05T21:17:59.942749Z", - "iopub.status.busy": "2023-09-05T21:17:59.941792Z", - "iopub.status.idle": "2023-09-05T22:15:37.866692Z", - "shell.execute_reply": "2023-09-05T22:15:37.865420Z" + "iopub.execute_input": "2023-08-26T13:36:16.924786Z", + "iopub.status.busy": "2023-08-26T13:36:16.924015Z", + "iopub.status.idle": "2023-08-26T14:38:59.194602Z", + "shell.execute_reply": "2023-08-26T14:38:59.193661Z" }, "papermill": { - "duration": 3458.031609, - "end_time": "2023-09-05T22:15:37.869014", + "duration": 3762.328534, + "end_time": "2023-08-26T14:38:59.196991", "exception": false, - "start_time": "2023-09-05T21:17:59.837405", + "start_time": "2023-08-26T13:36:16.868457", "status": "completed" }, - "tags": [] - }, - "outputs": [ + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[2023-08-26 13:36:21,464] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "###\r\n", + "### Model validation start ###\r\n", + "###\r\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "## Model validation for 4100 tokens : 43.97560975609756% similarity, with 1803 matched token, and 2297 token mismatch\r\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "## Model validation for 4200 tokens : 42.142857142857146% similarity, with 1770 matched token, and 2430 token mismatch\r\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "## Model validation for 4300 tokens : 40.27906976744186% similarity, with 1732 matched token, and 2568 token mismatch\r\n" + ] + }, { "name": "stdout", "output_type": "stream", "text": [ - "[2023-09-05 21:18:04,474] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" + "## Model validation for 4400 tokens : 38.27272727272727% similarity, with 1684 matched token, and 2716 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n" + "## Model validation for 4500 tokens : 35.8% similarity, with 1611 matched token, and 2889 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "###\r\n", - "### Model validation start ###\r\n", - "###\r\n" + "## Model validation for 4600 tokens : 33.71739130434783% similarity, with 1551 matched token, and 3049 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4100 tokens : 3.6585365853658534% similarity, with 150 matched token, and 3950 token mismatch\r\n" + "## Model validation for 4700 tokens : 31.06382978723404% similarity, with 1460 matched token, and 3240 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4200 tokens : 3.571428571428571% similarity, with 150 matched token, and 4050 token mismatch\r\n" + "## Model validation for 4800 tokens : 28.375% similarity, with 1362 matched token, and 3438 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4300 tokens : 3.5348837209302326% similarity, with 152 matched token, and 4148 token mismatch\r\n" + "## Model validation for 4900 tokens : 25.857142857142858% similarity, with 1267 matched token, and 3633 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4400 tokens : 3.5227272727272725% similarity, with 155 matched token, and 4245 token mismatch\r\n" + "## Model validation for 5000 tokens : 23.04% similarity, with 1152 matched token, and 3848 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4500 tokens : 3.4888888888888885% similarity, with 157 matched token, and 4343 token mismatch\r\n" + "## Model validation for 5100 tokens : 20.784313725490197% similarity, with 1060 matched token, and 4040 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4600 tokens : 3.5000000000000004% similarity, with 161 matched token, and 4439 token mismatch\r\n" + "## Model validation for 5200 tokens : 18.5% similarity, with 962 matched token, and 4238 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4700 tokens : 3.5106382978723407% similarity, with 165 matched token, and 4535 token mismatch\r\n" + "## Model validation for 5300 tokens : 16.88679245283019% similarity, with 895 matched token, and 4405 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4800 tokens : 3.4583333333333335% similarity, with 166 matched token, and 4634 token mismatch\r\n" + "## Model validation for 5400 tokens : 15.24074074074074% similarity, with 823 matched token, and 4577 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4900 tokens : 3.4489795918367343% similarity, with 169 matched token, and 4731 token mismatch\r\n" + "## Model validation for 5500 tokens : 13.436363636363636% similarity, with 739 matched token, and 4761 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5000 tokens : 3.38% similarity, with 169 matched token, and 4831 token mismatch\r\n" + "## Model validation for 5600 tokens : 11.607142857142858% similarity, with 650 matched token, and 4950 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5100 tokens : 3.392156862745098% similarity, with 173 matched token, and 4927 token mismatch\r\n" + "## Model validation for 5700 tokens : 10.385964912280702% similarity, with 592 matched token, and 5108 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5200 tokens : 3.307692307692308% similarity, with 172 matched token, and 5028 token mismatch\r\n" + "## Model validation for 5800 tokens : 9.327586206896552% similarity, with 541 matched token, and 5259 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5300 tokens : 3.3207547169811322% similarity, with 176 matched token, and 5124 token mismatch\r\n" + "## Model validation for 5900 tokens : 8.305084745762711% similarity, with 490 matched token, and 5410 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5400 tokens : 3.2407407407407405% similarity, with 175 matched token, and 5225 token mismatch\r\n" + "## Model validation for 6000 tokens : 7.466666666666668% similarity, with 448 matched token, and 5552 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5500 tokens : 3.272727272727273% similarity, with 180 matched token, and 5320 token mismatch\r\n" + "## Model validation for 6100 tokens : 6.672131147540984% similarity, with 407 matched token, and 5693 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5600 tokens : 3.2857142857142856% similarity, with 184 matched token, and 5416 token mismatch\r\n" + "## Model validation for 6200 tokens : 6.048387096774194% similarity, with 375 matched token, and 5825 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5700 tokens : 3.263157894736842% similarity, with 186 matched token, and 5514 token mismatch\r\n" + "## Model validation for 6300 tokens : 5.65079365079365% similarity, with 356 matched token, and 5944 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5800 tokens : 3.2241379310344827% similarity, with 187 matched token, and 5613 token mismatch\r\n" + "## Model validation for 6400 tokens : 5.328125% similarity, with 341 matched token, and 6059 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5900 tokens : 3.2542372881355934% similarity, with 192 matched token, and 5708 token mismatch\r\n" + "## Model validation for 6500 tokens : 4.984615384615385% similarity, with 324 matched token, and 6176 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6000 tokens : 3.2333333333333334% similarity, with 194 matched token, and 5806 token mismatch\r\n" + "## Model validation for 6600 tokens : 4.6818181818181825% similarity, with 309 matched token, and 6291 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6100 tokens : 3.245901639344263% similarity, with 198 matched token, and 5902 token mismatch\r\n" + "## Model validation for 6700 tokens : 4.447761194029851% similarity, with 298 matched token, and 6402 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6200 tokens : 3.225806451612903% similarity, with 200 matched token, and 6000 token mismatch\r\n" + "## Model validation for 6800 tokens : 4.25% similarity, with 289 matched token, and 6511 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6300 tokens : 3.2380952380952377% similarity, with 204 matched token, and 6096 token mismatch\r\n" + "## Model validation for 6900 tokens : 4.08695652173913% similarity, with 282 matched token, and 6618 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6400 tokens : 3.2343749999999996% similarity, with 207 matched token, and 6193 token mismatch\r\n" + "## Model validation for 7000 tokens : 4.0% similarity, with 280 matched token, and 6720 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6500 tokens : 3.2615384615384615% similarity, with 212 matched token, and 6288 token mismatch\r\n" + "## Model validation for 7100 tokens : 3.943661971830986% similarity, with 280 matched token, and 6820 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6600 tokens : 3.2424242424242427% similarity, with 214 matched token, and 6386 token mismatch\r\n" + "## Model validation for 7200 tokens : 3.763888888888889% similarity, with 271 matched token, and 6929 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6700 tokens : 3.268656716417911% similarity, with 219 matched token, and 6481 token mismatch\r\n" + "## Model validation for 7300 tokens : 3.767123287671233% similarity, with 275 matched token, and 7025 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6800 tokens : 3.25% similarity, with 221 matched token, and 6579 token mismatch\r\n" + "## Model validation for 7400 tokens : 3.689189189189189% similarity, with 273 matched token, and 7127 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6900 tokens : 3.27536231884058% similarity, with 226 matched token, and 6674 token mismatch\r\n" + "## Model validation for 7500 tokens : 3.64% similarity, with 273 matched token, and 7227 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 7000 tokens : 3.257142857142857% similarity, with 228 matched token, and 6772 token mismatch\r\n" + "## Model validation for 7600 tokens : 3.578947368421052% similarity, with 272 matched token, and 7328 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 7100 tokens : 3.2394366197183095% similarity, with 230 matched token, and 6870 token mismatch\r\n" + "## Model validation for 7700 tokens : 3.5844155844155843% similarity, with 276 matched token, and 7424 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 7200 tokens : 3.236111111111111% similarity, with 233 matched token, and 6967 token mismatch\r\n" + "## Model validation for 7800 tokens : 3.5512820512820515% similarity, with 277 matched token, and 7523 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 7300 tokens : 3.2602739726027394% similarity, with 238 matched token, and 7062 token mismatch\r\n" + "## Model validation for 7900 tokens : 3.468354430379747% similarity, with 274 matched token, and 7626 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 7400 tokens : 3.256756756756757% similarity, with 241 matched token, and 7159 token mismatch\r\n" + "## Model validation for 8000 tokens : 3.4250000000000003% similarity, with 274 matched token, and 7726 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 7500 tokens : 3.2399999999999998% similarity, with 243 matched token, and 7257 token mismatch\r\n" + "## Model validation for 8100 tokens : 3.419753086419753% similarity, with 277 matched token, and 7823 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 7600 tokens : 3.25% similarity, with 247 matched token, and 7353 token mismatch\r\n" + "## Model validation for 8200 tokens : 3.414634146341464% similarity, with 280 matched token, and 7920 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 7700 tokens : 3.25974025974026% similarity, with 251 matched token, and 7449 token mismatch\r\n" + "## Model validation for 8300 tokens : 3.36144578313253% similarity, with 279 matched token, and 8021 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 7800 tokens : 3.2435897435897436% similarity, with 253 matched token, and 7547 token mismatch\r\n" + "## Model validation for 8400 tokens : 3.3690476190476186% similarity, with 283 matched token, and 8117 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 7900 tokens : 3.2405063291139244% similarity, with 256 matched token, and 7644 token mismatch\r\n" + "## Model validation for 8500 tokens : 3.3411764705882354% similarity, with 284 matched token, and 8216 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 8000 tokens : 3.2375000000000003% similarity, with 259 matched token, and 7741 token mismatch\r\n" + "## Model validation for 8600 tokens : 3.3488372093023258% similarity, with 288 matched token, and 8312 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 8100 tokens : 3.2839506172839505% similarity, with 266 matched token, and 7834 token mismatch\r\n" + "## Model validation for 8700 tokens : 3.3678160919540225% similarity, with 293 matched token, and 8407 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 8200 tokens : 3.2682926829268295% similarity, with 268 matched token, and 7932 token mismatch\r\n" + "## Model validation for 8800 tokens : 3.3295454545454546% similarity, with 293 matched token, and 8507 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 8300 tokens : 3.2530120481927707% similarity, with 270 matched token, and 8030 token mismatch\r\n" + "## Model validation for 8900 tokens : 3.348314606741573% similarity, with 298 matched token, and 8602 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 8400 tokens : 3.2380952380952377% similarity, with 272 matched token, and 8128 token mismatch\r\n" + "## Model validation for 9000 tokens : 3.3333333333333335% similarity, with 300 matched token, and 8700 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 8500 tokens : 3.2705882352941176% similarity, with 278 matched token, and 8222 token mismatch\r\n" + "## Model validation for 9100 tokens : 3.3406593406593412% similarity, with 304 matched token, and 8796 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 8600 tokens : 3.2674418604651168% similarity, with 281 matched token, and 8319 token mismatch\r\n" + "## Model validation for 9200 tokens : 3.3260869565217392% similarity, with 306 matched token, and 8894 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 8700 tokens : 3.2758620689655173% similarity, with 285 matched token, and 8415 token mismatch\r\n" + "## Model validation for 9300 tokens : 3.3010752688172045% similarity, with 307 matched token, and 8993 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 8800 tokens : 3.25% similarity, with 286 matched token, and 8514 token mismatch\r\n" + "## Model validation for 9400 tokens : 3.2978723404255317% similarity, with 310 matched token, and 9090 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 8900 tokens : 3.258426966292135% similarity, with 290 matched token, and 8610 token mismatch\r\n" + "## Model validation for 9500 tokens : 3.3157894736842106% similarity, with 315 matched token, and 9185 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9000 tokens : 3.255555555555555% similarity, with 293 matched token, and 8707 token mismatch\r\n" + "## Model validation for 9600 tokens : 3.3229166666666665% similarity, with 319 matched token, and 9281 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9100 tokens : 3.274725274725275% similarity, with 298 matched token, and 8802 token mismatch\r\n" + "## Model validation for 9700 tokens : 3.3195876288659796% similarity, with 322 matched token, and 9378 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9200 tokens : 3.2717391304347823% similarity, with 301 matched token, and 8899 token mismatch\r\n" + "## Model validation for 9800 tokens : 3.316326530612245% similarity, with 325 matched token, and 9475 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9300 tokens : 3.258064516129032% similarity, with 303 matched token, and 8997 token mismatch\r\n" + "## Model validation for 9900 tokens : 3.3333333333333335% similarity, with 330 matched token, and 9570 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9400 tokens : 3.2446808510638294% similarity, with 305 matched token, and 9095 token mismatch\r\n" + "## Model validation for 10000 tokens : 3.37% similarity, with 337 matched token, and 9663 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9500 tokens : 3.263157894736842% similarity, with 310 matched token, and 9190 token mismatch\r\n" + "## Model validation for 10100 tokens : 3.3762376237623766% similarity, with 341 matched token, and 9759 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9600 tokens : 3.2604166666666665% similarity, with 313 matched token, and 9287 token mismatch\r\n" + "## Model validation for 10200 tokens : 3.3725490196078427% similarity, with 344 matched token, and 9856 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9700 tokens : 3.257731958762886% similarity, with 316 matched token, and 9384 token mismatch\r\n" + "## Model validation for 10300 tokens : 3.349514563106796% similarity, with 345 matched token, and 9955 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9800 tokens : 3.2448979591836737% similarity, with 318 matched token, and 9482 token mismatch\r\n" + "## Model validation for 10400 tokens : 3.355769230769231% similarity, with 349 matched token, and 10051 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9900 tokens : 3.262626262626263% similarity, with 323 matched token, and 9577 token mismatch\r\n" + "## Model validation for 10500 tokens : 3.371428571428572% similarity, with 354 matched token, and 10146 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 10000 tokens : 3.29% similarity, with 329 matched token, and 9671 token mismatch\r\n" + "## Model validation for 10600 tokens : 3.3584905660377355% similarity, with 356 matched token, and 10244 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 10100 tokens : 3.306930693069307% similarity, with 334 matched token, and 9766 token mismatch\r\n" + "## Model validation for 10700 tokens : 3.392523364485981% similarity, with 363 matched token, and 10337 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 10200 tokens : 3.294117647058824% similarity, with 336 matched token, and 9864 token mismatch\r\n" + "## Model validation for 10800 tokens : 3.4074074074074074% similarity, with 368 matched token, and 10432 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 10300 tokens : 3.2815533980582527% similarity, with 338 matched token, and 9962 token mismatch\r\n" + "## Model validation for 10900 tokens : 3.3853211009174315% similarity, with 369 matched token, and 10531 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 10400 tokens : 3.2884615384615388% similarity, with 342 matched token, and 10058 token mismatch\r\n" + "## Model validation for 11000 tokens : 3.4000000000000004% similarity, with 374 matched token, and 10626 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 10500 tokens : 3.3047619047619046% similarity, with 347 matched token, and 10153 token mismatch\r\n" + "## Model validation for 11100 tokens : 3.3963963963963963% similarity, with 377 matched token, and 10723 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 10600 tokens : 3.2924528301886795% similarity, with 349 matched token, and 10251 token mismatch\r\n" + "## Model validation for 11200 tokens : 3.3839285714285716% similarity, with 379 matched token, and 10821 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 10700 tokens : 3.3177570093457946% similarity, with 355 matched token, and 10345 token mismatch\r\n" + "## Model validation for 11300 tokens : 3.4070796460176993% similarity, with 385 matched token, and 10915 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 10800 tokens : 3.3240740740740735% similarity, with 359 matched token, and 10441 token mismatch\r\n" + "## Model validation for 11400 tokens : 3.43859649122807% similarity, with 392 matched token, and 11008 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 10900 tokens : 3.311926605504587% similarity, with 361 matched token, and 10539 token mismatch\r\n" + "## Model validation for 11500 tokens : 3.4434782608695653% similarity, with 396 matched token, and 11104 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 11000 tokens : 3.327272727272727% similarity, with 366 matched token, and 10634 token mismatch\r\n" + "## Model validation for 11600 tokens : 3.4568965517241383% similarity, with 401 matched token, and 11199 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 11100 tokens : 3.3153153153153156% similarity, with 368 matched token, and 10732 token mismatch\r\n" + "## Model validation for 11700 tokens : 3.4444444444444446% similarity, with 403 matched token, and 11297 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 11200 tokens : 3.303571428571429% similarity, with 370 matched token, and 10830 token mismatch\r\n" + "## Model validation for 11800 tokens : 3.457627118644068% similarity, with 408 matched token, and 11392 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 11300 tokens : 3.3097345132743365% similarity, with 374 matched token, and 10926 token mismatch\r\n" + "## Model validation for 11900 tokens : 3.46218487394958% similarity, with 412 matched token, and 11488 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 11400 tokens : 3.3421052631578947% similarity, with 381 matched token, and 11019 token mismatch\r\n" + "## Model validation for 12000 tokens : 3.4750000000000005% similarity, with 417 matched token, and 11583 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 11500 tokens : 3.3304347826086955% similarity, with 383 matched token, and 11117 token mismatch\r\n" + "## Model validation for 12100 tokens : 3.487603305785124% similarity, with 422 matched token, and 11678 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 11600 tokens : 3.3448275862068964% similarity, with 388 matched token, and 11212 token mismatch\r\n" + "## Model validation for 12200 tokens : 3.475409836065574% similarity, with 424 matched token, and 11776 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 11700 tokens : 3.3333333333333335% similarity, with 390 matched token, and 11310 token mismatch\r\n" + "## Model validation for 12300 tokens : 3.487804878048781% similarity, with 429 matched token, and 11871 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 11800 tokens : 3.347457627118644% similarity, with 395 matched token, and 11405 token mismatch\r\n" + "## Model validation for 12400 tokens : 3.491935483870968% similarity, with 433 matched token, and 11967 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 11900 tokens : 3.34453781512605% similarity, with 398 matched token, and 11502 token mismatch\r\n" + "## Model validation for 12500 tokens : 3.488% similarity, with 436 matched token, and 12064 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 12000 tokens : 3.3583333333333334% similarity, with 403 matched token, and 11597 token mismatch\r\n" + "## Model validation for 12600 tokens : 3.484126984126984% similarity, with 439 matched token, and 12161 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 12100 tokens : 3.3636363636363638% similarity, with 407 matched token, and 11693 token mismatch\r\n" + "## Model validation for 12700 tokens : 3.4881889763779523% similarity, with 443 matched token, and 12257 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 12200 tokens : 3.3524590163934427% similarity, with 409 matched token, and 11791 token mismatch\r\n" + "## Model validation for 12800 tokens : 3.484375% similarity, with 446 matched token, and 12354 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 12300 tokens : 3.3577235772357725% similarity, with 413 matched token, and 11887 token mismatch\r\n" + "## Model validation for 12900 tokens : 3.488372093023256% similarity, with 450 matched token, and 12450 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 12400 tokens : 3.354838709677419% similarity, with 416 matched token, and 11984 token mismatch\r\n" + "## Model validation for 13000 tokens : 3.5000000000000004% similarity, with 455 matched token, and 12545 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 12500 tokens : 3.3520000000000003% similarity, with 419 matched token, and 12081 token mismatch\r\n" + "## Model validation for 13100 tokens : 3.5038167938931295% similarity, with 459 matched token, and 12641 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 12600 tokens : 3.349206349206349% similarity, with 422 matched token, and 12178 token mismatch\r\n" + "## Model validation for 13200 tokens : 3.5000000000000004% similarity, with 462 matched token, and 12738 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 12700 tokens : 3.362204724409449% similarity, with 427 matched token, and 12273 token mismatch\r\n" + "## Model validation for 13300 tokens : 3.488721804511278% similarity, with 464 matched token, and 12836 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 12800 tokens : 3.3515625% similarity, with 429 matched token, and 12371 token mismatch\r\n" + "## Model validation for 13400 tokens : 3.514925373134328% similarity, with 471 matched token, and 12929 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 12900 tokens : 3.356589147286822% similarity, with 433 matched token, and 12467 token mismatch\r\n" + "## Model validation for 13500 tokens : 3.503703703703704% similarity, with 473 matched token, and 13027 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 13000 tokens : 3.3692307692307697% similarity, with 438 matched token, and 12562 token mismatch\r\n" + "## Model validation for 13600 tokens : 3.514705882352941% similarity, with 478 matched token, and 13122 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 13100 tokens : 3.3587786259541987% similarity, with 440 matched token, and 12660 token mismatch\r\n" + "## Model validation for 13700 tokens : 3.510948905109489% similarity, with 481 matched token, and 13219 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 13200 tokens : 3.3636363636363638% similarity, with 444 matched token, and 12756 token mismatch\r\n" + "## Model validation for 13800 tokens : 3.5144927536231885% similarity, with 485 matched token, and 13315 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 13300 tokens : 3.3533834586466167% similarity, with 446 matched token, and 12854 token mismatch\r\n" + "## Model validation for 13900 tokens : 3.5251798561151078% similarity, with 490 matched token, and 13410 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 13400 tokens : 3.3731343283582094% similarity, with 452 matched token, and 12948 token mismatch\r\n" + "## Model validation for 14000 tokens : 3.55% similarity, with 497 matched token, and 13503 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 13500 tokens : 3.355555555555555% similarity, with 453 matched token, and 13047 token mismatch\r\n" + "## Model validation for 14100 tokens : 3.546099290780142% similarity, with 500 matched token, and 13600 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 13600 tokens : 3.3602941176470584% similarity, with 457 matched token, and 13143 token mismatch\r\n" + "## Model validation for 14200 tokens : 3.535211267605634% similarity, with 502 matched token, and 13698 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 13700 tokens : 3.343065693430657% similarity, with 458 matched token, and 13242 token mismatch\r\n" + "## Model validation for 14300 tokens : 3.5454545454545454% similarity, with 507 matched token, and 13793 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 13800 tokens : 3.355072463768116% similarity, with 463 matched token, and 13337 token mismatch\r\n" + "## Model validation for 14400 tokens : 3.5555555555555554% similarity, with 512 matched token, and 13888 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 13900 tokens : 3.3741007194244603% similarity, with 469 matched token, and 13431 token mismatch\r\n" + "## Model validation for 14500 tokens : 3.537931034482759% similarity, with 513 matched token, and 13987 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 14000 tokens : 3.3857142857142857% similarity, with 474 matched token, and 13526 token mismatch\r\n" + "## Model validation for 14600 tokens : 3.5273972602739727% similarity, with 515 matched token, and 14085 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 14100 tokens : 3.3829787234042556% similarity, with 477 matched token, and 13623 token mismatch\r\n" + "## Model validation for 14700 tokens : 3.5646258503401365% similarity, with 524 matched token, and 14176 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 14200 tokens : 3.373239436619718% similarity, with 479 matched token, and 13721 token mismatch\r\n" + "## Model validation for 14800 tokens : 3.5472972972972974% similarity, with 525 matched token, and 14275 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 14300 tokens : 3.3636363636363638% similarity, with 481 matched token, and 13819 token mismatch\r\n" + "## Model validation for 14900 tokens : 3.550335570469799% similarity, with 529 matched token, and 14371 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 14400 tokens : 3.375% similarity, with 486 matched token, and 13914 token mismatch\r\n" + "## Model validation for 15000 tokens : 3.5533333333333332% similarity, with 533 matched token, and 14467 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 14500 tokens : 3.36551724137931% similarity, with 488 matched token, and 14012 token mismatch\r\n" + "## Model validation for 15100 tokens : 3.576158940397351% similarity, with 540 matched token, and 14560 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 14600 tokens : 3.356164383561644% similarity, with 490 matched token, and 14110 token mismatch\r\n" + "## Model validation for 15200 tokens : 3.56578947368421% similarity, with 542 matched token, and 14658 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 14700 tokens : 3.387755102040816% similarity, with 498 matched token, and 14202 token mismatch\r\n" + "## Model validation for 15300 tokens : 3.5490196078431375% similarity, with 543 matched token, and 14757 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 14800 tokens : 3.371621621621622% similarity, with 499 matched token, and 14301 token mismatch\r\n" + "## Model validation for 15400 tokens : 3.551948051948052% similarity, with 547 matched token, and 14853 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 14900 tokens : 3.3758389261744965% similarity, with 503 matched token, and 14397 token mismatch\r\n" + "## Model validation for 15500 tokens : 3.5483870967741935% similarity, with 550 matched token, and 14950 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 15000 tokens : 3.373333333333333% similarity, with 506 matched token, and 14494 token mismatch\r\n" + "## Model validation for 15600 tokens : 3.5448717948717947% similarity, with 553 matched token, and 15047 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 15100 tokens : 3.357615894039735% similarity, with 507 matched token, and 14593 token mismatch\r\n" + "## Model validation for 15700 tokens : 3.5605095541401273% similarity, with 559 matched token, and 15141 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 15200 tokens : 3.3486842105263155% similarity, with 509 matched token, and 14691 token mismatch\r\n" + "## Model validation for 15800 tokens : 3.5506329113924053% similarity, with 561 matched token, and 15239 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 15300 tokens : 3.3529411764705883% similarity, with 513 matched token, and 14787 token mismatch\r\n" + "## Model validation for 15900 tokens : 3.547169811320755% similarity, with 564 matched token, and 15336 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 15400 tokens : 3.3441558441558437% similarity, with 515 matched token, and 14885 token mismatch\r\n" + "## Model validation for 16000 tokens : 3.5437499999999997% similarity, with 567 matched token, and 15433 token mismatch\r\n", + "###\r\n", + "### Model validation end ###\r\n", + "###\r\n" ] + } + ], + "source": [ + "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/BaseV5-C-Tune5.pth\" \"./logs/BaseV5-C-Tune5-16k.csv\" 4100 16000" + ] + }, + { + "cell_type": "markdown", + "id": "cfbf5b3d", + "metadata": { + "papermill": { + "duration": 0.061671, + "end_time": "2023-08-26T14:38:59.320285", + "exception": false, + "start_time": "2023-08-26T14:38:59.258614", + "status": "completed" + }, + "tags": [] + }, + "source": [ + "# EWR V5 benchmark" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "60d86655", + "metadata": { + "execution": { + "iopub.execute_input": "2023-08-26T14:38:59.445569Z", + "iopub.status.busy": "2023-08-26T14:38:59.444939Z", + "iopub.status.idle": "2023-08-26T14:39:05.718059Z", + "shell.execute_reply": "2023-08-26T14:39:05.716844Z" + }, + "papermill": { + "duration": 6.338733, + "end_time": "2023-08-26T14:39:05.720399", + "exception": false, + "start_time": "2023-08-26T14:38:59.381666", + "status": "completed" }, + "tags": [] + }, + "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 15500 tokens : 3.3419354838709676% similarity, with 518 matched token, and 14982 token mismatch\r\n" + "[2023-08-26 14:39:03,924] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 15600 tokens : 3.346153846153846% similarity, with 522 matched token, and 15078 token mismatch\r\n" + "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n", + "Traceback (most recent call last):\r\n", + " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 366, in \r\n", + " asyncio.run(main_function())\r\n", + " File \"/usr/lib/python3.10/asyncio/runners.py\", line 44, in run\r\n", + " return loop.run_until_complete(main)\r\n", + " File \"/usr/lib/python3.10/asyncio/base_events.py\", line 649, in run_until_complete\r\n", + " return future.result()\r\n", + " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 58, in main_function\r\n", + " model = SimpleRWKV(model_path, device=\"cuda\")\r\n", + " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 1378, in __init__\r\n", + " self.model = RWKV(**model_config)\r\n", + " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 553, in __init__\r\n", + " raise ValueError(f\"load_model file '{load_model}' does not exist\")\r\n", + "ValueError: load_model file '../../../model/EWR-1B5-E0_1.pth' does not exist\r\n" ] + } + ], + "source": [ + "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/EWR-1B5-E0_1.pth\" \"./logs/v5-EWR-1B5-E0_1-1k.csv\"" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "851be2b7", + "metadata": { + "execution": { + "iopub.execute_input": "2023-08-26T14:39:05.838572Z", + "iopub.status.busy": "2023-08-26T14:39:05.837927Z", + "iopub.status.idle": "2023-08-26T14:39:12.062651Z", + "shell.execute_reply": "2023-08-26T14:39:12.061734Z" + }, + "papermill": { + "duration": 6.287262, + "end_time": "2023-08-26T14:39:12.065659", + "exception": false, + "start_time": "2023-08-26T14:39:05.778397", + "status": "completed" }, + "tags": [] + }, + "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 15700 tokens : 3.3503184713375793% similarity, with 526 matched token, and 15174 token mismatch\r\n" + "[2023-08-26 14:39:10,148] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 15800 tokens : 3.3417721518987342% similarity, with 528 matched token, and 15272 token mismatch\r\n" + "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n", + "Traceback (most recent call last):\r\n", + " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 366, in \r\n", + " asyncio.run(main_function())\r\n", + " File \"/usr/lib/python3.10/asyncio/runners.py\", line 44, in run\r\n", + " return loop.run_until_complete(main)\r\n", + " File \"/usr/lib/python3.10/asyncio/base_events.py\", line 649, in run_until_complete\r\n", + " return future.result()\r\n", + " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 58, in main_function\r\n", + " model = SimpleRWKV(model_path, device=\"cuda\")\r\n", + " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 1378, in __init__\r\n", + " self.model = RWKV(**model_config)\r\n", + " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 553, in __init__\r\n", + " raise ValueError(f\"load_model file '{load_model}' does not exist\")\r\n", + "ValueError: load_model file '../../../model/EWR-1B5-E0_1.pth' does not exist\r\n" ] + } + ], + "source": [ + "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/EWR-1B5-E0_1.pth\" \"./logs/v5-EWR-1B5-E0_1-4k.csv\" 1100 4000" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "e6022677", + "metadata": { + "execution": { + "iopub.execute_input": "2023-08-26T14:39:12.215332Z", + "iopub.status.busy": "2023-08-26T14:39:12.214878Z", + "iopub.status.idle": "2023-08-26T14:39:18.967986Z", + "shell.execute_reply": "2023-08-26T14:39:18.967070Z" }, + "papermill": { + "duration": 6.823866, + "end_time": "2023-08-26T14:39:18.970264", + "exception": false, + "start_time": "2023-08-26T14:39:12.146398", + "status": "completed" + }, + "tags": [] + }, + "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 15900 tokens : 3.3333333333333335% similarity, with 530 matched token, and 15370 token mismatch\r\n" + "[2023-08-26 14:39:16,784] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 16000 tokens : 3.325% similarity, with 532 matched token, and 15468 token mismatch\r\n" + "[RWKV.model] Running RWKV model using 'torch-jit' with torch '2.0.1+cu118'\r\n", + "Traceback (most recent call last):\r\n", + " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 366, in \r\n", + " asyncio.run(main_function())\r\n", + " File \"/usr/lib/python3.10/asyncio/runners.py\", line 44, in run\r\n", + " return loop.run_until_complete(main)\r\n", + " File \"/usr/lib/python3.10/asyncio/base_events.py\", line 649, in run_until_complete\r\n", + " return future.result()\r\n", + " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/./memory_script/eval_v5_memory_guided.py\", line 58, in main_function\r\n", + " model = SimpleRWKV(model_path, device=\"cuda\")\r\n", + " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 1378, in __init__\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "###\r\n", - "### Model validation end ###\r\n", - "###\r\n" + " self.model = RWKV(**model_config)\r\n", + " File \"/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/RWKV-v5/src/model.py\", line 553, in __init__\r\n", + " raise ValueError(f\"load_model file '{load_model}' does not exist\")\r\n", + "ValueError: load_model file '../../../model/EWR-1B5-E0_1.pth' does not exist\r\n" ] } ], "source": [ - "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/v5-L6-D1024-E0_1-mem-ctx-8k.pth\" \"./logs/v5-L6-D1024-E0_1-16k.csv\" 4100 16000" + "!python3 ./memory_script/eval_v5_memory_guided.py \"../../../model/EWR-1B5-E0_1.pth\" \"./logs/v5-EWR-1B5-E0_1-16k.csv\" 4100 16000" ] }, { "cell_type": "markdown", - "id": "579317b2", + "id": "29d656b6", "metadata": { "papermill": { - "duration": 0.104356, - "end_time": "2023-09-05T22:15:38.079271", + "duration": 0.061957, + "end_time": "2023-08-26T14:39:19.094552", "exception": false, - "start_time": "2023-09-05T22:15:37.974915", + "start_time": "2023-08-26T14:39:19.032595", "status": "completed" }, "tags": [] @@ -15678,20 +8824,20 @@ }, { "cell_type": "code", - "execution_count": 13, - "id": "a3bc5e5c", + "execution_count": 10, + "id": "04f299aa", "metadata": { "execution": { - "iopub.execute_input": "2023-09-05T22:15:38.293951Z", - "iopub.status.busy": "2023-09-05T22:15:38.293240Z", - "iopub.status.idle": "2023-09-05T22:16:30.929975Z", - "shell.execute_reply": "2023-09-05T22:16:30.928742Z" + "iopub.execute_input": "2023-08-26T14:39:19.221229Z", + "iopub.status.busy": "2023-08-26T14:39:19.220475Z", + "iopub.status.idle": "2023-08-26T14:40:15.430273Z", + "shell.execute_reply": "2023-08-26T14:40:15.428492Z" }, "papermill": { - "duration": 52.74712, - "end_time": "2023-09-05T22:16:30.932428", + "duration": 56.276274, + "end_time": "2023-08-26T14:40:15.432948", "exception": false, - "start_time": "2023-09-05T22:15:38.185308", + "start_time": "2023-08-26T14:39:19.156674", "status": "completed" }, "tags": [] @@ -15701,7 +8847,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "[2023-09-05 22:15:42,702] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" + "[2023-08-26 14:39:23,732] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { @@ -16186,20 +9332,14 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1000 tokens : 67.4% similarity, with 674 matched token, and 326 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Finished baseline model to eval output predictive matching (aka 0 memory?), for 1000 tokens\r\n" + "## Model validation for 1000 tokens : 67.5% similarity, with 675 matched token, and 325 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ + "## Finished baseline model to eval output predictive matching (aka 0 memory?), for 1000 tokens\r\n", "###\r\n", "### Model validation end ###\r\n", "###\r\n" @@ -16212,20 +9352,20 @@ }, { "cell_type": "code", - "execution_count": 14, - "id": "6bf21423", + "execution_count": 11, + "id": "cd974aff", "metadata": { "execution": { - "iopub.execute_input": "2023-09-05T22:16:31.257032Z", - "iopub.status.busy": "2023-09-05T22:16:31.256036Z", - "iopub.status.idle": "2023-09-05T22:20:35.318227Z", - "shell.execute_reply": "2023-09-05T22:20:35.316693Z" + "iopub.execute_input": "2023-08-26T14:40:15.563705Z", + "iopub.status.busy": "2023-08-26T14:40:15.561980Z", + "iopub.status.idle": "2023-08-26T14:44:23.290770Z", + "shell.execute_reply": "2023-08-26T14:44:23.289849Z" }, "papermill": { - "duration": 244.178194, - "end_time": "2023-09-05T22:20:35.320591", + "duration": 247.796902, + "end_time": "2023-08-26T14:44:23.293511", "exception": false, - "start_time": "2023-09-05T22:16:31.142397", + "start_time": "2023-08-26T14:40:15.496609", "status": "completed" }, "tags": [] @@ -16235,7 +9375,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "[2023-09-05 22:16:35,877] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" + "[2023-08-26 14:40:19,891] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { @@ -16293,7 +9433,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1350 tokens : 50.37037037037037% similarity, with 680 matched token, and 670 token mismatch\r\n" + "## Model validation for 1350 tokens : 50.2962962962963% similarity, with 679 matched token, and 671 token mismatch\r\n" ] }, { @@ -16328,7 +9468,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1600 tokens : 41.125% similarity, with 658 matched token, and 942 token mismatch\r\n" + "## Model validation for 1600 tokens : 41.1875% similarity, with 659 matched token, and 941 token mismatch\r\n" ] }, { @@ -16342,7 +9482,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1700 tokens : 38.23529411764706% similarity, with 650 matched token, and 1050 token mismatch\r\n" + "## Model validation for 1700 tokens : 38.1764705882353% similarity, with 649 matched token, and 1051 token mismatch\r\n" ] }, { @@ -16356,21 +9496,21 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1800 tokens : 35.388888888888886% similarity, with 637 matched token, and 1163 token mismatch\r\n" + "## Model validation for 1800 tokens : 35.44444444444444% similarity, with 638 matched token, and 1162 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1850 tokens : 33.4054054054054% similarity, with 618 matched token, and 1232 token mismatch\r\n" + "## Model validation for 1850 tokens : 33.2972972972973% similarity, with 616 matched token, and 1234 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1900 tokens : 32.315789473684205% similarity, with 614 matched token, and 1286 token mismatch\r\n" + "## Model validation for 1900 tokens : 32.26315789473684% similarity, with 613 matched token, and 1287 token mismatch\r\n" ] }, { @@ -16384,7 +9524,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2000 tokens : 30.75% similarity, with 615 matched token, and 1385 token mismatch\r\n" + "## Model validation for 2000 tokens : 30.7% similarity, with 614 matched token, and 1386 token mismatch\r\n" ] }, { @@ -16405,14 +9545,14 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2150 tokens : 28.511627906976745% similarity, with 613 matched token, and 1537 token mismatch\r\n" + "## Model validation for 2150 tokens : 28.55813953488372% similarity, with 614 matched token, and 1536 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2200 tokens : 28.045454545454547% similarity, with 617 matched token, and 1583 token mismatch\r\n" + "## Model validation for 2200 tokens : 28.000000000000004% similarity, with 616 matched token, and 1584 token mismatch\r\n" ] }, { @@ -16447,7 +9587,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2450 tokens : 24.653061224489793% similarity, with 604 matched token, and 1846 token mismatch\r\n" + "## Model validation for 2450 tokens : 24.816326530612244% similarity, with 608 matched token, and 1842 token mismatch\r\n" ] }, { @@ -16461,21 +9601,21 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2550 tokens : 23.764705882352942% similarity, with 606 matched token, and 1944 token mismatch\r\n" + "## Model validation for 2550 tokens : 23.72549019607843% similarity, with 605 matched token, and 1945 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2600 tokens : 23.26923076923077% similarity, with 605 matched token, and 1995 token mismatch\r\n" + "## Model validation for 2600 tokens : 23.23076923076923% similarity, with 604 matched token, and 1996 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2650 tokens : 22.79245283018868% similarity, with 604 matched token, and 2046 token mismatch\r\n" + "## Model validation for 2650 tokens : 22.754716981132077% similarity, with 603 matched token, and 2047 token mismatch\r\n" ] }, { @@ -16496,7 +9636,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2800 tokens : 21.464285714285715% similarity, with 601 matched token, and 2199 token mismatch\r\n" + "## Model validation for 2800 tokens : 21.392857142857142% similarity, with 599 matched token, and 2201 token mismatch\r\n" ] }, { @@ -16510,21 +9650,21 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2900 tokens : 20.620689655172413% similarity, with 598 matched token, and 2302 token mismatch\r\n" + "## Model validation for 2900 tokens : 20.655172413793103% similarity, with 599 matched token, and 2301 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2950 tokens : 20.30508474576271% similarity, with 599 matched token, and 2351 token mismatch\r\n" + "## Model validation for 2950 tokens : 20.271186440677965% similarity, with 598 matched token, and 2352 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3000 tokens : 19.933333333333334% similarity, with 598 matched token, and 2402 token mismatch\r\n" + "## Model validation for 3000 tokens : 19.8% similarity, with 594 matched token, and 2406 token mismatch\r\n" ] }, { @@ -16538,7 +9678,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3100 tokens : 19.193548387096772% similarity, with 595 matched token, and 2505 token mismatch\r\n" + "## Model validation for 3100 tokens : 19.225806451612904% similarity, with 596 matched token, and 2504 token mismatch\r\n" ] }, { @@ -16566,35 +9706,35 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3300 tokens : 17.87878787878788% similarity, with 590 matched token, and 2710 token mismatch\r\n" + "## Model validation for 3300 tokens : 17.84848484848485% similarity, with 589 matched token, and 2711 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3350 tokens : 17.55223880597015% similarity, with 588 matched token, and 2762 token mismatch\r\n" + "## Model validation for 3350 tokens : 17.522388059701495% similarity, with 587 matched token, and 2763 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3400 tokens : 17.323529411764707% similarity, with 589 matched token, and 2811 token mismatch\r\n" + "## Model validation for 3400 tokens : 17.352941176470587% similarity, with 590 matched token, and 2810 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3450 tokens : 16.98550724637681% similarity, with 586 matched token, and 2864 token mismatch\r\n" + "## Model validation for 3450 tokens : 16.956521739130434% similarity, with 585 matched token, and 2865 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3500 tokens : 16.62857142857143% similarity, with 582 matched token, and 2918 token mismatch\r\n" + "## Model validation for 3500 tokens : 16.57142857142857% similarity, with 580 matched token, and 2920 token mismatch\r\n" ] }, { @@ -16608,35 +9748,35 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3600 tokens : 15.944444444444445% similarity, with 574 matched token, and 3026 token mismatch\r\n" + "## Model validation for 3600 tokens : 16.0% similarity, with 576 matched token, and 3024 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3650 tokens : 15.835616438356166% similarity, with 578 matched token, and 3072 token mismatch\r\n" + "## Model validation for 3650 tokens : 15.890410958904111% similarity, with 580 matched token, and 3070 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3700 tokens : 15.486486486486486% similarity, with 573 matched token, and 3127 token mismatch\r\n" + "## Model validation for 3700 tokens : 15.513513513513514% similarity, with 574 matched token, and 3126 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3750 tokens : 15.28% similarity, with 573 matched token, and 3177 token mismatch\r\n" + "## Model validation for 3750 tokens : 15.306666666666665% similarity, with 574 matched token, and 3176 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3800 tokens : 15.026315789473685% similarity, with 571 matched token, and 3229 token mismatch\r\n" + "## Model validation for 3800 tokens : 15.078947368421053% similarity, with 573 matched token, and 3227 token mismatch\r\n" ] }, { @@ -16650,21 +9790,21 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3900 tokens : 14.692307692307693% similarity, with 573 matched token, and 3327 token mismatch\r\n" + "## Model validation for 3900 tokens : 14.666666666666666% similarity, with 572 matched token, and 3328 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3950 tokens : 14.27848101265823% similarity, with 564 matched token, and 3386 token mismatch\r\n" + "## Model validation for 3950 tokens : 14.253164556962025% similarity, with 563 matched token, and 3387 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4000 tokens : 13.850000000000001% similarity, with 554 matched token, and 3446 token mismatch\r\n" + "## Model validation for 4000 tokens : 13.875000000000002% similarity, with 555 matched token, and 3445 token mismatch\r\n" ] }, { @@ -16683,20 +9823,20 @@ }, { "cell_type": "code", - "execution_count": 15, - "id": "44ea2959", + "execution_count": 12, + "id": "55c4b231", "metadata": { "execution": { - "iopub.execute_input": "2023-09-05T22:20:35.545636Z", - "iopub.status.busy": "2023-09-05T22:20:35.545083Z", - "iopub.status.idle": "2023-09-05T23:20:17.504268Z", - "shell.execute_reply": "2023-09-05T23:20:17.503356Z" + "iopub.execute_input": "2023-08-26T14:44:23.524751Z", + "iopub.status.busy": "2023-08-26T14:44:23.524350Z", + "iopub.status.idle": "2023-08-26T15:43:52.551775Z", + "shell.execute_reply": "2023-08-26T15:43:52.550592Z" }, "papermill": { - "duration": 3582.074768, - "end_time": "2023-09-05T23:20:17.506577", + "duration": 3569.18119, + "end_time": "2023-08-26T15:43:52.554057", "exception": false, - "start_time": "2023-09-05T22:20:35.431809", + "start_time": "2023-08-26T14:44:23.372867", "status": "completed" }, "tags": [] @@ -16706,7 +9846,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "[2023-09-05 22:20:39,857] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" + "[2023-08-26 14:44:28,120] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { @@ -16729,14 +9869,14 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4100 tokens : 13.390243902439025% similarity, with 549 matched token, and 3551 token mismatch\r\n" + "## Model validation for 4100 tokens : 13.463414634146343% similarity, with 552 matched token, and 3548 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4200 tokens : 12.547619047619046% similarity, with 527 matched token, and 3673 token mismatch\r\n" + "## Model validation for 4200 tokens : 12.523809523809524% similarity, with 526 matched token, and 3674 token mismatch\r\n" ] }, { @@ -16750,21 +9890,21 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4400 tokens : 10.772727272727273% similarity, with 474 matched token, and 3926 token mismatch\r\n" + "## Model validation for 4400 tokens : 10.795454545454545% similarity, with 475 matched token, and 3925 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4500 tokens : 9.88888888888889% similarity, with 445 matched token, and 4055 token mismatch\r\n" + "## Model validation for 4500 tokens : 9.911111111111111% similarity, with 446 matched token, and 4054 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4600 tokens : 8.782608695652174% similarity, with 404 matched token, and 4196 token mismatch\r\n" + "## Model validation for 4600 tokens : 8.76086956521739% similarity, with 403 matched token, and 4197 token mismatch\r\n" ] }, { @@ -16792,14 +9932,14 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5000 tokens : 5.4399999999999995% similarity, with 272 matched token, and 4728 token mismatch\r\n" + "## Model validation for 5000 tokens : 5.46% similarity, with 273 matched token, and 4727 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5100 tokens : 4.96078431372549% similarity, with 253 matched token, and 4847 token mismatch\r\n" + "## Model validation for 5100 tokens : 4.980392156862745% similarity, with 254 matched token, and 4846 token mismatch\r\n" ] }, { @@ -16813,21 +9953,21 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5300 tokens : 4.377358490566038% similarity, with 232 matched token, and 5068 token mismatch\r\n" + "## Model validation for 5300 tokens : 4.3584905660377355% similarity, with 231 matched token, and 5069 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5400 tokens : 4.092592592592593% similarity, with 221 matched token, and 5179 token mismatch\r\n" + "## Model validation for 5400 tokens : 4.12962962962963% similarity, with 223 matched token, and 5177 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5500 tokens : 4.0% similarity, with 220 matched token, and 5280 token mismatch\r\n" + "## Model validation for 5500 tokens : 4.018181818181818% similarity, with 221 matched token, and 5279 token mismatch\r\n" ] }, { @@ -16862,7 +10002,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6000 tokens : 3.55% similarity, with 213 matched token, and 5787 token mismatch\r\n" + "## Model validation for 6000 tokens : 3.5333333333333337% similarity, with 212 matched token, and 5788 token mismatch\r\n" ] }, { @@ -16876,7 +10016,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6200 tokens : 3.5000000000000004% similarity, with 217 matched token, and 5983 token mismatch\r\n" + "## Model validation for 6200 tokens : 3.516129032258065% similarity, with 218 matched token, and 5982 token mismatch\r\n" ] }, { @@ -16904,7 +10044,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6600 tokens : 3.424242424242424% similarity, with 226 matched token, and 6374 token mismatch\r\n" + "## Model validation for 6600 tokens : 3.4393939393939394% similarity, with 227 matched token, and 6373 token mismatch\r\n" ] }, { @@ -16925,7 +10065,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6900 tokens : 3.4492753623188404% similarity, with 238 matched token, and 6662 token mismatch\r\n" + "## Model validation for 6900 tokens : 3.4637681159420293% similarity, with 239 matched token, and 6661 token mismatch\r\n" ] }, { @@ -16946,7 +10086,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 7200 tokens : 3.4027777777777777% similarity, with 245 matched token, and 6955 token mismatch\r\n" + "## Model validation for 7200 tokens : 3.3888888888888893% similarity, with 244 matched token, and 6956 token mismatch\r\n" ] }, { @@ -17030,7 +10170,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 8400 tokens : 3.428571428571429% similarity, with 288 matched token, and 8112 token mismatch\r\n" + "## Model validation for 8400 tokens : 3.4166666666666665% similarity, with 287 matched token, and 8113 token mismatch\r\n" ] }, { @@ -17079,7 +10219,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9100 tokens : 3.4505494505494507% similarity, with 314 matched token, and 8786 token mismatch\r\n" + "## Model validation for 9100 tokens : 3.4395604395604393% similarity, with 313 matched token, and 8787 token mismatch\r\n" ] }, { @@ -17100,21 +10240,21 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9400 tokens : 3.404255319148936% similarity, with 320 matched token, and 9080 token mismatch\r\n" + "## Model validation for 9400 tokens : 3.393617021276596% similarity, with 319 matched token, and 9081 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9500 tokens : 3.431578947368421% similarity, with 326 matched token, and 9174 token mismatch\r\n" + "## Model validation for 9500 tokens : 3.421052631578948% similarity, with 325 matched token, and 9175 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9600 tokens : 3.4166666666666665% similarity, with 328 matched token, and 9272 token mismatch\r\n" + "## Model validation for 9600 tokens : 3.4062500000000004% similarity, with 327 matched token, and 9273 token mismatch\r\n" ] }, { @@ -17135,7 +10275,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 9900 tokens : 3.424242424242424% similarity, with 339 matched token, and 9561 token mismatch\r\n" + "## Model validation for 9900 tokens : 3.414141414141414% similarity, with 338 matched token, and 9562 token mismatch\r\n" ] }, { @@ -17177,7 +10317,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 10500 tokens : 3.4666666666666663% similarity, with 364 matched token, and 10136 token mismatch\r\n" + "## Model validation for 10500 tokens : 3.4571428571428573% similarity, with 363 matched token, and 10137 token mismatch\r\n" ] }, { @@ -17338,7 +10478,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 12800 tokens : 3.578125% similarity, with 458 matched token, and 12342 token mismatch\r\n" + "## Model validation for 12800 tokens : 3.5703125% similarity, with 457 matched token, and 12343 token mismatch\r\n" ] }, { @@ -17366,7 +10506,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 13200 tokens : 3.5833333333333335% similarity, with 473 matched token, and 12727 token mismatch\r\n" + "## Model validation for 13200 tokens : 3.5757575757575757% similarity, with 472 matched token, and 12728 token mismatch\r\n" ] }, { @@ -17485,7 +10625,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 14900 tokens : 3.610738255033557% similarity, with 538 matched token, and 14362 token mismatch\r\n" + "## Model validation for 14900 tokens : 3.604026845637584% similarity, with 537 matched token, and 14363 token mismatch\r\n" ] }, { @@ -17527,7 +10667,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 15500 tokens : 3.587096774193548% similarity, with 556 matched token, and 14944 token mismatch\r\n" + "## Model validation for 15500 tokens : 3.5806451612903225% similarity, with 555 matched token, and 14945 token mismatch\r\n" ] }, { @@ -17562,13 +10702,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 16000 tokens : 3.5687499999999996% similarity, with 571 matched token, and 15429 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ + "## Model validation for 16000 tokens : 3.5687499999999996% similarity, with 571 matched token, and 15429 token mismatch\r\n", "###\r\n", "### Model validation end ###\r\n", "###\r\n" @@ -17581,13 +10715,13 @@ }, { "cell_type": "markdown", - "id": "b398575a", + "id": "9fdb5030", "metadata": { "papermill": { - "duration": 0.123548, - "end_time": "2023-09-05T23:20:17.753184", + "duration": 0.075748, + "end_time": "2023-08-26T15:43:52.704738", "exception": false, - "start_time": "2023-09-05T23:20:17.629636", + "start_time": "2023-08-26T15:43:52.628990", "status": "completed" }, "tags": [] @@ -17598,20 +10732,20 @@ }, { "cell_type": "code", - "execution_count": 16, - "id": "b3229188", + "execution_count": 13, + "id": "59ffd864", "metadata": { "execution": { - "iopub.execute_input": "2023-09-05T23:20:18.000562Z", - "iopub.status.busy": "2023-09-05T23:20:18.000185Z", - "iopub.status.idle": "2023-09-05T23:21:27.371500Z", - "shell.execute_reply": "2023-09-05T23:21:27.370336Z" + "iopub.execute_input": "2023-08-26T15:43:52.859479Z", + "iopub.status.busy": "2023-08-26T15:43:52.858275Z", + "iopub.status.idle": "2023-08-26T15:44:58.323128Z", + "shell.execute_reply": "2023-08-26T15:44:58.322179Z" }, "papermill": { - "duration": 69.497703, - "end_time": "2023-09-05T23:21:27.373916", + "duration": 65.543854, + "end_time": "2023-08-26T15:44:58.325168", "exception": false, - "start_time": "2023-09-05T23:20:17.876213", + "start_time": "2023-08-26T15:43:52.781314", "status": "completed" }, "tags": [] @@ -17621,7 +10755,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "[2023-09-05 23:20:22,562] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" + "[2023-08-26 15:43:57,356] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { @@ -18132,20 +11266,20 @@ }, { "cell_type": "code", - "execution_count": 17, - "id": "33e254f7", + "execution_count": 14, + "id": "816d4475", "metadata": { "execution": { - "iopub.execute_input": "2023-09-05T23:21:27.628949Z", - "iopub.status.busy": "2023-09-05T23:21:27.628479Z", - "iopub.status.idle": "2023-09-05T23:25:51.884822Z", - "shell.execute_reply": "2023-09-05T23:25:51.883772Z" + "iopub.execute_input": "2023-08-26T15:44:58.475082Z", + "iopub.status.busy": "2023-08-26T15:44:58.474129Z", + "iopub.status.idle": "2023-08-26T15:48:50.587080Z", + "shell.execute_reply": "2023-08-26T15:48:50.585908Z" }, "papermill": { - "duration": 264.386818, - "end_time": "2023-09-05T23:25:51.887041", + "duration": 232.19095, + "end_time": "2023-08-26T15:48:50.589477", "exception": false, - "start_time": "2023-09-05T23:21:27.500223", + "start_time": "2023-08-26T15:44:58.398527", "status": "completed" }, "tags": [] @@ -18155,7 +11289,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "[2023-09-05 23:21:32,282] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" + "[2023-08-26 15:45:02,461] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { @@ -18192,7 +11326,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1200 tokens : 77.16666666666666% similarity, with 926 matched token, and 274 token mismatch\r\n" + "## Model validation for 1200 tokens : 77.08333333333334% similarity, with 925 matched token, and 275 token mismatch\r\n" ] }, { @@ -18206,7 +11340,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1300 tokens : 73.0% similarity, with 949 matched token, and 351 token mismatch\r\n" + "## Model validation for 1300 tokens : 73.07692307692307% similarity, with 950 matched token, and 350 token mismatch\r\n" ] }, { @@ -18269,7 +11403,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1750 tokens : 59.08571428571429% similarity, with 1034 matched token, and 716 token mismatch\r\n" + "## Model validation for 1750 tokens : 59.14285714285714% similarity, with 1035 matched token, and 715 token mismatch\r\n" ] }, { @@ -18283,21 +11417,21 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1850 tokens : 56.00000000000001% similarity, with 1036 matched token, and 814 token mismatch\r\n" + "## Model validation for 1850 tokens : 55.945945945945944% similarity, with 1035 matched token, and 815 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1900 tokens : 54.89473684210526% similarity, with 1043 matched token, and 857 token mismatch\r\n" + "## Model validation for 1900 tokens : 54.94736842105263% similarity, with 1044 matched token, and 856 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 1950 tokens : 53.17948717948718% similarity, with 1037 matched token, and 913 token mismatch\r\n" + "## Model validation for 1950 tokens : 53.230769230769226% similarity, with 1038 matched token, and 912 token mismatch\r\n" ] }, { @@ -18311,7 +11445,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2050 tokens : 50.8780487804878% similarity, with 1043 matched token, and 1007 token mismatch\r\n" + "## Model validation for 2050 tokens : 50.926829268292686% similarity, with 1044 matched token, and 1006 token mismatch\r\n" ] }, { @@ -18353,21 +11487,21 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2350 tokens : 41.61702127659574% similarity, with 978 matched token, and 1372 token mismatch\r\n" + "## Model validation for 2350 tokens : 41.65957446808511% similarity, with 979 matched token, and 1371 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2400 tokens : 40.875% similarity, with 981 matched token, and 1419 token mismatch\r\n" + "## Model validation for 2400 tokens : 40.91666666666667% similarity, with 982 matched token, and 1418 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2450 tokens : 38.9795918367347% similarity, with 955 matched token, and 1495 token mismatch\r\n" + "## Model validation for 2450 tokens : 39.02040816326531% similarity, with 956 matched token, and 1494 token mismatch\r\n" ] }, { @@ -18381,35 +11515,35 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2550 tokens : 36.431372549019606% similarity, with 929 matched token, and 1621 token mismatch\r\n" + "## Model validation for 2550 tokens : 36.470588235294116% similarity, with 930 matched token, and 1620 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2600 tokens : 35.53846153846154% similarity, with 924 matched token, and 1676 token mismatch\r\n" + "## Model validation for 2600 tokens : 35.46153846153846% similarity, with 922 matched token, and 1678 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2650 tokens : 34.60377358490566% similarity, with 917 matched token, and 1733 token mismatch\r\n" + "## Model validation for 2650 tokens : 34.56603773584906% similarity, with 916 matched token, and 1734 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2700 tokens : 33.925925925925924% similarity, with 916 matched token, and 1784 token mismatch\r\n" + "## Model validation for 2700 tokens : 33.88888888888889% similarity, with 915 matched token, and 1785 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2750 tokens : 32.690909090909095% similarity, with 899 matched token, and 1851 token mismatch\r\n" + "## Model validation for 2750 tokens : 32.654545454545456% similarity, with 898 matched token, and 1852 token mismatch\r\n" ] }, { @@ -18423,28 +11557,28 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2850 tokens : 31.017543859649123% similarity, with 884 matched token, and 1966 token mismatch\r\n" + "## Model validation for 2850 tokens : 31.05263157894737% similarity, with 885 matched token, and 1965 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2900 tokens : 30.06896551724138% similarity, with 872 matched token, and 2028 token mismatch\r\n" + "## Model validation for 2900 tokens : 30.10344827586207% similarity, with 873 matched token, and 2027 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 2950 tokens : 29.322033898305083% similarity, with 865 matched token, and 2085 token mismatch\r\n" + "## Model validation for 2950 tokens : 29.355932203389827% similarity, with 866 matched token, and 2084 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3000 tokens : 28.7% similarity, with 861 matched token, and 2139 token mismatch\r\n" + "## Model validation for 3000 tokens : 28.666666666666668% similarity, with 860 matched token, and 2140 token mismatch\r\n" ] }, { @@ -18486,14 +11620,14 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3300 tokens : 25.151515151515152% similarity, with 830 matched token, and 2470 token mismatch\r\n" + "## Model validation for 3300 tokens : 25.181818181818183% similarity, with 831 matched token, and 2469 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3350 tokens : 24.507462686567163% similarity, with 821 matched token, and 2529 token mismatch\r\n" + "## Model validation for 3350 tokens : 24.44776119402985% similarity, with 819 matched token, and 2531 token mismatch\r\n" ] }, { @@ -18542,14 +11676,14 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3700 tokens : 21.756756756756758% similarity, with 805 matched token, and 2895 token mismatch\r\n" + "## Model validation for 3700 tokens : 21.783783783783782% similarity, with 806 matched token, and 2894 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 3750 tokens : 21.493333333333332% similarity, with 806 matched token, and 2944 token mismatch\r\n" + "## Model validation for 3750 tokens : 21.52% similarity, with 807 matched token, and 2943 token mismatch\r\n" ] }, { @@ -18603,20 +11737,20 @@ }, { "cell_type": "code", - "execution_count": 18, - "id": "5d33ffaa", + "execution_count": 15, + "id": "3246699f", "metadata": { "execution": { - "iopub.execute_input": "2023-09-05T23:25:52.152096Z", - "iopub.status.busy": "2023-09-05T23:25:52.151535Z", - "iopub.status.idle": "2023-09-06T00:28:45.815950Z", - "shell.execute_reply": "2023-09-06T00:28:45.814816Z" + "iopub.execute_input": "2023-08-26T15:48:50.755698Z", + "iopub.status.busy": "2023-08-26T15:48:50.754546Z", + "iopub.status.idle": "2023-08-26T16:51:12.767938Z", + "shell.execute_reply": "2023-08-26T16:51:12.766985Z" }, "papermill": { - "duration": 3773.798194, - "end_time": "2023-09-06T00:28:45.818553", + "duration": 3742.098954, + "end_time": "2023-08-26T16:51:12.770407", "exception": false, - "start_time": "2023-09-05T23:25:52.020359", + "start_time": "2023-08-26T15:48:50.671453", "status": "completed" }, "tags": [] @@ -18626,7 +11760,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "[2023-09-05 23:25:56,732] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" + "[2023-08-26 15:48:55,284] [INFO] [real_accelerator.py:133:get_accelerator] Setting ds_accelerator to cuda (auto detect)\r\n" ] }, { @@ -18649,35 +11783,35 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4100 tokens : 19.390243902439025% similarity, with 795 matched token, and 3305 token mismatch\r\n" + "## Model validation for 4100 tokens : 19.439024390243905% similarity, with 797 matched token, and 3303 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4200 tokens : 18.452380952380953% similarity, with 775 matched token, and 3425 token mismatch\r\n" + "## Model validation for 4200 tokens : 18.5% similarity, with 777 matched token, and 3423 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4300 tokens : 17.883720930232556% similarity, with 769 matched token, and 3531 token mismatch\r\n" + "## Model validation for 4300 tokens : 17.906976744186046% similarity, with 770 matched token, and 3530 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4400 tokens : 17.09090909090909% similarity, with 752 matched token, and 3648 token mismatch\r\n" + "## Model validation for 4400 tokens : 17.06818181818182% similarity, with 751 matched token, and 3649 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 4500 tokens : 16.400000000000002% similarity, with 738 matched token, and 3762 token mismatch\r\n" + "## Model validation for 4500 tokens : 16.377777777777776% similarity, with 737 matched token, and 3763 token mismatch\r\n" ] }, { @@ -18712,14 +11846,14 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5000 tokens : 12.46% similarity, with 623 matched token, and 4377 token mismatch\r\n" + "## Model validation for 5000 tokens : 12.42% similarity, with 621 matched token, and 4379 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5100 tokens : 11.490196078431373% similarity, with 586 matched token, and 4514 token mismatch\r\n" + "## Model validation for 5100 tokens : 11.470588235294118% similarity, with 585 matched token, and 4515 token mismatch\r\n" ] }, { @@ -18740,7 +11874,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5400 tokens : 8.685185185185185% similarity, with 469 matched token, and 4931 token mismatch\r\n" + "## Model validation for 5400 tokens : 8.666666666666668% similarity, with 468 matched token, and 4932 token mismatch\r\n" ] }, { @@ -18775,7 +11909,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 5900 tokens : 5.6440677966101696% similarity, with 333 matched token, and 5567 token mismatch\r\n" + "## Model validation for 5900 tokens : 5.627118644067797% similarity, with 332 matched token, and 5568 token mismatch\r\n" ] }, { @@ -18831,14 +11965,14 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6700 tokens : 3.805970149253731% similarity, with 255 matched token, and 6445 token mismatch\r\n" + "## Model validation for 6700 tokens : 3.7910447761194033% similarity, with 254 matched token, and 6446 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 6800 tokens : 3.691176470588235% similarity, with 251 matched token, and 6549 token mismatch\r\n" + "## Model validation for 6800 tokens : 3.6764705882352944% similarity, with 250 matched token, and 6550 token mismatch\r\n" ] }, { @@ -19468,27 +12602,21 @@ "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 15800 tokens : 3.531645569620253% similarity, with 558 matched token, and 15242 token mismatch\r\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "## Model validation for 15900 tokens : 3.534591194968553% similarity, with 562 matched token, and 15338 token mismatch\r\n" + "## Model validation for 15800 tokens : 3.537974683544304% similarity, with 559 matched token, and 15241 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "## Model validation for 16000 tokens : 3.5249999999999995% similarity, with 564 matched token, and 15436 token mismatch\r\n" + "## Model validation for 15900 tokens : 3.528301886792453% similarity, with 561 matched token, and 15339 token mismatch\r\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ + "## Model validation for 16000 tokens : 3.5249999999999995% similarity, with 564 matched token, and 15436 token mismatch\r\n", "###\r\n", "### Model validation end ###\r\n", "###\r\n" @@ -19520,14 +12648,14 @@ }, "papermill": { "default_parameters": {}, - "duration": 16222.341869, - "end_time": "2023-09-06T00:28:46.417740", + "duration": 12231.801051, + "end_time": "2023-08-26T16:51:13.211146", "environment_variables": {}, "exception": null, "input_path": "/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/notebook/experiment/memory-bench/Benchmark-V5.ipynb", "output_path": "/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/Benchmark-V5.ipynb", "parameters": {}, - "start_time": "2023-09-05T19:58:24.075871", + "start_time": "2023-08-26T13:27:21.410095", "version": "2.4.0" } },