File size: 10,818 Bytes
8454beb
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
53bc06c
dd895c2
7ddc620
 
 
 
 
 
 
 
 
 
 
 
ee3a211
 
11c5233
8654a52
4ee5efd
f924a7e
9682aeb
27a3eb2
16d30e4
6a91f3b
cf7e531
14a1344
43cfc25
37c532b
3174373
9d8d0d1
71703ff
628af9b
75b431c
9a6ecaa
1775dcc
ceba8a7
9520fd8
76ae850
d8c75e1
4e1f31f
6064435
bb5e1f0
9d5ca78
5c6bf4e
343ab45
89b3cf3
267e3f4
0060bfd
c5fa00d
ed039d0
ff7fe26
44c409b
02e5adf
c380549
ba60d68
83b88d8
11a005c
6de3653
18cf0db
c30f394
bb603ed
b03b051
63a930b
2a4cdfa
a88a1bd
432b7bb
5009739
95d0170
033ffd7
51c4d54
2609be5
21657c7
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
# Generic Git LFS rules, matched by file name pattern.
# Every rule below sets the same four attributes on matching paths:
#   filter=lfs  - run content through the "lfs" clean/smudge filter
#   diff=lfs    - use the "lfs" diff driver
#   merge=lfs   - use the "lfs" merge driver
#   -text       - unset the text attribute (no end-of-line normalization)
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
# Directory rule: everything below any saved_model/ directory level.
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
# "*.tar.*" covers compressed tarballs with a double extension; "*.tar" covers plain ones.
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
# Substring match: any file whose name contains "tfevents".
*tfevents* filter=lfs diff=lfs merge=lfs -text
# Exact-path Git LFS rules for individual experiment files
# (notebooks under experiment/rwkv-x-exp/ and CSV logs under experiment/memory-bench/logs/).
# Each rule names a single file; renaming or moving the file leaves its rule stale.
experiment/rwkv-x-exp/v5-headsize2x/v5-L6-D4096-E1e-1-ctx4k-part2.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-headsize2x/v5-L6-D2048-E1e-1-ctx4k-part2.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/BaseV5-C-Tune5-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/BaseV5-C-Tune5-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5-hs2x-L6-D4096-E0_1-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5-hs2x-L6-D4096-E0_1-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5-L6-D2048-E0_1-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5-L6-D2048-E0_1-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5-L6-D4096-E0_1-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5-L6-D4096-E0_1-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5wave-1B5-E0_1-ctx-16k-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5wave-1B5-E0_1-ctx-16k-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/WavenetV5-C-Tune5-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/WavenetV5-C-Tune5-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5wave-13-1B5-E0_1-ctx-16k-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5wave-13-1B5-E0_1-ctx-16k-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-headsize32/v5-L6-D2048-E1e-1-ctx4k-part2.ipynb filter=lfs diff=lfs merge=lfs -text
# Exact-path Git LFS rules for files under
# actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/
# (memory-bench CSV logs plus one rwkv-x-exp notebook).
# NOTE(review): these paths look like a CI runner work directory rather than
# hand-authored sources - confirm the files still exist and the rules are still needed.
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-L6-D4096-E0_1-4k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-L6-D4096-E0_1-16k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-L6-D2048-E0_1-16k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-L6-D2048-E0_1-4k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/BaseV5-C-Tune5-4k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/BaseV5-C-Tune5-16k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/rwkv-x-exp/v5-small-model/v5-L6-ctx4k-models-part1.ipynb filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5wave-13-1B5-E0_1-ctx-16k-4k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/WavenetV5-C-Tune5-4k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/WavenetV5-C-Tune5-16k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5wave-13-1B5-E0_1-ctx-16k-16k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-hs2x-L6-D4096-E0_1-4k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-hs2x-L6-D2048-E0_1-4k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-hs2x-L6-D2048-E0_1-16k.csv filter=lfs diff=lfs merge=lfs -text
actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-hs2x-L6-D4096-E0_1-16k.csv filter=lfs diff=lfs merge=lfs -text
# Exact-path Git LFS rules for CSV logs under
# experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/
# NOTE(review): the actions-runner/_work/... segment nested inside experiment/memory-bench/
# looks like runner output written relative to that directory - confirm these files
# are intentionally tracked before keeping or removing the rules.
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/WavenetV5-C-Tune5-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5wave-13-1B5-E0_1-ctx-16k-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/WavenetV5-C-Tune5-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5wave-13-1B5-E0_1-ctx-16k-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-hs2x-L6-D4096-E0_1-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-hs2x-L6-D2048-E0_1-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-hs2x-L6-D4096-E0_1-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-hs2x-L6-D2048-E0_1-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-L6-D4096-E0_1-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-L6-D4096-E0_1-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-L6-D2048-E0_1-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/v5-L6-D2048-E0_1-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/BaseV5-C-Tune5-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/actions-runner/_work/RWKV-infctx-trainer/RWKV-infctx-trainer/output/experiment/memory-bench/logs/BaseV5-C-Tune5-16k.csv filter=lfs diff=lfs merge=lfs -text
# Exact-path Git LFS rules for further experiment files:
# memory-bench CSV logs, then notebooks under experiment/rwkv-x-exp/
# (v5-slim-memory, v5-r3-memory, multi-size-train).
# Each rule names a single file, so a new notebook or log needs its own rule here.
experiment/memory-bench/logs/v5-L96-D1024-E0_1-mem-ctx-8k-16k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5-L96-D1024-E0_1-mem-ctx-8k-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-slim-memory/v5-L6-D1024-E1e-1-ctx4k.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5-L6-D1024-E0_1-4k.csv filter=lfs diff=lfs merge=lfs -text
experiment/memory-bench/logs/v5-L6-D1024-E0_1-16k.csv filter=lfs diff=lfs merge=lfs -text
# v5-r3-memory notebooks, one directory per model configuration.
experiment/rwkv-x-exp/v5-r3-memory/L12-D2048-E1e-1-ctx4k/part1.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-r3-memory/L6-D2048-E1e-1-ctx4k/part1.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-r3-memory/L6-D2048-E1e-1-ctx4k/part2.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-r3-memory/L12-D2048-E1e-1-ctx4k/part2.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-r3-memory/L6-D2560-E1e-1-ctx4k/part1.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-r3-memory/L6-D2560-E1e-1-ctx4k/stage2.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-r3-memory/L6-D2048-E1e-1-ctx4k/stage2.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-r3-memory/L6-D2560-E1e-1-ctx4k/stage3.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-r3-memory/L6-D2048-E1e-1-ctx4k/stage3.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-r3-memory/L6-D2560-E1e-1-ctx4k/stage4.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-r3-memory/L6-D2048-E1e-1-ctx4k/stage4.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-r3-memory/L6-D2560-E1e-1-ctx4k/stage5.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/v5-r3-memory/L6-D2048-E1e-1-ctx4k/stage5.ipynb filter=lfs diff=lfs merge=lfs -text
# multi-size-train notebooks.
experiment/rwkv-x-exp/multi-size-train/v5-L6-D2048-part1.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/multi-size-train/v5-L6-D2048-baseline.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/multi-size-train/v5-L12-D2048-part1.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/multi-size-train/v5-L12-D2048-baseline.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/multi-size-train/v5-L6+6-D2048-overwrite-naive.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/multi-size-train/v5-L6-D2048-split-train.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/multi-size-train/v5-L6+6-D2048-layer-expansion.ipynb filter=lfs diff=lfs merge=lfs -text
experiment/rwkv-x-exp/multi-size-train/v5-L6-D2048-split-baseline.ipynb filter=lfs diff=lfs merge=lfs -text