recurrentg-2b-it / 2b-it /checkpoint
yingbei's picture
Upload 11 files
3309088 verified
raw
history blame
28.8 kB
��blocks.0��channel_pre_norm��scale�-PLACEHOLDER://blocks.0.channel_pre_norm.scale�mlp_block��ffw_down��bias�.PLACEHOLDER://blocks.0.mlp_block.ffw_down.bias�kernel�0PLACEHOLDER://blocks.0.mlp_block.ffw_down.kernel�ffw_up��b�)PLACEHOLDER://blocks.0.mlp_block.ffw_up.b�w�)PLACEHOLDER://blocks.0.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�0PLACEHOLDER://blocks.0.recurrent_block.conv_1d.b�w�0PLACEHOLDER://blocks.0.recurrent_block.conv_1d.w�linear_out��bias�6PLACEHOLDER://blocks.0.recurrent_block.linear_out.bias�kernel�8PLACEHOLDER://blocks.0.recurrent_block.linear_out.kernel�linear_x��bias�4PLACEHOLDER://blocks.0.recurrent_block.linear_x.bias�kernel�6PLACEHOLDER://blocks.0.recurrent_block.linear_x.kernel�linear_y��bias�4PLACEHOLDER://blocks.0.recurrent_block.linear_y.bias�kernel�6PLACEHOLDER://blocks.0.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�6PLACEHOLDER://blocks.0.recurrent_block.rg_lru.a_gate.b�w�6PLACEHOLDER://blocks.0.recurrent_block.rg_lru.a_gate.w�a_param�5PLACEHOLDER://blocks.0.recurrent_block.rg_lru.a_param�input_gate��b�:PLACEHOLDER://blocks.0.recurrent_block.rg_lru.input_gate.b�w�:PLACEHOLDER://blocks.0.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�.PLACEHOLDER://blocks.0.temporal_pre_norm.scale�blocks.1��channel_pre_norm��scale�-PLACEHOLDER://blocks.1.channel_pre_norm.scale�mlp_block��ffw_down��bias�.PLACEHOLDER://blocks.1.mlp_block.ffw_down.bias�kernel�0PLACEHOLDER://blocks.1.mlp_block.ffw_down.kernel�ffw_up��b�)PLACEHOLDER://blocks.1.mlp_block.ffw_up.b�w�)PLACEHOLDER://blocks.1.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�0PLACEHOLDER://blocks.1.recurrent_block.conv_1d.b�w�0PLACEHOLDER://blocks.1.recurrent_block.conv_1d.w�linear_out��bias�6PLACEHOLDER://blocks.1.recurrent_block.linear_out.bias�kernel�8PLACEHOLDER://blocks.1.recurrent_block.linear_out.kernel�linear_x��bias�4PLACEHOLDER://blocks.1.recurrent_block.linear_x.bias�kernel�6PLACEHOLDER://blocks.1.recurrent_block.linear_x.kernel�linear_y��bias�4PLACEHOLDER://blocks.1.recurrent_block.linear_y.bias�kernel�6PLACEHOLDER://blocks.1.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�6PLACEHOLDER://blocks.1.recurrent_block.rg_lru.a_gate.b�w�6PLACEHOLDER://blocks.1.recurrent_block.rg_lru.a_gate.w�a_param�5PLACEHOLDER://blocks.1.recurrent_block.rg_lru.a_param�input_gate��b�:PLACEHOLDER://blocks.1.recurrent_block.rg_lru.input_gate.b�w�:PLACEHOLDER://blocks.1.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�.PLACEHOLDER://blocks.1.temporal_pre_norm.scale�blocks.10��channel_pre_norm��scale�.PLACEHOLDER://blocks.10.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.10.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.10.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.10.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.10.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�1PLACEHOLDER://blocks.10.recurrent_block.conv_1d.b�w�1PLACEHOLDER://blocks.10.recurrent_block.conv_1d.w�linear_out��bias�7PLACEHOLDER://blocks.10.recurrent_block.linear_out.bias�kernel�9PLACEHOLDER://blocks.10.recurrent_block.linear_out.kernel�linear_x��bias�5PLACEHOLDER://blocks.10.recurrent_block.linear_x.bias�kernel�7PLACEHOLDER://blocks.10.recurrent_block.linear_x.kernel�linear_y��bias�5PLACEHOLDER://blocks.10.recurrent_block.linear_y.bias�kernel�7PLACEHOLDER://blocks.10.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�7PLACEHOLDER://blocks.10.recurrent_block.rg_lru.a_gate.b�w�7PLACEHOLDER://blocks.10.recurrent_block.rg_lru.a_gate.w�a_param�6PLACEHOLDER://blocks.10.recurrent_block.rg_lru.a_param�input_gate��b�;PLACEHOLDER://blocks.10.recurrent_block.rg_lru.input_gate.b�w�;PLACEHOLDER://blocks.10.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.10.temporal_pre_norm.scale�blocks.11��attention_block��proj_final��bias�7PLACEHOLDER://blocks.11.attention_block.proj_final.bias�kernel�9PLACEHOLDER://blocks.11.attention_block.proj_final.kernel�proj_k��kernel�5PLACEHOLDER://blocks.11.attention_block.proj_k.kernel�proj_q��kernel�5PLACEHOLDER://blocks.11.attention_block.proj_q.kernel�proj_v��kernel�5PLACEHOLDER://blocks.11.attention_block.proj_v.kernel�channel_pre_norm��scale�.PLACEHOLDER://blocks.11.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.11.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.11.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.11.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.11.mlp_block.ffw_up.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.11.temporal_pre_norm.scale�blocks.12��channel_pre_norm��scale�.PLACEHOLDER://blocks.12.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.12.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.12.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.12.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.12.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�1PLACEHOLDER://blocks.12.recurrent_block.conv_1d.b�w�1PLACEHOLDER://blocks.12.recurrent_block.conv_1d.w�linear_out��bias�7PLACEHOLDER://blocks.12.recurrent_block.linear_out.bias�kernel�9PLACEHOLDER://blocks.12.recurrent_block.linear_out.kernel�linear_x��bias�5PLACEHOLDER://blocks.12.recurrent_block.linear_x.bias�kernel�7PLACEHOLDER://blocks.12.recurrent_block.linear_x.kernel�linear_y��bias�5PLACEHOLDER://blocks.12.recurrent_block.linear_y.bias�kernel�7PLACEHOLDER://blocks.12.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�7PLACEHOLDER://blocks.12.recurrent_block.rg_lru.a_gate.b�w�7PLACEHOLDER://blocks.12.recurrent_block.rg_lru.a_gate.w�a_param�6PLACEHOLDER://blocks.12.recurrent_block.rg_lru.a_param�input_gate��b�;PLACEHOLDER://blocks.12.recurrent_block.rg_lru.input_gate.b�w�;PLACEHOLDER://blocks.12.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.12.temporal_pre_norm.scale�blocks.13��channel_pre_norm��scale�.PLACEHOLDER://blocks.13.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.13.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.13.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.13.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.13.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�1PLACEHOLDER://blocks.13.recurrent_block.conv_1d.b�w�1PLACEHOLDER://blocks.13.recurrent_block.conv_1d.w�linear_out��bias�7PLACEHOLDER://blocks.13.recurrent_block.linear_out.bias�kernel�9PLACEHOLDER://blocks.13.recurrent_block.linear_out.kernel�linear_x��bias�5PLACEHOLDER://blocks.13.recurrent_block.linear_x.bias�kernel�7PLACEHOLDER://blocks.13.recurrent_block.linear_x.kernel�linear_y��bias�5PLACEHOLDER://blocks.13.recurrent_block.linear_y.bias�kernel�7PLACEHOLDER://blocks.13.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�7PLACEHOLDER://blocks.13.recurrent_block.rg_lru.a_gate.b�w�7PLACEHOLDER://blocks.13.recurrent_block.rg_lru.a_gate.w�a_param�6PLACEHOLDER://blocks.13.recurrent_block.rg_lru.a_param�input_gate��b�;PLACEHOLDER://blocks.13.recurrent_block.rg_lru.input_gate.b�w�;PLACEHOLDER://blocks.13.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.13.temporal_pre_norm.scale�blocks.14��attention_block��proj_final��bias�7PLACEHOLDER://blocks.14.attention_block.proj_final.bias�kernel�9PLACEHOLDER://blocks.14.attention_block.proj_final.kernel�proj_k��kernel�5PLACEHOLDER://blocks.14.attention_block.proj_k.kernel�proj_q��kernel�5PLACEHOLDER://blocks.14.attention_block.proj_q.kernel�proj_v��kernel�5PLACEHOLDER://blocks.14.attention_block.proj_v.kernel�channel_pre_norm��scale�.PLACEHOLDER://blocks.14.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.14.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.14.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.14.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.14.mlp_block.ffw_up.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.14.temporal_pre_norm.scale�blocks.15��channel_pre_norm��scale�.PLACEHOLDER://blocks.15.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.15.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.15.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.15.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.15.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�1PLACEHOLDER://blocks.15.recurrent_block.conv_1d.b�w�1PLACEHOLDER://blocks.15.recurrent_block.conv_1d.w�linear_out��bias�7PLACEHOLDER://blocks.15.recurrent_block.linear_out.bias�kernel�9PLACEHOLDER://blocks.15.recurrent_block.linear_out.kernel�linear_x��bias�5PLACEHOLDER://blocks.15.recurrent_block.linear_x.bias�kernel�7PLACEHOLDER://blocks.15.recurrent_block.linear_x.kernel�linear_y��bias�5PLACEHOLDER://blocks.15.recurrent_block.linear_y.bias�kernel�7PLACEHOLDER://blocks.15.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�7PLACEHOLDER://blocks.15.recurrent_block.rg_lru.a_gate.b�w�7PLACEHOLDER://blocks.15.recurrent_block.rg_lru.a_gate.w�a_param�6PLACEHOLDER://blocks.15.recurrent_block.rg_lru.a_param�input_gate��b�;PLACEHOLDER://blocks.15.recurrent_block.rg_lru.input_gate.b�w�;PLACEHOLDER://blocks.15.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.15.temporal_pre_norm.scale�blocks.16��channel_pre_norm��scale�.PLACEHOLDER://blocks.16.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.16.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.16.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.16.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.16.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�1PLACEHOLDER://blocks.16.recurrent_block.conv_1d.b�w�1PLACEHOLDER://blocks.16.recurrent_block.conv_1d.w�linear_out��bias�7PLACEHOLDER://blocks.16.recurrent_block.linear_out.bias�kernel�9PLACEHOLDER://blocks.16.recurrent_block.linear_out.kernel�linear_x��bias�5PLACEHOLDER://blocks.16.recurrent_block.linear_x.bias�kernel�7PLACEHOLDER://blocks.16.recurrent_block.linear_x.kernel�linear_y��bias�5PLACEHOLDER://blocks.16.recurrent_block.linear_y.bias�kernel�7PLACEHOLDER://blocks.16.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�7PLACEHOLDER://blocks.16.recurrent_block.rg_lru.a_gate.b�w�7PLACEHOLDER://blocks.16.recurrent_block.rg_lru.a_gate.w�a_param�6PLACEHOLDER://blocks.16.recurrent_block.rg_lru.a_param�input_gate��b�;PLACEHOLDER://blocks.16.recurrent_block.rg_lru.input_gate.b�w�;PLACEHOLDER://blocks.16.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.16.temporal_pre_norm.scale�blocks.17��attention_block��proj_final��bias�7PLACEHOLDER://blocks.17.attention_block.proj_final.bias�kernel�9PLACEHOLDER://blocks.17.attention_block.proj_final.kernel�proj_k��kernel�5PLACEHOLDER://blocks.17.attention_block.proj_k.kernel�proj_q��kernel�5PLACEHOLDER://blocks.17.attention_block.proj_q.kernel�proj_v��kernel�5PLACEHOLDER://blocks.17.attention_block.proj_v.kernel�channel_pre_norm��scale�.PLACEHOLDER://blocks.17.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.17.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.17.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.17.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.17.mlp_block.ffw_up.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.17.temporal_pre_norm.scale�blocks.18��channel_pre_norm��scale�.PLACEHOLDER://blocks.18.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.18.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.18.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.18.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.18.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�1PLACEHOLDER://blocks.18.recurrent_block.conv_1d.b�w�1PLACEHOLDER://blocks.18.recurrent_block.conv_1d.w�linear_out��bias�7PLACEHOLDER://blocks.18.recurrent_block.linear_out.bias�kernel�9PLACEHOLDER://blocks.18.recurrent_block.linear_out.kernel�linear_x��bias�5PLACEHOLDER://blocks.18.recurrent_block.linear_x.bias�kernel�7PLACEHOLDER://blocks.18.recurrent_block.linear_x.kernel�linear_y��bias�5PLACEHOLDER://blocks.18.recurrent_block.linear_y.bias�kernel�7PLACEHOLDER://blocks.18.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�7PLACEHOLDER://blocks.18.recurrent_block.rg_lru.a_gate.b�w�7PLACEHOLDER://blocks.18.recurrent_block.rg_lru.a_gate.w�a_param�6PLACEHOLDER://blocks.18.recurrent_block.rg_lru.a_param�input_gate��b�;PLACEHOLDER://blocks.18.recurrent_block.rg_lru.input_gate.b�w�;PLACEHOLDER://blocks.18.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.18.temporal_pre_norm.scale�blocks.19��channel_pre_norm��scale�.PLACEHOLDER://blocks.19.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.19.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.19.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.19.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.19.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�1PLACEHOLDER://blocks.19.recurrent_block.conv_1d.b�w�1PLACEHOLDER://blocks.19.recurrent_block.conv_1d.w�linear_out��bias�7PLACEHOLDER://blocks.19.recurrent_block.linear_out.bias�kernel�9PLACEHOLDER://blocks.19.recurrent_block.linear_out.kernel�linear_x��bias�5PLACEHOLDER://blocks.19.recurrent_block.linear_x.bias�kernel�7PLACEHOLDER://blocks.19.recurrent_block.linear_x.kernel�linear_y��bias�5PLACEHOLDER://blocks.19.recurrent_block.linear_y.bias�kernel�7PLACEHOLDER://blocks.19.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�7PLACEHOLDER://blocks.19.recurrent_block.rg_lru.a_gate.b�w�7PLACEHOLDER://blocks.19.recurrent_block.rg_lru.a_gate.w�a_param�6PLACEHOLDER://blocks.19.recurrent_block.rg_lru.a_param�input_gate��b�;PLACEHOLDER://blocks.19.recurrent_block.rg_lru.input_gate.b�w�;PLACEHOLDER://blocks.19.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.19.temporal_pre_norm.scale�blocks.2��attention_block��proj_final��bias�6PLACEHOLDER://blocks.2.attention_block.proj_final.bias�kernel�8PLACEHOLDER://blocks.2.attention_block.proj_final.kernel�proj_k��kernel�4PLACEHOLDER://blocks.2.attention_block.proj_k.kernel�proj_q��kernel�4PLACEHOLDER://blocks.2.attention_block.proj_q.kernel�proj_v��kernel�4PLACEHOLDER://blocks.2.attention_block.proj_v.kernel�channel_pre_norm��scale�-PLACEHOLDER://blocks.2.channel_pre_norm.scale�mlp_block��ffw_down��bias�.PLACEHOLDER://blocks.2.mlp_block.ffw_down.bias�kernel�0PLACEHOLDER://blocks.2.mlp_block.ffw_down.kernel�ffw_up��b�)PLACEHOLDER://blocks.2.mlp_block.ffw_up.b�w�)PLACEHOLDER://blocks.2.mlp_block.ffw_up.w�temporal_pre_norm��scale�.PLACEHOLDER://blocks.2.temporal_pre_norm.scale�blocks.20��attention_block��proj_final��bias�7PLACEHOLDER://blocks.20.attention_block.proj_final.bias�kernel�9PLACEHOLDER://blocks.20.attention_block.proj_final.kernel�proj_k��kernel�5PLACEHOLDER://blocks.20.attention_block.proj_k.kernel�proj_q��kernel�5PLACEHOLDER://blocks.20.attention_block.proj_q.kernel�proj_v��kernel�5PLACEHOLDER://blocks.20.attention_block.proj_v.kernel�channel_pre_norm��scale�.PLACEHOLDER://blocks.20.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.20.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.20.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.20.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.20.mlp_block.ffw_up.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.20.temporal_pre_norm.scale�blocks.21��channel_pre_norm��scale�.PLACEHOLDER://blocks.21.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.21.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.21.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.21.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.21.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�1PLACEHOLDER://blocks.21.recurrent_block.conv_1d.b�w�1PLACEHOLDER://blocks.21.recurrent_block.conv_1d.w�linear_out��bias�7PLACEHOLDER://blocks.21.recurrent_block.linear_out.bias�kernel�9PLACEHOLDER://blocks.21.recurrent_block.linear_out.kernel�linear_x��bias�5PLACEHOLDER://blocks.21.recurrent_block.linear_x.bias�kernel�7PLACEHOLDER://blocks.21.recurrent_block.linear_x.kernel�linear_y��bias�5PLACEHOLDER://blocks.21.recurrent_block.linear_y.bias�kernel�7PLACEHOLDER://blocks.21.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�7PLACEHOLDER://blocks.21.recurrent_block.rg_lru.a_gate.b�w�7PLACEHOLDER://blocks.21.recurrent_block.rg_lru.a_gate.w�a_param�6PLACEHOLDER://blocks.21.recurrent_block.rg_lru.a_param�input_gate��b�;PLACEHOLDER://blocks.21.recurrent_block.rg_lru.input_gate.b�w�;PLACEHOLDER://blocks.21.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.21.temporal_pre_norm.scale�blocks.22��channel_pre_norm��scale�.PLACEHOLDER://blocks.22.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.22.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.22.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.22.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.22.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�1PLACEHOLDER://blocks.22.recurrent_block.conv_1d.b�w�1PLACEHOLDER://blocks.22.recurrent_block.conv_1d.w�linear_out��bias�7PLACEHOLDER://blocks.22.recurrent_block.linear_out.bias�kernel�9PLACEHOLDER://blocks.22.recurrent_block.linear_out.kernel�linear_x��bias�5PLACEHOLDER://blocks.22.recurrent_block.linear_x.bias�kernel�7PLACEHOLDER://blocks.22.recurrent_block.linear_x.kernel�linear_y��bias�5PLACEHOLDER://blocks.22.recurrent_block.linear_y.bias�kernel�7PLACEHOLDER://blocks.22.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�7PLACEHOLDER://blocks.22.recurrent_block.rg_lru.a_gate.b�w�7PLACEHOLDER://blocks.22.recurrent_block.rg_lru.a_gate.w�a_param�6PLACEHOLDER://blocks.22.recurrent_block.rg_lru.a_param�input_gate��b�;PLACEHOLDER://blocks.22.recurrent_block.rg_lru.input_gate.b�w�;PLACEHOLDER://blocks.22.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.22.temporal_pre_norm.scale�blocks.23��attention_block��proj_final��bias�7PLACEHOLDER://blocks.23.attention_block.proj_final.bias�kernel�9PLACEHOLDER://blocks.23.attention_block.proj_final.kernel�proj_k��kernel�5PLACEHOLDER://blocks.23.attention_block.proj_k.kernel�proj_q��kernel�5PLACEHOLDER://blocks.23.attention_block.proj_q.kernel�proj_v��kernel�5PLACEHOLDER://blocks.23.attention_block.proj_v.kernel�channel_pre_norm��scale�.PLACEHOLDER://blocks.23.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.23.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.23.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.23.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.23.mlp_block.ffw_up.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.23.temporal_pre_norm.scale�blocks.24��channel_pre_norm��scale�.PLACEHOLDER://blocks.24.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.24.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.24.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.24.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.24.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�1PLACEHOLDER://blocks.24.recurrent_block.conv_1d.b�w�1PLACEHOLDER://blocks.24.recurrent_block.conv_1d.w�linear_out��bias�7PLACEHOLDER://blocks.24.recurrent_block.linear_out.bias�kernel�9PLACEHOLDER://blocks.24.recurrent_block.linear_out.kernel�linear_x��bias�5PLACEHOLDER://blocks.24.recurrent_block.linear_x.bias�kernel�7PLACEHOLDER://blocks.24.recurrent_block.linear_x.kernel�linear_y��bias�5PLACEHOLDER://blocks.24.recurrent_block.linear_y.bias�kernel�7PLACEHOLDER://blocks.24.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�7PLACEHOLDER://blocks.24.recurrent_block.rg_lru.a_gate.b�w�7PLACEHOLDER://blocks.24.recurrent_block.rg_lru.a_gate.w�a_param�6PLACEHOLDER://blocks.24.recurrent_block.rg_lru.a_param�input_gate��b�;PLACEHOLDER://blocks.24.recurrent_block.rg_lru.input_gate.b�w�;PLACEHOLDER://blocks.24.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.24.temporal_pre_norm.scale�blocks.25��channel_pre_norm��scale�.PLACEHOLDER://blocks.25.channel_pre_norm.scale�mlp_block��ffw_down��bias�/PLACEHOLDER://blocks.25.mlp_block.ffw_down.bias�kernel�1PLACEHOLDER://blocks.25.mlp_block.ffw_down.kernel�ffw_up��b�*PLACEHOLDER://blocks.25.mlp_block.ffw_up.b�w�*PLACEHOLDER://blocks.25.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�1PLACEHOLDER://blocks.25.recurrent_block.conv_1d.b�w�1PLACEHOLDER://blocks.25.recurrent_block.conv_1d.w�linear_out��bias�7PLACEHOLDER://blocks.25.recurrent_block.linear_out.bias�kernel�9PLACEHOLDER://blocks.25.recurrent_block.linear_out.kernel�linear_x��bias�5PLACEHOLDER://blocks.25.recurrent_block.linear_x.bias�kernel�7PLACEHOLDER://blocks.25.recurrent_block.linear_x.kernel�linear_y��bias�5PLACEHOLDER://blocks.25.recurrent_block.linear_y.bias�kernel�7PLACEHOLDER://blocks.25.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�7PLACEHOLDER://blocks.25.recurrent_block.rg_lru.a_gate.b�w�7PLACEHOLDER://blocks.25.recurrent_block.rg_lru.a_gate.w�a_param�6PLACEHOLDER://blocks.25.recurrent_block.rg_lru.a_param�input_gate��b�;PLACEHOLDER://blocks.25.recurrent_block.rg_lru.input_gate.b�w�;PLACEHOLDER://blocks.25.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�/PLACEHOLDER://blocks.25.temporal_pre_norm.scale�blocks.3��channel_pre_norm��scale�-PLACEHOLDER://blocks.3.channel_pre_norm.scale�mlp_block��ffw_down��bias�.PLACEHOLDER://blocks.3.mlp_block.ffw_down.bias�kernel�0PLACEHOLDER://blocks.3.mlp_block.ffw_down.kernel�ffw_up��b�)PLACEHOLDER://blocks.3.mlp_block.ffw_up.b�w�)PLACEHOLDER://blocks.3.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�0PLACEHOLDER://blocks.3.recurrent_block.conv_1d.b�w�0PLACEHOLDER://blocks.3.recurrent_block.conv_1d.w�linear_out��bias�6PLACEHOLDER://blocks.3.recurrent_block.linear_out.bias�kernel�8PLACEHOLDER://blocks.3.recurrent_block.linear_out.kernel�linear_x��bias�4PLACEHOLDER://blocks.3.recurrent_block.linear_x.bias�kernel�6PLACEHOLDER://blocks.3.recurrent_block.linear_x.kernel�linear_y��bias�4PLACEHOLDER://blocks.3.recurrent_block.linear_y.bias�kernel�6PLACEHOLDER://blocks.3.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�6PLACEHOLDER://blocks.3.recurrent_block.rg_lru.a_gate.b�w�6PLACEHOLDER://blocks.3.recurrent_block.rg_lru.a_gate.w�a_param�5PLACEHOLDER://blocks.3.recurrent_block.rg_lru.a_param�input_gate��b�:PLACEHOLDER://blocks.3.recurrent_block.rg_lru.input_gate.b�w�:PLACEHOLDER://blocks.3.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�.PLACEHOLDER://blocks.3.temporal_pre_norm.scale�blocks.4��channel_pre_norm��scale�-PLACEHOLDER://blocks.4.channel_pre_norm.scale�mlp_block��ffw_down��bias�.PLACEHOLDER://blocks.4.mlp_block.ffw_down.bias�kernel�0PLACEHOLDER://blocks.4.mlp_block.ffw_down.kernel�ffw_up��b�)PLACEHOLDER://blocks.4.mlp_block.ffw_up.b�w�)PLACEHOLDER://blocks.4.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�0PLACEHOLDER://blocks.4.recurrent_block.conv_1d.b�w�0PLACEHOLDER://blocks.4.recurrent_block.conv_1d.w�linear_out��bias�6PLACEHOLDER://blocks.4.recurrent_block.linear_out.bias�kernel�8PLACEHOLDER://blocks.4.recurrent_block.linear_out.kernel�linear_x��bias�4PLACEHOLDER://blocks.4.recurrent_block.linear_x.bias�kernel�6PLACEHOLDER://blocks.4.recurrent_block.linear_x.kernel�linear_y��bias�4PLACEHOLDER://blocks.4.recurrent_block.linear_y.bias�kernel�6PLACEHOLDER://blocks.4.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�6PLACEHOLDER://blocks.4.recurrent_block.rg_lru.a_gate.b�w�6PLACEHOLDER://blocks.4.recurrent_block.rg_lru.a_gate.w�a_param�5PLACEHOLDER://blocks.4.recurrent_block.rg_lru.a_param�input_gate��b�:PLACEHOLDER://blocks.4.recurrent_block.rg_lru.input_gate.b�w�:PLACEHOLDER://blocks.4.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�.PLACEHOLDER://blocks.4.temporal_pre_norm.scale�blocks.5��attention_block��proj_final��bias�6PLACEHOLDER://blocks.5.attention_block.proj_final.bias�kernel�8PLACEHOLDER://blocks.5.attention_block.proj_final.kernel�proj_k��kernel�4PLACEHOLDER://blocks.5.attention_block.proj_k.kernel�proj_q��kernel�4PLACEHOLDER://blocks.5.attention_block.proj_q.kernel�proj_v��kernel�4PLACEHOLDER://blocks.5.attention_block.proj_v.kernel�channel_pre_norm��scale�-PLACEHOLDER://blocks.5.channel_pre_norm.scale�mlp_block��ffw_down��bias�.PLACEHOLDER://blocks.5.mlp_block.ffw_down.bias�kernel�0PLACEHOLDER://blocks.5.mlp_block.ffw_down.kernel�ffw_up��b�)PLACEHOLDER://blocks.5.mlp_block.ffw_up.b�w�)PLACEHOLDER://blocks.5.mlp_block.ffw_up.w�temporal_pre_norm��scale�.PLACEHOLDER://blocks.5.temporal_pre_norm.scale�blocks.6��channel_pre_norm��scale�-PLACEHOLDER://blocks.6.channel_pre_norm.scale�mlp_block��ffw_down��bias�.PLACEHOLDER://blocks.6.mlp_block.ffw_down.bias�kernel�0PLACEHOLDER://blocks.6.mlp_block.ffw_down.kernel�ffw_up��b�)PLACEHOLDER://blocks.6.mlp_block.ffw_up.b�w�)PLACEHOLDER://blocks.6.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�0PLACEHOLDER://blocks.6.recurrent_block.conv_1d.b�w�0PLACEHOLDER://blocks.6.recurrent_block.conv_1d.w�linear_out��bias�6PLACEHOLDER://blocks.6.recurrent_block.linear_out.bias�kernel�8PLACEHOLDER://blocks.6.recurrent_block.linear_out.kernel�linear_x��bias�4PLACEHOLDER://blocks.6.recurrent_block.linear_x.bias�kernel�6PLACEHOLDER://blocks.6.recurrent_block.linear_x.kernel�linear_y��bias�4PLACEHOLDER://blocks.6.recurrent_block.linear_y.bias�kernel�6PLACEHOLDER://blocks.6.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�6PLACEHOLDER://blocks.6.recurrent_block.rg_lru.a_gate.b�w�6PLACEHOLDER://blocks.6.recurrent_block.rg_lru.a_gate.w�a_param�5PLACEHOLDER://blocks.6.recurrent_block.rg_lru.a_param�input_gate��b�:PLACEHOLDER://blocks.6.recurrent_block.rg_lru.input_gate.b�w�:PLACEHOLDER://blocks.6.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�.PLACEHOLDER://blocks.6.temporal_pre_norm.scale�blocks.7��channel_pre_norm��scale�-PLACEHOLDER://blocks.7.channel_pre_norm.scale�mlp_block��ffw_down��bias�.PLACEHOLDER://blocks.7.mlp_block.ffw_down.bias�kernel�0PLACEHOLDER://blocks.7.mlp_block.ffw_down.kernel�ffw_up��b�)PLACEHOLDER://blocks.7.mlp_block.ffw_up.b�w�)PLACEHOLDER://blocks.7.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�0PLACEHOLDER://blocks.7.recurrent_block.conv_1d.b�w�0PLACEHOLDER://blocks.7.recurrent_block.conv_1d.w�linear_out��bias�6PLACEHOLDER://blocks.7.recurrent_block.linear_out.bias�kernel�8PLACEHOLDER://blocks.7.recurrent_block.linear_out.kernel�linear_x��bias�4PLACEHOLDER://blocks.7.recurrent_block.linear_x.bias�kernel�6PLACEHOLDER://blocks.7.recurrent_block.linear_x.kernel�linear_y��bias�4PLACEHOLDER://blocks.7.recurrent_block.linear_y.bias�kernel�6PLACEHOLDER://blocks.7.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�6PLACEHOLDER://blocks.7.recurrent_block.rg_lru.a_gate.b�w�6PLACEHOLDER://blocks.7.recurrent_block.rg_lru.a_gate.w�a_param�5PLACEHOLDER://blocks.7.recurrent_block.rg_lru.a_param�input_gate��b�:PLACEHOLDER://blocks.7.recurrent_block.rg_lru.input_gate.b�w�:PLACEHOLDER://blocks.7.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�.PLACEHOLDER://blocks.7.temporal_pre_norm.scale�blocks.8��attention_block��proj_final��bias�6PLACEHOLDER://blocks.8.attention_block.proj_final.bias�kernel�8PLACEHOLDER://blocks.8.attention_block.proj_final.kernel�proj_k��kernel�4PLACEHOLDER://blocks.8.attention_block.proj_k.kernel�proj_q��kernel�4PLACEHOLDER://blocks.8.attention_block.proj_q.kernel�proj_v��kernel�4PLACEHOLDER://blocks.8.attention_block.proj_v.kernel�channel_pre_norm��scale�-PLACEHOLDER://blocks.8.channel_pre_norm.scale�mlp_block��ffw_down��bias�.PLACEHOLDER://blocks.8.mlp_block.ffw_down.bias�kernel�0PLACEHOLDER://blocks.8.mlp_block.ffw_down.kernel�ffw_up��b�)PLACEHOLDER://blocks.8.mlp_block.ffw_up.b�w�)PLACEHOLDER://blocks.8.mlp_block.ffw_up.w�temporal_pre_norm��scale�.PLACEHOLDER://blocks.8.temporal_pre_norm.scale�blocks.9��channel_pre_norm��scale�-PLACEHOLDER://blocks.9.channel_pre_norm.scale�mlp_block��ffw_down��bias�.PLACEHOLDER://blocks.9.mlp_block.ffw_down.bias�kernel�0PLACEHOLDER://blocks.9.mlp_block.ffw_down.kernel�ffw_up��b�)PLACEHOLDER://blocks.9.mlp_block.ffw_up.b�w�)PLACEHOLDER://blocks.9.mlp_block.ffw_up.w�recurrent_block��conv_1d��b�0PLACEHOLDER://blocks.9.recurrent_block.conv_1d.b�w�0PLACEHOLDER://blocks.9.recurrent_block.conv_1d.w�linear_out��bias�6PLACEHOLDER://blocks.9.recurrent_block.linear_out.bias�kernel�8PLACEHOLDER://blocks.9.recurrent_block.linear_out.kernel�linear_x��bias�4PLACEHOLDER://blocks.9.recurrent_block.linear_x.bias�kernel�6PLACEHOLDER://blocks.9.recurrent_block.linear_x.kernel�linear_y��bias�4PLACEHOLDER://blocks.9.recurrent_block.linear_y.bias�kernel�6PLACEHOLDER://blocks.9.recurrent_block.linear_y.kernel�rg_lru��a_gate��b�6PLACEHOLDER://blocks.9.recurrent_block.rg_lru.a_gate.b�w�6PLACEHOLDER://blocks.9.recurrent_block.rg_lru.a_gate.w�a_param�5PLACEHOLDER://blocks.9.recurrent_block.rg_lru.a_param�input_gate��b�:PLACEHOLDER://blocks.9.recurrent_block.rg_lru.input_gate.b�w�:PLACEHOLDER://blocks.9.recurrent_block.rg_lru.input_gate.w�temporal_pre_norm��scale�.PLACEHOLDER://blocks.9.temporal_pre_norm.scale�embedder��input_embedding�&PLACEHOLDER://embedder.input_embedding�final_norm��scale�PLACEHOLDER://final_norm.scale