runtime error
Space failed. Exit code: 1. Reason: mpl return forward_call(*args, **kwargs) File "/home/user/.cache/huggingface/modules/transformers_modules/OpenAssistant/falcon-7b-sft-top1-696/9f95b9e269c1d99c29f70be8d5ef3d0fb1bd1c30/modelling_RW.py", line 648, in forward outputs = block( File "/opt/conda/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl return forward_call(*args, **kwargs) File "/home/user/.cache/huggingface/modules/transformers_modules/OpenAssistant/falcon-7b-sft-top1-696/9f95b9e269c1d99c29f70be8d5ef3d0fb1bd1c30/modelling_RW.py", line 381, in forward layernorm_output = self.input_layernorm(hidden_states) File "/opt/conda/lib/python3.9/site-packages/torch/nn/modules/module.py", line 1501, in _call_impl return forward_call(*args, **kwargs) File "/opt/conda/lib/python3.9/site-packages/torch/nn/modules/normalization.py", line 190, in forward return F.layer_norm( File "/opt/conda/lib/python3.9/site-packages/torch/nn/functional.py", line 2515, in layer_norm return torch.layer_norm(input, normalized_shape, weight, bias, eps, torch.backends.cudnn.enabled) RuntimeError: "LayerNormKernelImpl" not implemented for 'Half' [2m2023-10-22T08:40:47.202144Z[0m [31mERROR[0m [1mwarmup[0m[1m{[0m[3mmax_input_length[0m[2m=[0m1024 [3mmax_prefill_tokens[0m[2m=[0m4096 [3mmax_total_tokens[0m[2m=[0m2048[1m}[0m[2m:[0m[1mwarmup[0m[2m:[0m [2mtext_generation_client[0m[2m:[0m [2mrouter/client/src/lib.rs[0m[2m:[0m[2m33:[0m Server error: "LayerNormKernelImpl" not implemented for 'Half' Error: Warmup(Generation("\"LayerNormKernelImpl\" not implemented for 'Half'")) [2m2023-10-22T08:40:47.248685Z[0m [31mERROR[0m [2mtext_generation_launcher[0m[2m:[0m Webserver Crashed [2m2023-10-22T08:40:47.248756Z[0m [32m INFO[0m [2mtext_generation_launcher[0m[2m:[0m Shutting down shards [2m2023-10-22T08:40:47.994827Z[0m [32m INFO[0m [1mshard-manager[0m: [2mtext_generation_launcher[0m[2m:[0m Shard terminated [2m[3mrank[0m[2m=[0m0[0m Error: WebserverFailed
Container logs:
Fetching error logs...