# Environment settings: GPU selection, CMake build flags, loopback proxy
# bypass, and an OpenAI-style API key/base URL pointing at localhost:1300.
#
# Each variable is exported explicitly. A line of bare `NAME=value` words with
# no command after it only sets unexported shell variables, so programs started
# afterwards would not see any of these values.
# NOTE(review): presumably this file is meant to be sourced (`. ./file`) before
# launching the tools that read these variables — confirm against its callers.

# NOTE(review): presumably limits CUDA programs to device 0 — confirm.
export CUDA_VISIBLE_DEVICES=0

# NOTE(review): looks like flags for a CMake-driven package build with cuBLAS
# enabled — confirm against the installer that consumes them.
export FORCE_CMAKE=1
export CMAKE_ARGS="-DLLAMA_CUBLAS=on"

# Hosts listed here are the loopback name and address.
export no_proxy=localhost,127.0.0.1

# API key and base URL; the base URL targets port 1300 on localhost.
export OPENAI_API_KEY=NOONEEED
export OPENAI_API_BASE=http://localhost:1300/v1