# Start a vLLM server for the fdtn-ai/Foundation-Sec-8B-Reasoning model.
#
# Options passed, one per line below:
#   --trust-remote-code    passed through to vLLM as-is
#   --dtype bfloat16       dtype requested for the model
#   -tp 1                  presumably tensor-parallel size 1 (confirm in vLLM CLI docs)
#   --max-model-len 32768  maximum model length requested
#   --port 8010            port given to the server
vllm serve fdtn-ai/Foundation-Sec-8B-Reasoning \
  --trust-remote-code \
  --dtype bfloat16 \
  -tp 1 \
  --max-model-len 32768 \
  --port 8010