# Launch `vllm serve` for the LGAI-EXAONE/EXAONE-4.0-1.2B model.
#
# Flags passed (one per line below, same order as the original one-liner):
#   --trust-remote-code   passed as a bare switch; per the vLLM CLI docs this
#                         permits custom code shipped with the model repo to
#                         run, so only use it with a repo you trust.
#   --dtype bfloat16      requested dtype value.
#   -tp 1                 vLLM's short spelling of --tensor-parallel-size
#                         (per the vLLM CLI docs); value 1.
#   --max-model-len 32768 maximum model length value handed to vLLM.
#   --port 8010           port number handed to vLLM.
vllm serve LGAI-EXAONE/EXAONE-4.0-1.2B \
  --trust-remote-code \
  --dtype bfloat16 \
  -tp 1 \
  --max-model-len 32768 \
  --port 8010