convert_weight.sh 590 Bytes
Newer Older
luopl's avatar
luopl committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
#!/usr/bin/env bash
#
# Two-stage checkpoint conversion driver.
#   Stage 1: run convert_weight.py on the fp4/fp8 checkpoint, writing bf16.
#   Stage 2: run convert.py on the stage-1 output, passing the expert count
#            and the model-parallel degree.
# Both Python scripts are referenced by bare relative name, so this must be
# launched from the directory that contains them.

# Abort on the first failing command, unset variable, or failed pipeline stage,
# so stage 2 never runs against an incomplete stage-1 output.
set -euo pipefail

# ---------------------------------------------------------------------------
# Stage 1: fp4/fp8 -> bf16
# ---------------------------------------------------------------------------
readonly INPUT_FP8_HF_PATH="deepseek-ai/DeepSeek-V4-Flash"
readonly OUTPUT_BF16_HF_PATH="deepseek-ai/DeepSeek-V4-Flash-bf16"

stage1_args=(
  --input-fp8-hf-path "${INPUT_FP8_HF_PATH}"
  --output-bf16-hf-path "${OUTPUT_BF16_HF_PATH}"
)
python3 convert_weight.py "${stage1_args[@]}"

# ---------------------------------------------------------------------------
# Stage 2: bf16 -> bf16-mp16
# ---------------------------------------------------------------------------
# NOTE(review): SAVE_PATH ends in "mp16" while MP is 8 -- confirm that the
# directory name and the model-parallel degree are meant to differ.
readonly MP=8
# Stage 2 consumes exactly what stage 1 produced.
readonly HF_CKPT_BF16_PATH="${OUTPUT_BF16_HF_PATH}"
readonly SAVE_PATH="deepseek-ai/DeepSeek-V4-Flash-bf16-mp16"
readonly EXPERTS=256

stage2_args=(
  --hf-ckpt-path "${HF_CKPT_BF16_PATH}"
  --save-path "${SAVE_PATH}"
  --n-experts "${EXPERTS}"
  --model-parallel "${MP}"
)
python3 convert.py "${stage2_args[@]}"