Commit 902cab8d authored by zhuwenwen
Browse files

update readme

parent 53f20a9d
......@@ -46,8 +46,8 @@ docker run -it --name llama --privileged --shm-size=32G --device=/dev/kfd --dev
```bash
git clone http://developer.hpccube.com/codes/modelzoo/bloom_fastertransformer.git
cd bloom_fastertransformer
mkdir -p astertransformer/build
cd astertransformer/build
mkdir -p fastertransformer/build
cd fastertransformer/build
git submodule init && git submodule update
cmake -DCMAKE_BUILD_TYPE=Release -DBUILD_MULTI_GPU=ON -DCMAKE_CXX_COMPILER=nvcc ..
export C_INCLUDE_PATH=$PWD/_deps/googletest-src/googletest/include${C_INCLUDE_PATH:+:${C_INCLUDE_PATH}}
......@@ -66,8 +66,8 @@ export LD_LIBRARY_PATH=$PWD/src/fastertransformer/utils/gemm_test/CMakeFiles/gpt
```bash
python ../examples/pytorch/gpt/utils/huggingface_bloom_convert.py \
--input-dir=/data/models/llama-7b-infer/ \
--output-dir=/data/models/llama-7b-hf/ \
--input-dir=/data/models/bloom-7b-infer/ \
--output-dir=/data/models/bloom-7b-hf/ \
-tp 1 --data-type fp16 -p 8 -v
```
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment