merge v0.4.1
Showing
examples/aqlm_example.py
0 → 100644
examples/fp8/README.md
0 → 100644
File moved
| cmake>=3.21 | cmake >= 3.21 | ||
| ninja # For faster builds. | ninja # For faster builds. | ||
| psutil | psutil | ||
| ray >= 2.9 | |||
| sentencepiece # Required for LLaMA tokenizer. | sentencepiece # Required for LLaMA tokenizer. | ||
| numpy | numpy | ||
| torch == 2.1.2 | |||
| requests | requests | ||
| psutil | |||
| py-cpuinfo | py-cpuinfo | ||
| transformers >= 4.39.1 # Required for StarCoder2 & Llava. | transformers >= 4.40.0 # Required for StarCoder2 & Llava, Llama 3. | ||
| xformers == 0.0.23.post1 # Required for CUDA 12.1. | tokenizers >= 0.19.1 # Required for Llama 3. | ||
| fastapi | fastapi | ||
| uvicorn[standard] | uvicorn[standard] | ||
| pydantic >= 2.0 # Required for OpenAI server. | pydantic >= 2.0 # Required for OpenAI server. | ||
| prometheus_client >= 0.18.0 | prometheus_client >= 0.18.0 | ||
| pynvml == 11.5.0 | tiktoken == 0.6.0 # Required for DBRX tokenizer | ||
| triton >= 2.1.0 | lm-format-enforcer == 0.9.8 | ||
| outlines == 0.0.34 | outlines == 0.0.34 # Requires torch >= 2.1.0 | ||
| tiktoken == 0.6.0 # Required for DBRX tokenizer | typing_extensions | ||
| filelock >= 3.10.4 # filelock starts to support `mode` argument from 3.10.4 |
requirements-cpu.txt
0 → 100644
requirements-cuda.txt
0 → 100644
Please register or sign in to comment