# _toctree.yml
# "Getting started" group. Each entry under `sections` pairs a `local` page
# identifier with the `title` displayed for it; the group's own `title`
# follows its entries.
# NOTE(review): `local` presumably names a docs source file without its
# extension — confirm against the docs tooling that consumes this file.
- sections:
  - local: index
    title: Text Generation Inference
  - local: quicktour
    title: Quick Tour
  - local: installation
    title: Installation
  - local: supported_models
    title: Supported Models and Hardware
  - local: messages_api
    title: Messages API
  title: Getting started
# "Tutorials" group. Every `local` here lives under the `basic_tutorials/`
# prefix; each is paired with the `title` displayed for that page.
# NOTE(review): `local` presumably names a docs source file without its
# extension — confirm against the docs tooling that consumes this file.
- sections:
  - local: basic_tutorials/consuming_tgi
    title: Consuming TGI
  - local: basic_tutorials/preparing_model
    title: Preparing Model for Serving
  - local: basic_tutorials/gated_model_access
    title: Serving Private & Gated Models
  - local: basic_tutorials/using_cli
    title: Using TGI CLI
  - local: basic_tutorials/launcher
    title: All TGI CLI options
  - local: basic_tutorials/non_core_models
    title: Non-core Model Serving
  title: Tutorials
Omar Sanseviero's avatar
Omar Sanseviero committed
27
28
29
# "Conceptual Guides" group. Every `local` here lives under the `conceptual/`
# prefix; each is paired with the `title` displayed for that page.
# NOTE(review): `local` presumably names a docs source file without its
# extension — confirm against the docs tooling that consumes this file.
- sections:
  - local: conceptual/streaming
    title: Streaming
  - local: conceptual/quantization
    title: Quantization
  - local: conceptual/tensor_parallelism
    title: Tensor Parallelism
  - local: conceptual/paged_attention
    title: PagedAttention
  - local: conceptual/safetensors
    title: Safetensors
  - local: conceptual/flash_attention
    title: Flash Attention
  title: Conceptual Guides