# flake.nix
# Flake exposing one output per default system: `devShells.default`, a
# development shell with a Rust toolchain, a set of Python packages, and the
# packages built from ./router.nix and ./_launcher.nix.
{
  inputs = {
    tgi-nix.url = "github:danieldk/tgi-nix";
    # Use the same nixpkgs revision that tgi-nix pins.
    nixpkgs.follows = "tgi-nix/nixpkgs";
    flake-utils.url = "github:numtide/flake-utils";
    poetry2nix.url = "github:nix-community/poetry2nix";
    rust-overlay = {
      url = "github:oxalica/rust-overlay";
      # Keep rust-overlay on the tgi-nix nixpkgs as well.
      inputs.nixpkgs.follows = "tgi-nix/nixpkgs";
    };
  };
  outputs =
    {
      self,
      nixpkgs,
      flake-utils,
      rust-overlay,
      tgi-nix,
      poetry2nix,
    }:
    flake-utils.lib.eachDefaultSystem (
      system:
      let
        # nixpkgs configuration: allow unfree packages and enable CUDA support.
        config = {
          allowUnfree = true;
          cudaSupport = true;
        };
        # Package set with the rust-overlay and tgi-nix overlays applied.
        pkgs = import nixpkgs {
          inherit config system;
          overlays = [
            rust-overlay.overlays.default
            tgi-nix.overlay
          ];
        };

        inherit (poetry2nix.lib.mkPoetry2Nix { inherit pkgs; }) mkPoetryEditablePackage;
        # Editable install of the Python project under ./server.
        # `editablePackageSources` must be an attribute set mapping a package
        # name to its source directory, and poetry2nix needs `projectDir` (or
        # `pyproject`) to locate pyproject.toml.
        # NOTE(review): assumes ./server/pyproject.toml exists and that the
        # key below is an acceptable package name -- TODO confirm.
        # NOTE(review): this binding is not referenced by any output in this
        # file, so it is never evaluated; add it to the shell if it is wanted.
        text-generation-server = mkPoetryEditablePackage {
          projectDir = ./server;
          editablePackageSources = {
            text-generation-server = ./server;
          };
        };
      in
      {
        devShells.default =
          with pkgs;
          mkShell {
            buildInputs =
              [
                openssl.dev
                pkg-config
                # Latest stable Rust toolchain plus rust-analyzer and the
                # standard library sources.
                (rust-bin.stable.latest.default.override {
                  extensions = [
                    "rust-analyzer"
                    "rust-src"
                  ];
                })
              ]
              ++ (with python3.pkgs; [
                venvShellHook
                pip

                click
                einops
                fbgemm-gpu
                flashinfer
                flash-attn
                flash-attn-layer-norm
                flash-attn-rotary
                grpc-interceptor
                grpcio-reflection
                grpcio-status
                grpcio-tools
                hf-transfer
                loguru
                marlin-kernels
                opentelemetry-api
                opentelemetry-exporter-otlp
                opentelemetry-instrumentation-grpc
                opentelemetry-semantic-conventions
                peft
                tokenizers
                torch
                transformers
                vllm

                # Packages defined next to this flake.
                (callPackage ./router.nix {
                  inherit (rustPlatform) buildRustPackage importCargoLock;
                })
                (callPackage ./_launcher.nix {
                  inherit (rustPlatform) buildRustPackage importCargoLock;
                })
              ]);

            # Virtualenv location for venvShellHook.
            venvDir = "./.venv";

            # SOURCE_DATE_EPOCH is unset both after the venv is created and on
            # every shell entry.
            postVenv = ''
              unset SOURCE_DATE_EPOCH
            '';
            postShellHook = ''
              unset SOURCE_DATE_EPOCH
            '';
          };
      }
    );
}