flake.nix 4.3 KB
Newer Older
1
2
{
  inputs = {
3
4
5
6
    # crate2nix provides the appliedCargoNix tool used in `outputs`; its nixpkgs
    # is redirected to the one pinned by tgi-nix.
    crate2nix.url = "github:nix-community/crate2nix";
    crate2nix.inputs.nixpkgs.follows = "tgi-nix/nixpkgs";
7
    nix-filter.url = "github:numtide/nix-filter";
8
9
10
    # tgi-nix is the source of the nixpkgs pin: this flake's own `nixpkgs` input
    # follows it, and `outputs` also uses its nixpkgs config and overlay.
    tgi-nix.url = "github:danieldk/tgi-nix";
    nixpkgs.follows = "tgi-nix/nixpkgs";
    flake-utils.url = "github:numtide/flake-utils";
11
12
13
14
    # rust-overlay is applied as a nixpkgs overlay in `outputs`; its nixpkgs is
    # redirected to the one pinned by tgi-nix.
    rust-overlay.url = "github:oxalica/rust-overlay";
    rust-overlay.inputs.nixpkgs.follows = "tgi-nix/nixpkgs";
15
16
17
18
  };
  outputs =
    {
      self,
19
      crate2nix,
20
      nix-filter,
21
22
      nixpkgs,
      flake-utils,
23
      rust-overlay,
24
25
26
27
28
      tgi-nix,
    }:
    flake-utils.lib.eachDefaultSystem (
      system:
      let
29
30
31
        # Cargo.nix for the workspace rooted at this flake, produced by
        # crate2nix's appliedCargoNix; `--all-features` is passed through to the
        # generator.
        cargoNix = crate2nix.tools.${system}.appliedCargoNix {
          name = "tgi";
          src = ./.;
          additionalCargoNixArgs = [ "--all-features" ];
        };
34
        # nixpkgs instantiated for this system with tgi-nix's config, extended
        # by the rust-overlay and tgi-nix overlays (applied in that order).
        pkgs = import nixpkgs {
          inherit system;
          inherit (tgi-nix.lib) config;
          overlays = [
            rust-overlay.overlays.default
            tgi-nix.overlays.default
          ];
        };
42
        # Crate overrides defined in ./nix/crate-overrides.nix; passed to every
        # workspace member build below.
        crateOverrides = import ./nix/crate-overrides.nix { inherit pkgs nix-filter; };
43
44
45
        # text-generation-benchmark workspace member, built from the generated
        # Cargo.nix with this flake's crate overrides.
        benchmark = cargoNix.workspaceMembers.text-generation-benchmark.build.override {
          inherit crateOverrides;
        };
46
47
48
        # text-generation-launcher workspace member, built from the generated
        # Cargo.nix with this flake's crate overrides.
        launcher = cargoNix.workspaceMembers.text-generation-launcher.build.override {
          inherit crateOverrides;
        };
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
        # Wrapper script named `text-generation-router` that runs the v3 router
        # binary with PYTHONPATH set to the Python packages listed below.
        router =
          let
            # The router binary itself, built with this flake's crate overrides.
            routerUnwrapped = cargoNix.workspaceMembers.text-generation-router-v3.build.override {
              inherit crateOverrides;
            };
            # Search path made of the listed Python packages.
            packagePath =
              with pkgs.python3.pkgs;
              makePythonPath [
                protobuf
                sentencepiece
                torch
                transformers
              ];
          in
          pkgs.writeShellApplication {
            name = "text-generation-router";
            # `exec` replaces the wrapper shell with the router, so the process
            # started under this name *is* the router: signals sent to that PID
            # reach the router directly instead of terminating an intermediate
            # bash and leaving the router running.
            text = ''
              export PYTHONPATH="${packagePath}"
              exec ${routerUnwrapped}/bin/text-generation-router "$@"
            '';
          };
69
        # Server package from ./nix/server.nix, instantiated through the
        # Python 3 package set's callPackage.
        server = pkgs.python3.pkgs.callPackage ./nix/server.nix { inherit nix-filter; };
70
71
      in
      {
Nicolas Patry's avatar
Nicolas Patry committed
72
        formatter = pkgs.nixfmt-rfc-style;
73
74
75
76
77
        devShells = with pkgs; rec {
          default = pure;

          # Shell that contains only the Nix-built benchmark, launcher, router
          # and server.
          pure = mkShell {
            buildInputs = [
              benchmark
              launcher
              router
              server
            ];
          };
Nicolas Patry's avatar
Nicolas Patry committed
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
          # Shell with the Nix-built server, cargo/rustfmt/clippy with the
          # OpenSSL headers and pkg-config, and Python test/lint packages.
          test = mkShell {
            buildInputs =
              [
                # NOTE(review): the Nix-built Rust binaries are disabled here,
                # presumably so they are built with cargo inside the shell —
                # confirm before re-enabling or deleting these entries.
                # benchmark
                # launcher
                # router
                server
                openssl.dev
                pkg-config
                cargo
                rustfmt
                clippy
              ]
              ++ (with python3.pkgs; [
                docker
                pytest
                pytest-asyncio
                syrupy
                pre-commit
                ruff
              ]);

          };
107
108

          # Shell for working on the checkout directly: a rust-overlay stable
          # toolchain, native build dependencies, and a Python virtualenv managed
          # by venvShellHook into which the server and the Python client are
          # installed in editable mode.
          impure = mkShell {
            buildInputs =
              [
                openssl.dev
                pkg-config
                # Latest stable toolchain from rust-overlay, with the extra
                # components listed below.
                (rust-bin.stable.latest.default.override {
                  extensions = [
                    "rust-analyzer"
                    "rust-src"
                  ];
                })
                protobuf
              ]
              ++ (with python3.pkgs; [
                venvShellHook
                docker
                pip
                ipdb
                click
                pyright
                pytest
                pytest-asyncio
                ruff
                syrupy
              ]);

            # Pull in the build inputs of the Nix server package as well.
            inputsFrom = [ server ];

            venvDir = "./.venv";

            # NOTE(review): SOURCE_DATE_EPOCH is presumably unset so that pip
            # does not trip over the timestamp Nix sets when building wheels —
            # confirm.
            postVenvCreation = ''
              unset SOURCE_DATE_EPOCH
              ( cd server ; python -m pip install --no-dependencies -e . )
              ( cd clients/python ; python -m pip install --no-dependencies -e . )
            '';
            # Quoted and spelled with $HOME so the value does not depend on
            # tilde expansion inside an `export` argument.
            postShellHook = ''
              unset SOURCE_DATE_EPOCH
              export PATH="$PATH:$HOME/.cargo/bin"
            '';
          };
148
        };
149
150
151
152
153
154
155
156
157
158
159

        # Default package: a `text-generation-inference` script that runs the
        # launcher with the server and router available as runtime inputs.
        packages.default = pkgs.writeShellApplication {
          name = "text-generation-inference";
          runtimeInputs = [
            server
            router
          ];
          # `exec` hands the process over to the launcher, so no wrapper bash
          # stays around as its parent and signals reach the launcher directly.
          text = ''
            exec ${launcher}/bin/text-generation-launcher "$@"
          '';
        };
160
161
162
      }
    );
}