llama.cpp/flake.nix

# Nix flake for llama.cpp.
#
# For every default system (via flake-utils) it exposes:
#   packages.default  - the CMake build; `main` and `server` are installed as
#                       `llama` and `llama-server`, plus a `convert.py` that
#                       runs under a Python environment with numpy and
#                       sentencepiece
#   apps.*            - `nix run` entry points (llama, llama-server,
#                       llama-embedding; default = llama)
#   devShells.default - cmake, the same Python environment and the
#                       platform-specific frameworks
{
  inputs = {
    nixpkgs.url = "github:NixOS/nixpkgs/nixos-unstable";
    flake-utils.url = "github:numtide/flake-utils";
  };
  outputs = { self, nixpkgs, flake-utils }:
    flake-utils.lib.eachDefaultSystem (system:
      let
        pkgs = import nixpkgs {
          inherit system;
        };
        inherit (pkgs.stdenv) isAarch64 isDarwin;
        inherit (pkgs.lib) optionals optionalString;

        # aarch64 + Darwin; this is the only configuration that gets the
        # Metal flags, frameworks and source patch below.
        isM1 = isAarch64 && isDarwin;

        # Frameworks needed at build time (and in the dev shell) per platform.
        osSpecific =
          if isM1 then with pkgs.darwin.apple_sdk_11_0.frameworks; [ Accelerate MetalKit MetalPerformanceShaders MetalPerformanceShadersGraph ]
          else if isDarwin then with pkgs.darwin.apple_sdk.frameworks; [ Accelerate CoreGraphics CoreVideo ]
          else [ ];

        # Interpreter used for convert.py and offered in the dev shell.
        llama-python = pkgs.python310.withPackages (ps: with ps; [
          numpy
          sentencepiece
        ]);

        # Install location of the Metal shader source. `$out` is left for the
        # shell to expand inside the build phases. The same value is patched
        # into ggml-metal.m (postPatch) and populated in installPhase, so the
        # path baked into the binary always names a file that exists.
        metalShader = "$out/bin/ggml-metal.metal";

        # Build a flake "app" that runs one binary of the default package.
        mkApp = binary: {
          type = "app";
          program = "${self.packages.${system}.default}/bin/${binary}";
        };
      in
      {
        packages.default = pkgs.stdenv.mkDerivation {
          name = "llama.cpp";
          src = ./.;

          # Replace the bundle resource lookup with the absolute store path
          # of the installed shader (Apple Silicon only).
          postPatch = optionalString isM1 ''
            substituteInPlace ./ggml-metal.m \
              --replace '[bundle pathForResource:@"ggml-metal" ofType:@"metal"];' "@\"${metalShader}\";"
          '';

          nativeBuildInputs = with pkgs; [ cmake ];
          buildInputs = osSpecific;
          cmakeFlags = [ "-DLLAMA_BUILD_SERVER=ON" ] ++ (optionals isM1 [
            "-DCMAKE_C_FLAGS=-D__ARM_FEATURE_DOTPROD=1"
            "-DLLAMA_METAL=ON"
          ]);

          installPhase = ''
            runHook preInstall

            mkdir -p $out/bin
            mv bin/* $out/bin/
            mv $out/bin/main $out/bin/llama
            mv $out/bin/server $out/bin/llama-server

            # Wrap convert.py with a shebang pointing at the pinned Python.
            echo "#!${llama-python}/bin/python" > $out/bin/convert.py
            cat ${./convert.py} >> $out/bin/convert.py
            chmod +x $out/bin/convert.py
          '' + optionalString isM1 ''
            # The Metal build is expected to leave the shader in bin/ (moved
            # above); if it did not, install it from the source tree so the
            # path patched into ggml-metal.m is never dangling.
            if [ ! -e "${metalShader}" ]; then
              install -m644 ${./ggml-metal.metal} "${metalShader}"
            fi
          '' + ''
            runHook postInstall
          '';

          meta.mainProgram = "llama";
        };

        apps.llama-server = mkApp "llama-server";
        apps.llama-embedding = mkApp "embedding";
        apps.llama = mkApp "llama";
        apps.default = self.apps.${system}.llama;

        devShells.default = pkgs.mkShell {
          packages = with pkgs; [
            cmake
            llama-python
          ] ++ osSpecific;
        };
      }
    );
}
Nix flake (#40) * Nix flake * Nix: only add Accelerate framework on macOS * Nix: development shell, direnv and compatibility * Nix: use python packages supplied by withPackages * Nix: remove channel compatibility * Nix: fix ARM neon dotproduct on macOS --------- Co-authored-by: Pavol Rusnak <pavol@rusnak.io> 2023-03-17 22:03:48 +00:00			`{`
			`inputs = {`
			`nixpkgs.url = "github:NixOS/nixpkgs/nixos-unstable";`
			`flake-utils.url = "github:numtide/flake-utils";`
			`};`
			`outputs = { self, nixpkgs, flake-utils }:`
			`flake-utils.lib.eachDefaultSystem (system:`
			`let`
flake : update to support metal on m1/m2 (#1724) 2023-06-07 04:15:31 +00:00			`inherit (pkgs.stdenv) isAarch64 isDarwin;`
			`inherit (pkgs.lib) optionals;`
			`isM1 = isAarch64 && isDarwin;`
			`osSpecific =`
			`if isM1 then with pkgs.darwin.apple_sdk_11_0.frameworks; [ Accelerate MetalKit MetalPerformanceShaders MetalPerformanceShadersGraph ]`
			`else if isDarwin then with pkgs.darwin.apple_sdk.frameworks; [ Accelerate CoreGraphics CoreVideo ]`
			`else [ ];`
Nix flake (#40) * Nix flake * Nix: only add Accelerate framework on macOS * Nix: development shell, direnv and compatibility * Nix: use python packages supplied by withPackages * Nix: remove channel compatibility * Nix: fix ARM neon dotproduct on macOS --------- Co-authored-by: Pavol Rusnak <pavol@rusnak.io> 2023-03-17 22:03:48 +00:00			`pkgs = import nixpkgs {`
			`inherit system;`
			`};`
			`llama-python = pkgs.python310.withPackages (ps: with ps; [`
			`numpy`
			`sentencepiece`
			`]);`
			`in`
			`{`
			`packages.default = pkgs.stdenv.mkDerivation {`
			`name = "llama.cpp";`
			`src = ./.;`
flake : update to support metal on m1/m2 (#1724) 2023-06-07 04:15:31 +00:00			`postPatch =`
			`if isM1 then ''`
			`substituteInPlace ./ggml-metal.m \`
metal : fix issue with ggml-metal.metal path. Closes #1769 (#1782) * Fix issue with ggml-metal.metal path * Add ggml-metal.metal as a resource for llama target * Update flake.nix metal kernel substitution 2023-06-10 14:47:34 +00:00			`--replace '[bundle pathForResource:@"ggml-metal" ofType:@"metal"];' "@\"$out/ggml-metal.metal\";"`
flake : update to support metal on m1/m2 (#1724) 2023-06-07 04:15:31 +00:00			`'' else "";`
Nix flake (#40) * Nix flake * Nix: only add Accelerate framework on macOS * Nix: development shell, direnv and compatibility * Nix: use python packages supplied by withPackages * Nix: remove channel compatibility * Nix: fix ARM neon dotproduct on macOS --------- Co-authored-by: Pavol Rusnak <pavol@rusnak.io> 2023-03-17 22:03:48 +00:00			`nativeBuildInputs = with pkgs; [ cmake ];`
flake : update to support metal on m1/m2 (#1724) 2023-06-07 04:15:31 +00:00			`buildInputs = osSpecific;`
			`cmakeFlags = [ "-DLLAMA_BUILD_SERVER=ON" ] ++ (optionals isM1 [`
Nix flake (#40) * Nix flake * Nix: only add Accelerate framework on macOS * Nix: development shell, direnv and compatibility * Nix: use python packages supplied by withPackages * Nix: remove channel compatibility * Nix: fix ARM neon dotproduct on macOS --------- Co-authored-by: Pavol Rusnak <pavol@rusnak.io> 2023-03-17 22:03:48 +00:00			`"-DCMAKE_C_FLAGS=-D__ARM_FEATURE_DOTPROD=1"`
flake : update to support metal on m1/m2 (#1724) 2023-06-07 04:15:31 +00:00			`"-DLLAMA_METAL=ON"`
			`]);`
Nix flake (#40) * Nix flake * Nix: only add Accelerate framework on macOS * Nix: development shell, direnv and compatibility * Nix: use python packages supplied by withPackages * Nix: remove channel compatibility * Nix: fix ARM neon dotproduct on macOS --------- Co-authored-by: Pavol Rusnak <pavol@rusnak.io> 2023-03-17 22:03:48 +00:00			`installPhase = ''`
			`mkdir -p $out/bin`
flake.nix: add all binaries from bin (#848) 2023-04-13 13:49:05 +00:00			`mv bin/* $out/bin/`
			`mv $out/bin/main $out/bin/llama`
flake : update to support metal on m1/m2 (#1724) 2023-06-07 04:15:31 +00:00			`mv $out/bin/server $out/bin/llama-server`
Add new binaries to flake.nix (#847) 2023-04-08 10:04:23 +00:00
nix: use convert.py instead of legacy wrapper convert-pth-to-ggml.py (#981) 2023-04-25 21:19:57 +00:00			`echo "#!${llama-python}/bin/python" > $out/bin/convert.py`
			`cat ${./convert.py} >> $out/bin/convert.py`
			`chmod +x $out/bin/convert.py`
Nix flake (#40) * Nix flake * Nix: only add Accelerate framework on macOS * Nix: development shell, direnv and compatibility * Nix: use python packages supplied by withPackages * Nix: remove channel compatibility * Nix: fix ARM neon dotproduct on macOS --------- Co-authored-by: Pavol Rusnak <pavol@rusnak.io> 2023-03-17 22:03:48 +00:00			`'';`
Nix flake: set meta.mainProgram to llama 2023-03-20 21:44:30 +00:00			`meta.mainProgram = "llama";`
Nix flake (#40) * Nix flake * Nix: only add Accelerate framework on macOS * Nix: development shell, direnv and compatibility * Nix: use python packages supplied by withPackages * Nix: remove channel compatibility * Nix: fix ARM neon dotproduct on macOS --------- Co-authored-by: Pavol Rusnak <pavol@rusnak.io> 2023-03-17 22:03:48 +00:00			`};`
exposed modules so that they can be invoked by nix run github:ggerganov/llama.cpp#server etc (#1863) 2023-06-17 12:13:05 +00:00			`apps.llama-server = {`
			`type = "app";`
			`program = "${self.packages.${system}.default}/bin/llama-server";`
			`};`
			`apps.llama-embedding = {`
			`type = "app";`
			`program = "${self.packages.${system}.default}/bin/embedding";`
			`};`
			`apps.llama = {`
			`type = "app";`
			`program = "${self.packages.${system}.default}/bin/llama";`
			`};`
			`apps.default = self.apps.${system}.llama;`
Nix flake (#40) * Nix flake * Nix: only add Accelerate framework on macOS * Nix: development shell, direnv and compatibility * Nix: use python packages supplied by withPackages * Nix: remove channel compatibility * Nix: fix ARM neon dotproduct on macOS --------- Co-authored-by: Pavol Rusnak <pavol@rusnak.io> 2023-03-17 22:03:48 +00:00			`devShells.default = pkgs.mkShell {`
			`packages = with pkgs; [`
			`cmake`
			`llama-python`
flake : update to support metal on m1/m2 (#1724) 2023-06-07 04:15:31 +00:00			`] ++ osSpecific;`
Nix flake (#40) * Nix flake * Nix: only add Accelerate framework on macOS * Nix: development shell, direnv and compatibility * Nix: use python packages supplied by withPackages * Nix: remove channel compatibility * Nix: fix ARM neon dotproduct on macOS --------- Co-authored-by: Pavol Rusnak <pavol@rusnak.io> 2023-03-17 22:03:48 +00:00			`};`
			`}`
			`);`
			`}`