flake.nix : add rocm support and cleanup (#2808)
author Tungsten842 <redacted>
Sat, 26 Aug 2023 18:19:44 +0000 (20:19 +0200)
committer GitHub <redacted>
Sat, 26 Aug 2023 18:19:44 +0000 (21:19 +0300)
flake.lock
flake.nix

diff --git a/flake.lock b/flake.lock
index 33164e09679533041f6d3a3a94f9ddd057727f9f..a7777d05d5c0cd0d6e41ab048a9046aa446a044e 100644
--- a/flake.lock
+++ b/flake.lock
@@ -5,11 +5,11 @@
         "systems": "systems"
       },
       "locked": {
-        "lastModified": 1685518550,
-        "narHash": "sha256-o2d0KcvaXzTrPRIo0kOLV0/QXHhDQ5DTi+OxcjO8xqY=",
+        "lastModified": 1692799911,
+        "narHash": "sha256-3eihraek4qL744EvQXsK1Ha6C3CR7nnT8X2qWap4RNk=",
         "owner": "numtide",
         "repo": "flake-utils",
-        "rev": "a1720a10a6cfe8234c0e93907ffe81be440f4cef",
+        "rev": "f9e7cf818399d17d347f847525c5a5a8032e4e44",
         "type": "github"
       },
       "original": {
@@ -20,11 +20,11 @@
    },
     "nixpkgs": {
       "locked": {
-        "lastModified": 1685931219,
-        "narHash": "sha256-8EWeOZ6LKQfgAjB/USffUSELPRjw88A+xTcXnOUvO5M=",
+        "lastModified": 1692913444,
+        "narHash": "sha256-1SvMQm2DwofNxXVtNWWtIcTh7GctEVrS/Xel/mdc6iY=",
         "owner": "NixOS",
         "repo": "nixpkgs",
-        "rev": "7409480d5c8584a1a83c422530419efe4afb0d19",
+        "rev": "18324978d632ffc55ef1d928e81630c620f4f447",
         "type": "github"
       },
       "original": {
diff --git a/flake.nix b/flake.nix
index d454cedc3714a3ff7929cb6315c7c093ad40ea8d..02095411e026a5a85fa96595eeb6428f3ba1adec 100644
--- a/flake.nix
+++ b/flake.nix
@@ -6,6 +6,9 @@
   outputs = { self, nixpkgs, flake-utils }:
     flake-utils.lib.eachDefaultSystem (system:
       let
+        name = "llama.cpp";
+        src = ./.;
+        meta.mainProgram = "llama";
         inherit (pkgs.stdenv) isAarch32 isAarch64 isDarwin;
         buildInputs = with pkgs; [ openmpi ];
         osSpecific = with pkgs; buildInputs ++
@@ -31,7 +34,7 @@
             with pkgs; [ openblas ]
         );
         pkgs = import nixpkgs { inherit system; };
-        nativeBuildInputs = with pkgs; [ cmake pkgconfig ];
+        nativeBuildInputs = with pkgs; [ cmake ninja pkgconfig ];
         llama-python =
           pkgs.python3.withPackages (ps: with ps; [ numpy sentencepiece ]);
         postPatch = ''
           mv $out/bin/server $out/bin/llama-server
         '';
         cmakeFlags = [ "-DLLAMA_BUILD_SERVER=ON" "-DLLAMA_MPI=ON" "-DBUILD_SHARED_LIBS=ON" "-DCMAKE_SKIP_BUILD_RPATH=ON" ];
-      in {
+      in
+      {
         packages.default = pkgs.stdenv.mkDerivation {
-          name = "llama.cpp";
-          src = ./.;
-          postPatch = postPatch;
-          nativeBuildInputs = nativeBuildInputs;
-          buildInputs = osSpecific;
+          inherit name src meta postPatch nativeBuildInputs buildInputs postInstall;
           cmakeFlags = cmakeFlags
             ++ (if isAarch64 && isDarwin then [
-              "-DCMAKE_C_FLAGS=-D__ARM_FEATURE_DOTPROD=1"
-              "-DLLAMA_METAL=ON"
-            ] else [
-              "-DLLAMA_BLAS=ON"
-              "-DLLAMA_BLAS_VENDOR=OpenBLAS"
+            "-DCMAKE_C_FLAGS=-D__ARM_FEATURE_DOTPROD=1"
+            "-DLLAMA_METAL=ON"
+          ] else [
+            "-DLLAMA_BLAS=ON"
+            "-DLLAMA_BLAS_VENDOR=OpenBLAS"
           ]);
-          postInstall = postInstall;
-          meta.mainProgram = "llama";
         };
         packages.opencl = pkgs.stdenv.mkDerivation {
-          name = "llama.cpp";
-          src = ./.;
-          postPatch = postPatch;
-          nativeBuildInputs = nativeBuildInputs;
+          inherit name src meta postPatch nativeBuildInputs postInstall;
           buildInputs = with pkgs; buildInputs ++ [ clblast ];
           cmakeFlags = cmakeFlags ++ [
             "-DLLAMA_CLBLAST=ON"
           ];
-          postInstall = postInstall;
-          meta.mainProgram = "llama";
+        };
+        packages.rocm = pkgs.stdenv.mkDerivation {
+          inherit name src meta postPatch nativeBuildInputs postInstall;
+          buildInputs = with pkgs; buildInputs ++ [ hip hipblas rocblas ];
+          cmakeFlags = cmakeFlags ++ [
+            "-DLLAMA_HIPBLAS=1"
+            "-DCMAKE_C_COMPILER=hipcc"
+            "-DCMAKE_CXX_COMPILER=hipcc"
+            "-DCMAKE_POSITION_INDEPENDENT_CODE=ON"
+          ];
         };
         apps.llama-server = {
           type = "app";