fix: it builds now

wip: llama-cpp with hexagon
renamed: llama-cpp-hexagon -> llama-cpp
2026-04-21 23:10:14 +01:00 · 2026-04-21 17:38:09 +01:00 · 2026-04-20 20:37:53 +01:00 · 2026-04-20 20:37:29 +01:00
3 changed files with 229 additions and 90 deletions
@@ -1,90 +0,0 @@
-{
-  lib,
-  pkgs,
-  stdenvNoCC,
-  stdenv,
-  p7zip,
-  curl,
-  jq,
-  cacert,
-}:
-# Packages the prebuilt Hexagon SDK tarball: copies it to $out/opt and patchelf-fixes three binaries.
-let
-  version = "v6.4.0.2";
-  src = fetchTarball {
-    url = "https://github.com/snapdragon-toolchain/hexagon-sdk/releases/download/v6.4.0.2/hexagon-sdk-v6.4.0.2-amd64-lnx.tar.xz";
-    sha256 = "0qadmn84sdqbqh3s837s0amdmln3akb1b01k8x5nha0lkw6a3jwc";
-  };
-  gmp_override = pkgs.gmp.overrideAttrs (
-    final: prev: {
-      postInstall =
-        (prev.postInstall or "")
-        + "
-				ls
-				cd $out
-				cd lib
-				ls
-			rm libgmp.so.10
-			cp libgmp.so.10.5.0 libgmp.so.10
-			cp libgmp.so.10.5.0 $out/libgmp.so.10
-			";
-    }
-  );
-  libs = [
-    pkgs.stdenv.cc.cc.lib
-    pkgs.libc
-    pkgs.libcxx
-    pkgs.gmp
-    pkgs.libz
-    pkgs.libgccjit
-    # pkgs.zlib
-    # pkgs.ncurses
-  ];
-  # NOTE(review): gmp_override above is not referenced anywhere in this file; libs uses plain pkgs.gmp.
-  # Let nixpkgs assemble the library search path from libs so it need not be built by hand.
-  libPath = pkgs.lib.makeLibraryPath libs;
-in
-stdenv.mkDerivation rec {
-  pname = "hexagon-sdk";
-  inherit version src;
-
-  # dontUnpack = true;
-  # dontBuild = true;
-
-  nativeBuildInputs = [
-  ];
-  buildInputs = [ pkgs.patchelf ];
-  runtimeDependencies = with pkgs; [ gmpxx ];
-  # Nothing is compiled: buildPhase only runs its pre/post hooks.
-  buildPhase = ''
-    runHook preBuild
-    						# cp $out/opt/tools/HEXAGON_Tools/19.0.04/Tools/lib/libLW.so.3 $out/opt/tools/HEXAGON_Tools/19.0.04/Tools/bin/
-    runHook postBuild
-  '';
-  # Copy the SDK to $out/opt, then make qaic, hexagon-clang and hexagon-link writable and patch their interpreter/RPATH.
-  installPhase = ''
-                    runHook preInstall
-                    mkdir $out
-                    cp -r ${src} $out/opt
-                    runHook postInstall
-
-                    chmod +w $out/opt/ipc/fastrpc/qaic/bin/qaic
-                		chmod +w $out/opt/tools/HEXAGON_Tools/19.0.04/Tools/bin/hexagon-clang
-                		chmod +w $out/opt/tools/HEXAGON_Tools/19.0.04/Tools/bin/hexagon-link
-                    patchelf $out/opt/ipc/fastrpc/qaic/bin/qaic --set-interpreter ${pkgs.stdenv.cc.bintools.dynamicLinker} --set-rpath ${libPath}
-                    patchelf $out/opt/tools/HEXAGON_Tools/19.0.04/Tools/bin/hexagon-clang --set-interpreter ${pkgs.stdenv.cc.bintools.dynamicLinker} --set-rpath ${libPath}
-        						lib=${libPath}
-        						lib=$lib:$out/opt/tools/HEXAGON_Tools/19.0.04/Tools/lib
-    								echo $lib
-                    patchelf $out/opt/tools/HEXAGON_Tools/19.0.04/Tools/bin/hexagon-link --set-interpreter ${pkgs.stdenv.cc.bintools.dynamicLinker} --set-rpath $lib
-  '';
-  # NOTE(review): in installPhase, runHook postInstall fires before the chmod/patchelf steps; confirm that is intended.
-  meta = {
-    description = "Hexagon SDK for working with the Qualcomm NPU/DSP";
-    homepage = "https://github.com/snapdragon-toolchain/hexagon-sdk";
-    license = lib.licenses.unfree;
-    platforms = [
-      "x86_64-linux"
-    ];
-  };
-}
@@ -0,0 +1,6 @@
+{ llama-cpp }:
+# llama-cpp variant with the Hexagon backend switched on and BLAS switched off.
+llama-cpp.override {
+  blasSupport = false;
+  hexagonSupport = true;
+}
@@ -0,0 +1,223 @@
+{
+  lib,
+  pkgs,
+  autoAddDriverRunpath,
+  cmake,
+  fetchFromGitHub,
+  nix-update-script,
+  stdenv,
+  # Backend toggles; the CUDA and ROCm defaults follow the nixpkgs config.
+  config,
+  cudaSupport ? config.cudaSupport,
+  cudaPackages ? { },
+
+  rocmSupport ? config.rocmSupport,
+  rocmPackages ? { },
+  rocmGpuTargets ? rocmPackages.clr.localGpuTargets or rocmPackages.clr.gpuTargets,
+
+  openclSupport ? false,
+  clblast,
+  # BLAS defaults to on only when no accelerator backend (Hexagon included) is selected.
+  blasSupport ? builtins.all (x: !x) [
+    cudaSupport
+    hexagonSupport
+    metalSupport
+    openclSupport
+    rocmSupport
+    vulkanSupport
+  ],
+  blas,
+  pkg-config,
+  metalSupport ? stdenv.hostPlatform.isDarwin && stdenv.hostPlatform.isAarch64 && !openclSupport,
+  vulkanSupport ? false,
+  rpcSupport ? false,
+  hexagonSupport ? false,
+  curl,
+  llama-cpp,
+  shaderc,
+  vulkan-headers,
+  hexagon-sdk,
+  vulkan-loader,
+  ninja,
+}:
+
+let
+  # Hexagon needs an x86_64 build environment (the builder is x86_64), so cross-compile to
+  # aarch64 from there. NOTE(review): this re-import does not forward config or overlays.
+  buildPkgs = import pkgs.path { system = "x86_64-linux"; };
+  crossPkgs = buildPkgs.pkgsCross.aarch64-multiplatform;
+
+  # It's necessary to consistently use backendStdenv when building with CUDA support,
+  # otherwise we get libstdc++ errors downstream (cuda imposes an upper bound on gcc).
+  effectiveStdenv =
+    if hexagonSupport then crossPkgs.stdenv
+    else if cudaSupport then cudaPackages.backendStdenv
+    else stdenv;
+  inherit (lib)
+    cmakeBool
+    cmakeFeature
+    optionals
+    optionalString
+    ;
+
+  cudaBuildInputs = with cudaPackages; [
+    cuda_cccl # <nv/target>
+
+    # A temporary hack for reducing the closure size, remove once cudaPackages
+    # have stopped using lndir: https://github.com/NixOS/nixpkgs/issues/271792
+    cuda_cudart
+    libcublas
+  ];
+
+  rocmBuildInputs = with rocmPackages; [
+    clr
+    hipblas
+    rocblas
+  ];
+
+  vulkanBuildInputs = [
+    shaderc
+    vulkan-headers
+    vulkan-loader
+  ];
+
+  hexagonBuildInputs = [
+    hexagon-sdk
+  ];
+in
+effectiveStdenv.mkDerivation (finalAttrs: {
+  pname = "llama-cpp";
+  version = "8871";
+
+  src = fetchFromGitHub {
+    owner = "ggml-org";
+    repo = "llama.cpp";
+    tag = "b${finalAttrs.version}";
+    hash = "sha256-dSMomkkG3YFwXAcYTym6Z03u8ZAWFFio8jdQJPMJ/yg=";
+    # Keep .git only long enough to record the short commit hash in COMMIT, then delete it.
+    leaveDotGit = true;
+    postFetch = ''
+      git -C "$out" rev-parse --short HEAD > $out/COMMIT
+      find "$out" -name .git -print0 | xargs -0 rm -rf
+    '';
+  };
+  # Build-time tools only; link-time libraries such as blas go in buildInputs below.
+  nativeBuildInputs = [
+    cmake
+    pkgs.clang
+    ninja
+    pkg-config
+  ]
+  ++ optionals cudaSupport [
+    cudaPackages.cuda_nvcc
+    autoAddDriverRunpath
+  ];
+
+  buildInputs =
+    optionals cudaSupport cudaBuildInputs
+    ++ optionals openclSupport [ clblast ]
+    ++ optionals rocmSupport rocmBuildInputs
+    ++ optionals blasSupport [ blas ]
+    ++ optionals vulkanSupport vulkanBuildInputs
+    ++ optionals hexagonSupport hexagonBuildInputs
+    ++ [
+      curl
+    ];
+  # COMMIT is written by src.postFetch above; hand it to CMake as the build commit.
+  preConfigure = ''
+    prependToVar cmakeFlags "-DLLAMA_BUILD_COMMIT:STRING=$(cat COMMIT)"
+  '';
+
+  cmakeFlags = [
+    # -march=native is non-deterministic; override with platform-specific flags if needed
+    (cmakeBool "GGML_NATIVE" false)
+    (cmakeBool "LLAMA_BUILD_EXAMPLES" false)
+    (cmakeBool "LLAMA_BUILD_SERVER" true)
+    (cmakeBool "LLAMA_BUILD_TESTS" (finalAttrs.finalPackage.doCheck or false))
+    (cmakeBool "LLAMA_CURL" true)
+    (cmakeBool "BUILD_SHARED_LIBS" true)
+    (cmakeBool "GGML_BLAS" blasSupport)
+    (cmakeBool "GGML_CLBLAST" openclSupport)
+    (cmakeBool "GGML_CUDA" cudaSupport)
+    (cmakeBool "GGML_HIP" rocmSupport)
+    (cmakeBool "GGML_METAL" metalSupport)
+    (cmakeBool "GGML_RPC" rpcSupport)
+    (cmakeBool "GGML_VULKAN" vulkanSupport)
+    (cmakeBool "GGML_HEXAGON" hexagonSupport)
+    (cmakeFeature "LLAMA_BUILD_NUMBER" finalAttrs.version)
+  ]
+  ++ optionals cudaSupport [
+    (cmakeFeature "CMAKE_CUDA_ARCHITECTURES" cudaPackages.flags.cmakeCudaArchitecturesString)
+  ]
+  ++ optionals rocmSupport [
+    (cmakeFeature "CMAKE_HIP_COMPILER" "${rocmPackages.clr.hipClangPath}/clang++")
+    (cmakeFeature "CMAKE_HIP_ARCHITECTURES" (builtins.concatStringsSep ";" rocmGpuTargets))
+  ]
+  ++ optionals metalSupport [
+    (cmakeFeature "CMAKE_C_FLAGS" "-D__ARM_FEATURE_DOTPROD=1")
+    (cmakeBool "LLAMA_METAL_EMBED_LIBRARY" true)
+  ]
+  ++ optionals rpcSupport [
+    # This is done so we can move rpc-server out of bin because llama.cpp doesn't
+    # install rpc-server in their install target.
+    (cmakeBool "CMAKE_SKIP_BUILD_RPATH" true)
+  ]
+  ++ optionals hexagonSupport [
+    # (cmakeFeature "CMAKE_TOOLCHAIN_FILE" "${finalAttrs.src}/cmake/arm64-linux-clang.cmake")
+    (cmakeFeature "CMAKE_C_FLAGS" "-D__ARM_FEATURE_DOTPROD=1")
+    (cmakeFeature "CMAKE_CXX_FLAGS" "")
+    (cmakeBool "GGML_OPENMP" false)
+    (cmakeBool "GGML_LLAMAFILE" false)
+    (cmakeBool "GGML_OPENCL" false)
+    (cmakeFeature "PREBUILT_LIB_DIR" "linux_aarch64")
+    (cmakeFeature "GGML_HEXAGON_FP32_QUANTIZE_GROUP_SIZE" "128")
+    (cmakeFeature "HEXAGON_SDK_ROOT" "${hexagon-sdk}/opt")
+    (cmakeFeature "HEXAGON_TOOLS_ROOT" "${hexagon-sdk}/opt/tools/HEXAGON_Tools/19.0.04")
+    (cmakeBool "LLAMA_OPENSSL" false)
+  ];
+
+  # Upstream plans to add these targets at the CMake level; remove these
+  # additional steps once that has happened.
+  postInstall = ''
+    # Match previous binary name for this package
+    ln -sf $out/bin/llama-cli $out/bin/llama
+
+    mkdir -p $out/include
+    cp $src/include/llama.h $out/include/
+  ''
+  + optionalString rpcSupport "cp bin/rpc-server $out/bin/llama-rpc-server";
+
+  # the tests are failing as of 2025-08
+  doCheck = false;
+
+  passthru = {
+    tests = lib.optionalAttrs stdenv.hostPlatform.isDarwin {
+      metal = llama-cpp.override { metalSupport = true; };
+    };
+    updateScript = nix-update-script {
+      attrPath = "llama-cpp";
+      extraArgs = [
+        "--version-regex"
+        "b(.*)"
+      ];
+    };
+  };
+
+  meta = {
+    description = "Inference of Meta's LLaMA model (and others) in pure C/C++";
+    homepage = "https://github.com/ggml-org/llama.cpp";
+    license = lib.licenses.mit;
+    mainProgram = "llama";
+    maintainers = with lib.maintainers; [
+      booxter
+      dit7ya
+      philiptaron
+      xddxdd
+    ];
+    platforms = lib.platforms.unix;
+    badPlatforms = optionals (cudaSupport || openclSupport) lib.platforms.darwin;
+    broken =
+      (metalSupport && !effectiveStdenv.hostPlatform.isDarwin)
+      || (hexagonSupport && !effectiveStdenv.hostPlatform.isAarch64);
+  };
+})
Author	SHA1	Message	Date
doloro	0188aff399	fix: it builds now check / build (push) Failing after 15s Details check / build (pull_request) Failing after 14s Details	2026-04-21 23:10:14 +01:00
doloro	34974204db	wip: llama-cpp with hexagon	2026-04-21 17:38:09 +01:00
doloro	1228969d80	renamed: llama-cpp-hexagon -> llama-cpp check / build (push) Failing after 15s Details	2026-04-20 20:37:53 +01:00
doloro	d462837a55	added: llama-cpp	2026-04-20 20:37:29 +01:00