custom llama

This commit is contained in:
Daniel Bulant 2026-04-18 18:01:27 +02:00
parent d414ea45dd
commit 51f7519c3b
No known key found for this signature in database
3 changed files with 35 additions and 1 deletions

View file

@ -122,6 +122,11 @@
url = "http://sonarr.eisen.danbulant.cloud";
icon = "si:sonarr";
}
# Link entry for Prowlarr: display title, target URL and icon identifier.
# NOTE(review): this uses plain http, like the Sonarr entry before it, while
# the Vaultwarden entry after it uses https — confirm that is intended.
{
title = "Prowlarr";
url = "http://prowlarr.eisen.danbulant.cloud";
icon = "si:prowlarr";
}
{
title = "Vaultwarden";
url = "https://vaultwarden.danbulant.cloud";

View file

@ -70,6 +70,31 @@
environment.systemPackages = with pkgs; [
  nvitop
  basalt-monado
  cudaPackages.cuda_nvcc
  # llama.cpp with a hand-picked CMake configuration (CUDA backend only).
  #
  # `.override { cudaSupport = true; }` is applied first so that the package's
  # own CUDA build inputs are present even when `config.cudaSupport` is not
  # enabled globally; forcing GGML_CUDA through cmakeFlags alone does not add
  # them. If CUDA support is already enabled globally this is a no-op.
  ((llama-cpp.override { cudaSupport = true; }).overrideAttrs (prevAttrs: {
    # This list REPLACES the package's cmakeFlags; nothing from
    # prevAttrs.cmakeFlags is carried over.
    cmakeFlags = with lib; [
      # GGML_NATIVE asks ggml to tune for the CPU of the build machine, so the
      # result is tied to this host and is not reproducible elsewhere.
      # NOTE(review): the nixpkgs cc-wrapper may strip `-march=native` unless
      # NIX_ENFORCE_NO_NATIVE is disabled — confirm this flag has an effect.
      (cmakeBool "GGML_NATIVE" true)
      (cmakeBool "LLAMA_BUILD_EXAMPLES" false)
      (cmakeBool "LLAMA_BUILD_SERVER" true)
      (cmakeBool "LLAMA_BUILD_TESTS" false)
      (cmakeBool "LLAMA_OPENSSL" true)
      (cmakeBool "BUILD_SHARED_LIBS" true)
      (cmakeBool "GGML_BLAS" false)
      (cmakeBool "GGML_LTO" true)
      # NOTE(review): the CLBlast backend appears to have been removed
      # upstream, so this flag is probably ignored — confirm and drop it.
      (cmakeBool "GGML_CLBLAST" true)
      (cmakeBool "GGML_CUDA" true)
      (cmakeBool "GGML_CUDA_GRAPHS" true)
      (cmakeBool "GGML_CUDA_F16" true)
      (cmakeBool "GGML_CUDA_FA_ALL_QUANTS" true)
      (cmakeBool "GGML_HIP" false)
      (cmakeBool "GGML_METAL" false)
      (cmakeBool "GGML_RPC" false)
      (cmakeBool "GGML_VULKAN" false)
      # Take the build number from the package version instead of a literal,
      # so it keeps matching the sources after a nixpkgs update.
      (cmakeFeature "LLAMA_BUILD_NUMBER" prevAttrs.version)
      # Passed straight to CMake: build CUDA code for architecture 120 only.
      (cmakeFeature "CMAKE_CUDA_ARCHITECTURES" "120")
    ];
  }))
];
hardware.nvidia = {
open = true;

View file

@ -390,7 +390,11 @@ in
# url = "https://raw.githubusercontent.com/MrOtherGuy/fx-autoconfig/master/program/config.js";
# sha256 = "1mx679fbc4d9x4bnqajqx5a95y1lfasvf90pbqkh9sm3ch945p40";
# })
(builtins.readFile ./uc.js)
# (builtins.toFile (builtins.readFile ./uc.js))
# Add ./uc.js to the Nix store under the file name "config.js" and use the
# resulting store path as this list element.
(builtins.path { name = "config.js"; path = ./uc.js; })
];
};
fish = {