4a7c396766
Changelog: https://github.com/LostRuins/koboldcpp/releases/tag/v1.72 Diff: https://github.com/LostRuins/koboldcpp/compare/v1.71.1...v1.72
177 lines
4.7 KiB
Nix
177 lines
4.7 KiB
Nix
# koboldcpp: builds the koboldcpp shared libraries with the upstream Makefile
# and installs the `koboldcpp.py` launcher wrapped with its Python dependencies.
#
# Each `*Support` argument toggles one compute backend; it adds the matching
# build inputs and passes the corresponding `LLAMA_*=1` flag to `make`.
{
  lib,
  fetchFromGitHub,
  stdenv,
  makeWrapper,
  gitUpdater,
  python3Packages,
  python311Packages ? null, # Ignored. Kept for compatibility with the release
  tk,
  addDriverRunpath,

  darwin,

  # When false, the embedded KoboldAI Lite assets (`klite.embd`, `kcpp_docs.embd`)
  # are removed from the output.
  koboldLiteSupport ? true,

  config,
  cudaPackages ? { },

  openblasSupport ? !stdenv.isDarwin,
  openblas,

  cublasSupport ? config.cudaSupport,
  # You can find a full list here: https://arnon.dk/matching-sm-architectures-arch-and-gencode-for-various-nvidia-cards/
  # For example if you're on a GTX 1080 that means you're using "Pascal" and you need to pass "sm_60"
  # Only the first entry of this list is passed to the build (as CUDA_DOCKER_ARCH).
  cudaArches ? cudaPackages.cudaFlags.realArches or [ ],

  clblastSupport ? stdenv.isLinux,
  clblast,
  ocl-icd,

  vulkanSupport ? true,
  vulkan-loader,

  metalSupport ? stdenv.isDarwin && stdenv.isAarch64,
  # Deprecated: both emit an evaluation warning when set to a non-empty string.
  march ? "",
  mtune ? "",
}:

let
  # Render a Makefile toggle: "<option>=1" when enabled, the empty string otherwise.
  makeBool = option: bool: (if bool then "${option}=1" else "");

  # Extra makeWrapper arguments that expose the driver libraries to the program
  # at runtime. Keyed on `cublasSupport` (which defaults to `config.cudaSupport`)
  # so that enabling CUDA through an override alone still gets the driver path.
  libraryPathWrapperArgs = lib.optionalString cublasSupport ''
    --prefix LD_LIBRARY_PATH : "${lib.makeLibraryPath [ addDriverRunpath.driverLink ]}"
  '';

  # x86_64 Darwin uses the default Apple SDK frameworks; everything else uses
  # the 11.0 SDK set. Only referenced from Darwin/Metal-gated attributes below.
  darwinFrameworks =
    if (stdenv.isDarwin && stdenv.isx86_64) then
      darwin.apple_sdk.frameworks
    else
      darwin.apple_sdk_11_0.frameworks;

  # CUDA builds use the stdenv provided by cudaPackages.
  effectiveStdenv = if cublasSupport then cudaPackages.backendStdenv else stdenv;
in
effectiveStdenv.mkDerivation (finalAttrs: {
  pname = "koboldcpp";
  version = "1.72";

  src = fetchFromGitHub {
    owner = "LostRuins";
    repo = "koboldcpp";
    rev = "refs/tags/v${finalAttrs.version}";
    hash = "sha256-DePcBVNXIWIlOXyNeNMUFFIQxQuwqG8KBUh2/X7R6X8=";
  };

  enableParallelBuilding = true;

  nativeBuildInputs = [
    makeWrapper
    python3Packages.wrapPython
  ];

  # Python modules used by the launcher script; shared by buildInputs and pythonPath.
  pythonInputs = builtins.attrValues { inherit (python3Packages) tkinter customtkinter packaging; };

  buildInputs =
    [ tk ]
    ++ finalAttrs.pythonInputs
    ++ lib.optionals effectiveStdenv.isDarwin [
      darwinFrameworks.Accelerate
      darwinFrameworks.CoreVideo
      darwinFrameworks.CoreGraphics
      darwinFrameworks.CoreServices
    ]
    ++ lib.optionals metalSupport [
      darwinFrameworks.MetalKit
      darwinFrameworks.Foundation
      darwinFrameworks.MetalPerformanceShaders
    ]
    ++ lib.optionals openblasSupport [ openblas ]
    ++ lib.optionals cublasSupport [
      cudaPackages.libcublas
      cudaPackages.cuda_nvcc
      cudaPackages.cuda_cudart
      cudaPackages.cuda_cccl
    ]
    ++ lib.optionals clblastSupport [
      clblast
      ocl-icd
    ]
    ++ lib.optionals vulkanSupport [ vulkan-loader ];

  # Consumed by wrapPythonProgramsIn in postFixup.
  pythonPath = finalAttrs.pythonInputs;

  darwinLdFlags = lib.optionals stdenv.isDarwin [
    "-F${darwinFrameworks.CoreServices}/Library/Frameworks"
    "-F${darwinFrameworks.Accelerate}/Library/Frameworks"
    "-framework CoreServices"
    "-framework Accelerate"
  ];
  metalLdFlags = lib.optionals metalSupport [
    "-F${darwinFrameworks.Foundation}/Library/Frameworks"
    "-F${darwinFrameworks.Metal}/Library/Frameworks"
    "-framework Foundation"
    "-framework Metal"
  ];

  env.NIX_LDFLAGS = lib.concatStringsSep " " (finalAttrs.darwinLdFlags ++ finalAttrs.metalLdFlags);

  # Build the flag list first and join with a space, so that setting both
  # `march` and `mtune` yields two separate compiler flags rather than one
  # fused "-march=X-mtune=Y" token. Evaluates to "" when neither is set.
  env.NIX_CFLAGS_COMPILE = lib.concatStringsSep " " (
    lib.optional (march != "") (
      lib.warn "koboldcpp: the march argument is only kept for compatibility; use overrideAttrs instead" "-march=${march}"
    )
    ++ lib.optional (mtune != "") (
      lib.warn "koboldcpp: the mtune argument is only kept for compatibility; use overrideAttrs instead" "-mtune=${mtune}"
    )
  );

  # Disabled backends contribute an empty string.
  makeFlags = [
    (makeBool "LLAMA_OPENBLAS" openblasSupport)
    (makeBool "LLAMA_CUBLAS" cublasSupport)
    (makeBool "LLAMA_CLBLAST" clblastSupport)
    (makeBool "LLAMA_VULKAN" vulkanSupport)
    (makeBool "LLAMA_METAL" metalSupport)
    # `builtins.head` is only forced when cublasSupport is true; it fails if
    # cudaArches is empty in that case.
    (lib.optionalString cublasSupport "CUDA_DOCKER_ARCH=${builtins.head cudaArches}")
  ];

  # Install the launcher under an ".unwrapped" name next to the built shared
  # objects and embedded assets; postFixup creates the final `koboldcpp` wrapper.
  installPhase = ''
    runHook preInstall

    mkdir -p "$out/bin"

    install -Dm755 koboldcpp.py "$out/bin/koboldcpp.unwrapped"
    cp *.so "$out/bin"
    cp *.embd "$out/bin"

    ${lib.optionalString (!koboldLiteSupport) ''
      rm "$out/bin/kcpp_docs.embd"
      rm "$out/bin/klite.embd"
    ''}

    runHook postInstall
  '';

  # Remove an unused argument, mainly intended for Darwin to reduce warnings
  postPatch = ''
    substituteInPlace Makefile \
      --replace-warn " -s " " "
  '';

  # Wrap the script with its Python path, then add a `koboldcpp` entry point
  # that puts tk on PATH and, for CUDA builds, the driver libraries on
  # LD_LIBRARY_PATH.
  postFixup = ''
    wrapPythonProgramsIn "$out/bin" "$pythonPath"
    makeWrapper "$out/bin/koboldcpp.unwrapped" "$out/bin/koboldcpp" \
      --prefix PATH : ${lib.makeBinPath [ tk ]} ${libraryPathWrapperArgs}
  '';

  passthru.updateScript = gitUpdater { rev-prefix = "v"; };

  meta = {
    description = "Way to run various GGML and GGUF models";
    license = lib.licenses.agpl3Only;
    maintainers = with lib.maintainers; [
      maxstrid
      donteatoreo
    ];
    mainProgram = "koboldcpp";
    platforms = lib.platforms.unix;
  };
})