{
  lib,
  stdenv,
  cmake,
  apple-sdk_11,
  ninja,
  fetchFromGitHub,
  SDL2,
  wget,
  which,
  autoAddDriverRunpath,
  makeWrapper,
  metalSupport ? stdenv.hostPlatform.isDarwin && stdenv.hostPlatform.isAarch64,
  coreMLSupport ? stdenv.hostPlatform.isDarwin && false, # FIXME currently broken
  config,
  cudaSupport ? config.cudaSupport,
  cudaPackages ? { },
  rocmSupport ? config.rocmSupport,
  rocmPackages ? { },
  rocmGpuTargets ? builtins.concatStringsSep ";" rocmPackages.clr.gpuTargets,
  vulkanSupport ? false,
  shaderc,
  vulkan-headers,
  vulkan-loader,
  withSDL ? true,
}:

assert metalSupport -> stdenv.hostPlatform.isDarwin;
assert coreMLSupport -> stdenv.hostPlatform.isDarwin;

let
  # It's necessary to consistently use backendStdenv when building with CUDA support,
  # otherwise we get libstdc++ errors downstream.
  # cuda imposes an upper bound on the gcc version, e.g. the latest gcc compatible with cudaPackages_11 is gcc11
  effectiveStdenv = if cudaSupport then cudaPackages.backendStdenv else stdenv;

  inherit (lib)
    cmakeBool
    cmakeFeature
    optional
    optionals
    optionalString
    forEach
    ;

  darwinBuildInputs = [ apple-sdk_11 ];

  cudaBuildInputs = with cudaPackages; [
    cuda_cccl # <nv/target>
    # A temporary hack for reducing the closure size, remove once cudaPackages
    # have stopped using lndir: https://github.com/NixOS/nixpkgs/issues/271792
    cuda_cudart
    libcublas
  ];

  rocmBuildInputs = with rocmPackages; [
    clr
    hipblas
    rocblas
  ];

  vulkanBuildInputs = [
    shaderc
    vulkan-headers
    vulkan-loader
  ];
in
effectiveStdenv.mkDerivation (finalAttrs: {
  pname = "whisper-cpp";
  version = "1.7.2";

  src = fetchFromGitHub {
    owner = "ggerganov";
    repo = "whisper.cpp";
    rev = "refs/tags/v${finalAttrs.version}";
    hash = "sha256-y30ZccpF3SCdRGa+P3ddF1tT1KnvlI4Fexx81wZxfTk=";
  };

  # The upstream download script tries to download the models to the
  # directory of the script, which is not writable due to being
  # inside the nix store. This patch changes the script to download
  # the models to the current directory it is being run from.
  patches = [ ./download-models.patch ];

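  # Some example CMakeLists.txt files ship without an install() rule, so
  # postPatch appends a default one; otherwise those binaries would not be
  # installed. In the indented string below, ''${TARGET} is Nix's escape for a
  # literal ${TARGET}: the single-quoted echo writes it verbatim into the
  # CMakeLists.txt, where CMake (not the shell) expands it.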
  postPatch = ''
    for target in examples/{bench,command,main,quantize,server,stream,talk}/CMakeLists.txt; do
      if ! grep -q -F 'install(' $target; then
        echo 'install(TARGETS ''${TARGET} RUNTIME)' >> $target
      fi
    done
  '';

  nativeBuildInputs =
    [
      cmake
      ninja
      which
      makeWrapper
    ]
    ++ lib.optionals cudaSupport [
      cudaPackages.cuda_nvcc
      autoAddDriverRunpath
    ];

  buildInputs =
    optional withSDL SDL2
    ++ optionals effectiveStdenv.hostPlatform.isDarwin darwinBuildInputs
    ++ optionals cudaSupport cudaBuildInputs
    ++ optionals rocmSupport rocmBuildInputs
    ++ optionals vulkanSupport vulkanBuildInputs;

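  # cmakeBool and cmakeFeature (inherited from lib above) render CMake cache
  # entries; as far as I can tell, (cmakeBool "GGML_LTO" true) ends up as
  # "-DGGML_LTO:BOOL=TRUE" and (cmakeFeature "CMAKE_C_COMPILER" "hipcc") as
  # "-DCMAKE_C_COMPILER:STRING=hipcc" on the cmake command line.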
  cmakeFlags =
    [
      (cmakeBool "WHISPER_BUILD_EXAMPLES" true)
      (cmakeBool "GGML_CUDA" cudaSupport)
      (cmakeBool "GGML_HIPBLAS" rocmSupport)
      (cmakeBool "GGML_VULKAN" vulkanSupport)
      (cmakeBool "WHISPER_SDL2" withSDL)
      (cmakeBool "GGML_LTO" true)
      (cmakeBool "GGML_NATIVE" false)
      (cmakeBool "BUILD_SHARED_LIBS" (!effectiveStdenv.hostPlatform.isStatic))
    ]
    ++ optionals (effectiveStdenv.hostPlatform.isx86 && !effectiveStdenv.hostPlatform.isStatic) [
      (cmakeBool "GGML_BACKEND_DL" true)
      (cmakeBool "GGML_CPU_ALL_VARIANTS" true)
    ]
    ++ optionals cudaSupport [
      (cmakeFeature "CMAKE_CUDA_ARCHITECTURES" cudaPackages.flags.cmakeCudaArchitecturesString)
    ]
    ++ optionals rocmSupport [
      (cmakeFeature "CMAKE_C_COMPILER" "hipcc")
      (cmakeFeature "CMAKE_CXX_COMPILER" "hipcc")
      # Build all targets supported by rocBLAS. When updating, search for TARGET_LIST_ROCM
      # in https://github.com/ROCmSoftwarePlatform/rocBLAS/blob/develop/CMakeLists.txt
      # and select the line that matches the current nixpkgs version of rocBLAS.
      "-DAMDGPU_TARGETS=${rocmGpuTargets}"
    ]
    ++ optionals coreMLSupport [
      (cmakeBool "WHISPER_COREML" true)
      (cmakeBool "WHISPER_COREML_ALLOW_FALLBACK" true)
    ]
    ++ optionals metalSupport [
      (cmakeFeature "CMAKE_C_FLAGS" "-D__ARM_FEATURE_DOTPROD=1")
      (cmakeBool "GGML_METAL" true)
      (cmakeBool "GGML_METAL_EMBED_LIBRARY" true)
    ];

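  # Upstream installs the examples under generic names (main, bench, server,
  # ...); postInstall below renames them so everything this package ships is
  # namespaced, e.g. "server" should end up as "whisper-cpp-server".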
  postInstall = ''
    # Add "whisper-cpp" prefix before every command
    mv -v $out/bin/{main,whisper-cpp}

    for file in $out/bin/*; do
      if [[ -x "$file" && -f "$file" && "$(basename $file)" != "whisper-cpp" ]]; then
        mv -v "$file" "$out/bin/whisper-cpp-$(basename $file)"
      fi
    done

    install -v -D -m755 $src/models/download-ggml-model.sh $out/bin/whisper-cpp-download-ggml-model

    wrapProgram $out/bin/whisper-cpp-download-ggml-model \
      --prefix PATH : ${lib.makeBinPath [ wget ]}
  '';

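  # Illustrative use of the wrapped download script (model names follow
  # upstream's download-ggml-model.sh): `whisper-cpp-download-ggml-model base.en`
  # should fetch ggml-base.en.bin into the current working directory, thanks to
  # the download-models.patch above.
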
  # rocmSupport multiplies the build time by the number of GPU targets, which
  # takes around 30 minutes on a 16-core system.
  requiredSystemFeatures = optionals rocmSupport [ "big-parallel" ];

  doInstallCheck = true;
  installCheckPhase = ''
    runHook preInstallCheck
    $out/bin/whisper-cpp --help > /dev/null
    runHook postInstallCheck
  '';

  meta = {
    description = "Port of OpenAI's Whisper model in C/C++";
    longDescription = ''
      To download the models as described in the project's readme, you may
      use the `whisper-cpp-download-ggml-model` binary from this package.
    '';
    homepage = "https://github.com/ggerganov/whisper.cpp";
    license = lib.licenses.mit;
    mainProgram = "whisper-cpp";
    platforms = lib.platforms.all;
    broken = coreMLSupport;
    badPlatforms = optionals cudaSupport lib.platforms.darwin;
    maintainers = with lib.maintainers; [
      dit7ya
      hughobrien
      aviallon
    ];
  };
})