feat: add OpenVINO AI Plugins (#50)

frenchwr · web-flow · commit 44e9b8b24f66 · 2025-06-02T09:05:14.000+01:00
diff --git a/README.md b/README.md
@@ -23,6 +23,59 @@ distributions.</p>
 
 <p align="center">Published for <img src="https://raw.githubusercontent.com/anythingcodes/slack-emoji-for-techies/gh-pages/emoji/tux.png" align="top" width="24" /> with :gift_heart: by Snapcrafters</p>
 
+## OpenVINO™ AI Plugins
+
+This snap contains support for AI features including:
+
+  - Music Separation
+  - Noise Suppression
+  - Music Generation and Continuation
+  - Transcription
+  - Super Resolution
+
+The plugins come installed out-of-the-box and support running on Intel hardware only (CPU, GPU, and NPU). Instructions for using each of the features can be found in the [upstream GitHub repository](https://github.com/intel/openvino-plugins-ai-audacity/tree/main/doc/feature_doc).
+
+> [!IMPORTANT]
+> The models (roughly 6.2 GiB in total) are NOT built into the snap. To use the AI features, you must download and install them from the command line. Note that downloading the models may take several minutes or longer, depending on the speed of your internet connection. Please be patient!
+
+To ease the process of downloading and installing the models, an interactive command is available within the snap that can be invoked like so:
+
+```shell
+sudo audacity.fetch-models
+```
+
+This will provide you with an interactive menu where you can select the model you wish to download and install. Alternatively, if you wish to enable all of the AI features, you can simply pass the `--batch` flag:
+
+```shell
+sudo audacity.fetch-models --batch
+```
+
+
+> [!IMPORTANT]
+> Please ensure you are in the `render` Unix group on your system in order to access Intel accelerators for the plugins (Intel GPU and NPU).
+
+To check your current groups, please run the following from a terminal:
+
+```shell
+groups
+```
+
+If you do not see `render` listed in the output, you may add your current user to the group with the following:
+
+```shell
+sudo usermod -a -G render $USER
+```
+
+Now log out and back in to ensure your active session has the `render` group included.
+
+To ensure the device nodes have appropriate group permissions set, you may also run:
+
+```shell
+sudo chown root:render /dev/accel/accel*
+sudo chmod g+rw /dev/accel/accel*
+sudo chown root:render /dev/dri/render*
+sudo chmod g+rw /dev/dri/render*
+```
+
 ## How to contribute to this snap
 
 Thanks for your interest! Below you find instructions to help you contribute to this snap.
diff --git a/bin/fetch-models b/bin/fetch-models
@@ -0,0 +1,263 @@
+#!/bin/bash
+
+set -e
+set -E # ensure ERR trap is inherited by shell functions
+set -o pipefail
+
+SCRIPT_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" &>/dev/null && pwd -P)
+
+MODELS="${SNAP_DATA}/models/openvino-models"
+MUSICGEN_TMP="${SNAP_DATA}/tmp/musicgen_tmp"
+MUSICGEN="${MODELS}/musicgen"
+WHISPER_TMP="${SNAP_DATA}/tmp/whisper_tmp"
+WHISPER="${MODELS}"
+SEPARATION_TMP="${SNAP_DATA}/tmp/separation_tmp"
+SEPARATION="${MODELS}"
+SUPPRESSION_TMP="${SNAP_DATA}/tmp/suppression_tmp"
+SUPPRESSION="${MODELS}"
+RESOLUTION_TMP="${SNAP_DATA}/tmp/resolution_tmp"
+RESOLUTION="${MODELS}/audiosr"
+
+# Print the command-line help text to stdout, then terminate the script.
+usage() {
+  local script_name
+  script_name=$(basename "${BASH_SOURCE[0]}")
+
+  cat <<EOF
+Usage: ${script_name} [-h] [-v] [-b]
+
+Manage the installation of OpenVINO™ AI models for Audacity.
+
+This command must be run with sudo as it installs models to ${SNAP_DATA}, where write access
+is only permitted for the root user.
+
+Available options:
+
+-h, --help      Print this help and exit
+-v, --verbose   Print script debug info
+-b, --batch     Install all models in non-interactive mode
+EOF
+  exit
+}
+
+cleanup() {
+  RC=$?
+  rm -rf "${MUSICGEN_TMP}" "${WHISPER_TMP}" "${SEPARATION_TMP}" "${SUPPRESSION_TMP}" "${RESOLUTION_TMP}"
+  if [ "${RC}" -ne 0 ]; then
+    echo "Warning: the script is not exiting normally. You may need to run again. Pass the -v flag to show debug info."
+  fi
+  exit "${RC}"
+}
+
+trap cleanup SIGINT SIGTERM ERR
+
+silent() {
+  if [ "${verbose}" = 'no' ]; then
+    "$@" > /dev/null 2>&1
+  else
+    "$@"
+  fi
+}
+
+musicgen_status() {
+  if [ -d "${MUSICGEN}" ] && \
+     [ "$(find "${MUSICGEN}" -maxdepth 1 -type f | wc -l)" = '12' ] && \
+     [ "$(find "${MUSICGEN}/mono" -maxdepth 1 -type f | wc -l)" = '17' ] && \
+     [ "$(find "${MUSICGEN}/stereo" -maxdepth 1 -type f | wc -l)" = '17' ]; then 
+    echo ' (installed) '
+  fi
+  echo ''
+}
+
+# Print ' (installed) ' when exactly nine entries named 'ggml*' exist under the
+# Whisper install directory, then always print an empty line.
+whisper_status() {
+  if [[ -d "${WHISPER}" \
+    && "$(find "${WHISPER}" -name 'ggml*' | wc -l)" == '9' ]]; then
+    printf '%s\n' ' (installed) '
+  fi
+  printf '\n'
+}
+
+# Print ' (installed) ' when exactly two entries named 'htdemucs_v4*' exist
+# under the Music Separation install directory, then always print an empty line.
+separation_status() {
+  if [[ -d "${SEPARATION}" \
+    && "$(find "${SEPARATION}" -name 'htdemucs_v4*' | wc -l)" == '2' ]]; then
+    printf '%s\n' ' (installed) '
+  fi
+  printf '\n'
+}
+
+suppression_status() {
+  if [ -d "${SUPPRESSION}" ] && \
+     [ "$(find "${SUPPRESSION}" -name 'noise-suppression-denseunet-ll-0001*' | wc -l)" = '2' ] && \
+     [ "$(find "${SUPPRESSION}/deepfilternet2" -maxdepth 1 -type f | wc -l)" = '6' ] && \
+     [ "$(find "${SUPPRESSION}/deepfilternet3" -maxdepth 1 -type f | wc -l)" = '6' ]; then 
+    echo ' (installed) '
+  fi
+  echo ''
+}
+
+resolution_status() {
+  if [ -d "${RESOLUTION}" ] && \
+     [ "$(find "${RESOLUTION}" -maxdepth 1 -type f | wc -l)" = '13' ] && \
+     [ "$(find "${RESOLUTION}/basic" -maxdepth 1 -type f | wc -l)" = '2' ] && \
+     [ "$(find "${RESOLUTION}/speech" -maxdepth 1 -type f | wc -l)" = '2' ]; then 
+    echo ' (installed) '
+  fi
+  echo ''
+}
+
+install_musicgen() {
+  echo "
+Downloading Music Generation models from Hugging Face. Please be patient!
+  "
+  silent git clone https://huggingface.co/Intel/musicgen-static-openvino "${MUSICGEN_TMP}"
+  cd "${MUSICGEN_TMP}"
+  silent git checkout b2ad8083f3924ed704814b68c5df9cbbf2ad2aae
+  silent git lfs install
+  silent git lfs pull
+  mkdir -p "${MUSICGEN}"
+  silent unzip -o "${MUSICGEN_TMP}/musicgen_small_enc_dec_tok_openvino_models.zip" -d "${MUSICGEN}"
+  silent unzip -o "${MUSICGEN_TMP}/musicgen_small_mono_openvino_models.zip" -d "${MUSICGEN}"
+  silent unzip -o "${MUSICGEN_TMP}/musicgen_small_stereo_openvino_models.zip" -d "${MUSICGEN}"
+  rm -rf "${MUSICGEN_TMP}"
+  echo "Music Generation models (~2.8GB) successfully installed to ${MUSICGEN}"
+}
+
+install_whisper() {
+  echo "
+Downloading Whisper Transcription models from Hugging Face. Please be patient!
+  "
+  silent git clone https://huggingface.co/Intel/whisper.cpp-openvino-models "${WHISPER_TMP}"
+  cd "${WHISPER_TMP}"
+  silent git lfs install
+  silent git lfs pull
+  mkdir -p "${WHISPER}"
+  silent unzip -o "${WHISPER_TMP}/ggml-base-models.zip" -d "${WHISPER}"
+  silent unzip -o "${WHISPER_TMP}/ggml-small-models.zip" -d "${WHISPER}"
+  silent unzip -o "${WHISPER_TMP}/ggml-small.en-tdrz-models.zip" -d "${WHISPER}"
+  rm -rf "${WHISPER_TMP}"
+  echo "Whisper Transcription models (~1.5GB) successfully installed to ${WHISPER}"
+}
+
+# Clone the Music Separation model repository at a pinned commit and copy the
+# htdemucs_v4 .bin/.xml pair into ${SEPARATION}.
+# Leaves the working directory changed; the scratch checkout is removed.
+install_separation() {
+  local model_stem="${SEPARATION_TMP}/htdemucs_v4"
+
+  echo "
+Downloading Music Separation models from Hugging Face. Please be patient!
+  "
+  silent git clone https://huggingface.co/Intel/demucs-openvino "${SEPARATION_TMP}"
+  cd "${SEPARATION_TMP}"
+  silent git checkout 97fc578fb57650045d40b00bc84c7d156be77547
+
+  mkdir -p "${SEPARATION}"
+  cp "${model_stem}.bin" "${model_stem}.xml" "${SEPARATION}"
+
+  rm -rf "${SEPARATION_TMP}"
+  echo "Music Separation models (~99MB) successfully installed to ${SEPARATION}"
+}
+
+install_suppression() {
+  echo "
+Downloading Noise Suppression models from Hugging Face. Please be patient!
+  "
+  silent git clone https://huggingface.co/Intel/deepfilternet-openvino "${SUPPRESSION_TMP}"
+  cd "${SUPPRESSION_TMP}"
+  silent git checkout 995706bda3da69da0825074ba7dbc8a78067e980
+  silent git lfs install
+  silent git lfs pull
+  mkdir -p "${SUPPRESSION}"
+  silent unzip -o "${SUPPRESSION_TMP}/deepfilternet2.zip" -d "${SUPPRESSION}"
+  silent unzip -o "${SUPPRESSION_TMP}/deepfilternet3.zip" -d "${SUPPRESSION}"
+  silent wget -O "${SUPPRESSION}/noise-suppression-denseunet-ll-0001.xml" "https://storage.openvinotoolkit.org/repositories/open_model_zoo/2023.0/models_bin/1/noise-suppression-denseunet-ll-0001/FP16/noise-suppression-denseunet-ll-0001.xml"
+  silent wget -O "${SUPPRESSION}/noise-suppression-denseunet-ll-0001.bin" "https://storage.openvinotoolkit.org/repositories/open_model_zoo/2023.0/models_bin/1/noise-suppression-denseunet-ll-0001/FP16/noise-suppression-denseunet-ll-0001.bin"
+  rm -rf "${SUPPRESSION_TMP}"
+  echo "Noise Suppression models (~27MB) successfully installed to ${SUPPRESSION}"
+}
+
+install_resolution() {
+  echo "
+Downloading Super Resolution models from Hugging Face. Please be patient!
+  "
+  silent git clone https://huggingface.co/Intel/versatile_audio_super_resolution_openvino "${RESOLUTION_TMP}"
+  cd "${RESOLUTION_TMP}"
+  silent git lfs install
+  silent git lfs pull
+  mkdir -p "${RESOLUTION}"
+  silent unzip -o "${RESOLUTION_TMP}/versatile_audio_sr_base_openvino_models.zip" -d "${RESOLUTION}"
+  silent unzip -o "${RESOLUTION_TMP}/versatile_audio_sr_ddpm_basic_openvino_models.zip" -d "${RESOLUTION}"
+  silent unzip -o "${RESOLUTION_TMP}/versatile_audio_sr_ddpm_speech_openvino_models.zip" -d "${RESOLUTION}"
+  rm -rf "${RESOLUTION_TMP}"
+  echo "Super Resolution models (~2GB) successfully installed to ${RESOLUTION}"
+}
+
+# Rebuild the global `model_menu` prompt, tagging each entry with the output of
+# its *_status function.
+build_model_menu() {
+  local gen_tag asr_tag split_tag denoise_tag upscale_tag
+
+  # Command substitution drops trailing newlines, so each tag is either empty
+  # or the bare ' (installed) ' marker.
+  gen_tag=$(musicgen_status)
+  asr_tag=$(whisper_status)
+  split_tag=$(separation_status)
+  denoise_tag=$(suppression_status)
+  upscale_tag=$(resolution_status)
+
+  model_menu="
+-------------------------------------------------------------------------------------------------
+| Audacity OpenVINO™ plugins support several AI models available for download from Hugging Face |
+-------------------------------------------------------------------------------------------------
+
+1. Music Generation${gen_tag}
+2. Whisper Transcription${asr_tag}
+3. Music Separation${split_tag}
+4. Noise Suppression${denoise_tag}
+5. Super Resolution${upscale_tag}
+6. Exit
+
+Some models are several GB in size, so be mindful of your available disk space and network speed.
+
+To download and install a model, please select an option from the menu above and hit enter: "
+}
+
+parse_params() {
+  verbose='no' # default behavior is to run commands silently
+  batch_mode='no' # default behavior is interactive mode
+
+  while :; do
+    case "${1-}" in
+    -h | --help) usage ;;
+    -v | --verbose) verbose='yes' ;;
+    -b | --batch) batch_mode='yes' ;;
+    -?*) echo "Unknown option: $1" && exit 1 ;;
+    *) break ;;
+    esac
+    shift
+  done
+
+  return 0
+}
+
+# Interactive mode: show the model menu repeatedly and run the installer the
+# user picks, until "6" is chosen or standard input reaches end-of-file.
+loop_menu() {
+  local model_selection
+
+  while :; do
+    # The installers change directory into scratch checkouts that they later
+    # delete, so return to a directory that still exists before each round.
+    cd "${SCRIPT_DIR}"
+    build_model_menu
+    # `read` fails at end-of-file (Ctrl-D, or piped input running out). Treat
+    # that as a request to leave instead of letting `set -e` fire the ERR trap
+    # and report an abnormal exit.
+    if ! read -rp "${model_menu}" model_selection; then
+      echo
+      exit 0
+    fi
+    case "${model_selection}" in
+      1) install_musicgen ;;
+      2) install_whisper ;;
+      3) install_separation ;;
+      4) install_suppression ;;
+      5) install_resolution ;;
+      6) exit ;;
+      *) echo "
+Unknown option ${model_selection} selected." ;;
+    esac
+  done
+}
+
+parse_params "$@"
+
+if ! grep -qw "GenuineIntel" /proc/cpuinfo; then
+  echo "The OpenVINO™ AI models are only supported on Intel hardware. Exiting."
+  exit 1
+fi
+
+if [ "${SNAP_UID}" -ne 0 ]; then
+  >&2 echo "
+This tool installs models to ${SNAP_DATA}, 
+where write access is only permitted for the root user.
+Please re-run the command with sudo:
+
+sudo $(basename "${BASH_SOURCE[0]}")
+  "
+  exit 1
+fi
+
+if [ "${batch_mode}" = 'yes' ]; then
+  for model in musicgen whisper separation suppression resolution; do
+    cd "${SCRIPT_DIR}"
+    install_"${model}"
+  done
+else
+  loop_menu
+fi
diff --git a/snap/snapcraft.yaml b/snap/snapcraft.yaml