Train from the command line

The files in the `cli` directory allow you to train wake words from the command line without needing to use the Jupyter notebook or a web browser. Basically, the logic from the notebook has been placed in separate shell scripts and python files wrapped by 3 high-level scripts that do the following: * setup_python_venv: Creates a Python virtual environment with all the packages needed to train. The venv is created in the container's /data directory and is therefore stored on the host, not in the container's root docker volume. * setup_training_datasets: Downloads, extracts and converts the MIT RIR, FMA, Audioset and Negative training reference datasets. Also stored in /data. * train_wake_word: Generates the wake word samples, augments them with the audio from the training datasets, and finally runs the microwakeword training. The resulting model tflite and json files are placed in the /data/output directory. See the README.md file for much more information.
2026-06-12 20:10:19 -06:00 · 2025-12-27 12:32:06 -07:00
parent 4dd7503248
commit cb81f7f02d
21 changed files with 2468 additions and 0 deletions
--- a/cli/setup_python_venv
+++ b/cli/setup_python_venv
@@ -0,0 +1,183 @@
+#!/bin/bash
+PROGDIR="$(dirname $(realpath $0))"
+
+KNOWN_ARGS=( data-dir python gpu no-gpu )
+source "${PROGDIR}/shell.functions"
+
+if [ ${#UNKNOWN_ARGS[@]} -gt 0 ] ; then
+    echo "Unknown argument(s): ${UNKNOWN_ARGS[*]}" >&2
+    HELP=true
+fi
+
+if [ "${HELP}" == "true" ] ; then
+    cat <<EOF >&2
+Usage: setup_python_venv [ --gpu | --no-gpu ] [ --verbose ]
+
+Options:
+--gpu:     Install the GPU-capable versions of packages if available.  This
+           is the default if the script detects that a GPU is available.
+
+--no-gpu:  Install the non-GPU-capable versions of packages even if
+           GPU-capable packages are available.  This is the default if the script
+           detects that a GPU is NOT available.
+
+--verbose: Print the detailed "pip install" output.
+
+EOF
+    exit 1
+fi
+
+[ -n "${DATA_DIR}" ] && DATA_DIR="$(realpath ${DATA_DIR})"
+[ -d  "${DATA_DIR}" ] || {
+    echo "Data directory '${DATA_DIR}' doesn't exist." >&2
+    exit 1
+}
+
+cd "${DATA_DIR}"
+
+[ -z "${GPU}" ] && {
+    GPU=false
+    [ -c /dev/nvidiactl ] && {
+        GPU=true
+        echo "   Nvidia GPU detected"
+    }
+}
+
+"${GPU}" || export CUDA_VISIBLE_DEVICES=-1
+
+VENV="${DATA_DIR}/.venv"
+[ -n "${VIRTUAL_ENV}" ] && deactivate
+
+if [ -n "${PYTHON}" ] ; then
+    PYTHONS=( "${PYTHON}" )
+    unset PYTHON
+else
+    PYTHONS=( python3.12 python3.10 )
+fi
+
+for p in "${PYTHONS[@]}" ; do
+    "${p}" --version &>/dev/null && { PYTHON="${p}" ; break ; }
+done
+
+[ -n "${PYTHON}" ] || {
+    echo "A python 3.12 or 3.10 interpreter wasn't found.  You 'll need to install one before proceeding." >&2
+    exit 1
+}
+
+if [ -d  "${VENV}" ] ; then
+    if [ -f "${DATA_DIR}/.mww-data-dir" ] ; then
+        source "${VENV}/bin/activate" || {
+            echo "Unable to activate existing virtualenv '${VENV}'.  You should delete it and try again." >&2
+            exit 1
+        }
+    else
+        rm -rf "${VENV}"
+    fi
+fi
+
+echo "===== Setting up Python environment ${VENV} ====="
+
+if [ -z "$VIRTUAL_ENV" ] ; then
+    echo "   ===== Creating new virtualenv at '${VENV}' ====="
+else
+    echo "   ===== Updating virtualenv at '${VENV}' ====="
+fi
+${PYTHON} -m venv --upgrade-deps "${VENV}"
+source "${VENV}/bin/activate"
+
+set -euo pipefail
+
+declare -a progfiles=( $(find ${PROGDIR} -mindepth 1 -maxdepth 1 -executable -type f) )
+progfiles+=( "${PROGDIR}/shell.functions" )
+
+for f in "${progfiles[@]}" ; do
+    ln -sfr "${f}" ".venv/bin/$(basename ${f})"
+done
+
+#
+# Pip doesn't process packages from requirements.txt in
+# order but order is important because tensorflow, torch,
+# onnxruntime and micro-wake-word all depend on CUDA packages
+# at various versions. They need to be installed in this specific
+# order or they may not be able to use the GPU.
+#
+export PIP_PROGRESS_BAR=off
+export PIP_NO_COLOR=1
+export PIP_QUIET=0
+
+pip_install() {
+    if $VERBOSE ; then
+        pip install "$@" || return 1
+    else
+        { pip install "$@" || return 1 ; } | stdbuf -i0 -o0 tr -d '[:print:]' | stdbuf -i0 -o0 tr '\n' '.'
+    fi
+    echo
+}
+
+START_TS=$EPOCHSECONDS
+
+echo "   ===== Installing common requirements ====="
+pip_install -r "${PROGDIR}/requirements.txt"
+
+${GPU} && tfgpu='[and-cuda]' || tfgpu=""
+echo "   ===== Installing Tensorflow${tfgpu} ====="
+pip_install ai_edge_litert "tensorflow${tfgpu}==2.20.0" "tensorboard==2.20.0" \
+    "tensorboard-data-server==0.7.2"
+
+${GPU} && torchgpu='--index-url https://download.pytorch.org/whl/cu129' || torchgpu=""
+echo "   ===== Installing torch and torchaudio ${torchgpu:+[cuda]} ====="
+pip_install "torch==2.9.1" "torchaudio==2.9.1" ${torchgpu}
+
+echo "   ===== Checking microwakeword ====="
+MWW="${DATA_DIR}/tools/microWakeWord"
+if [ ! -d "${MWW}" ] || [ -n "$(git -C "${MWW}" status --porcelain)" ] ; then
+    rm -rf "${MWW}" || :
+    echo "   Cloning micro-wake-word to ${DATA_DIR}/tools"
+    git clone https://github.com/TaterTotterson/micro-wake-word "${MWW}" &>/dev/null
+fi
+echo "   Installing microwakeword"
+pip_install -e "${MWW}"
+
+echo "   ===== Checking piper-sample-generator ====="
+PSG="${DATA_DIR}/tools/piper-sample-generator"
+if [ ! -d "${PSG}" ] || [ -n "$(git -C ${PSG} status --porcelain)" ] ; then
+    rm -rf "${PSG}" || :
+    echo "   Cloning piper-sample-generator to ${DATA_DIR}/tools"
+    git clone https://github.com/rhasspy/piper-sample-generator "${PSG}" &>/dev/null
+fi
+echo "   Installing piper-sample-generator"
+pip_install -e "${PSG}"
+git -C tools/piper-sample-generator clean -fd &>/dev/null
+
+MODELS_DIR="${PSG}/models"
+MODEL_NAME="en_US-libritts_r-medium.pt"
+MODEL_FILE="${MODELS_DIR}/${MODEL_NAME}"
+MODEL_URL="https://github.com/rhasspy/piper-sample-generator/releases/download/v2.0.0/${MODEL_NAME}"
+if [ ! -f "${MODEL_FILE}" ] ; then
+    echo "      Downloading ${MODEL_NAME} for piper-sample-generator"
+    curl -sfL "${MODEL_URL}" -o "${MODEL_FILE}"
+fi
+
+if [ ! -f "${MODEL_FILE}.json" ] ; then
+    echo "      Downloading ${MODEL_NAME}.json for piper-sample-generator"
+    curl -sfL "${MODEL_URL}.json" -o "${MODEL_FILE}.json"
+fi
+
+${GPU} && onnxgpu='-gpu[cuda]' || onnxgpu=""
+echo "   ===== Installing onnxruntime${onnxgpu} ====="
+pip_install "onnxruntime${onnxgpu}>=1.16.0"
+
+echo "   ===== Installing keras ====="
+# keras 3.13 has "issues" so we need to back down to 3.12.
+pip_install "keras==3.12.0"
+
+${PROGDIR}/test_python --data-dir="${DATA_DIR}"
+
+touch .mww-data-dir
+END_TS=$EPOCHSECONDS
+
+echo "Run 'source ${VENV}/bin/activate' to activate the new virtualenv in the current shell."
+
+print_elapsed_time "${START_TS}" "${END_TS}" "Python package installation complete"
+
+