BMAD-METHOD/.claude/hooks/voice-manager.sh

#!/bin/bash
#
# File: .claude/hooks/voice-manager.sh
#
# AgentVibes - Finally, your AI Agents can Talk Back! Text-to-Speech WITH personality for AI Assistants!
# Website: https://agentvibes.org
# Repository: https://github.com/paulpreibisch/AgentVibes
#
# Co-created by Paul Preibisch with Claude AI
# Copyright (c) 2025 Paul Preibisch
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# DISCLAIMER: This software is provided "AS IS", WITHOUT WARRANTY OF ANY KIND,
# express or implied. Use at your own risk. See the Apache License for details.
#
# ---
#
# @fileoverview Voice Manager - Unified voice management for both ElevenLabs and Piper providers
# @context Central interface for listing, switching, previewing, and replaying TTS voices across providers
# @architecture Provider-aware operations with dynamic voice listing based on active provider
# @dependencies voices-config.sh (ElevenLabs mappings), piper-voice-manager.sh (Piper voices), provider-manager.sh
# @entrypoints Called by /agent-vibes:switch, /agent-vibes:list, /agent-vibes:whoami, /agent-vibes:replay commands
# @patterns Provider abstraction, numbered selection UI, silent mode for programmatic switching
# @related voices-config.sh, piper-voice-manager.sh, .claude/tts-voice.txt, .claude/audio/ (replay)

# Resolve the directory that holds this script. `pwd -P` gives the physical
# path, which is what the `source` calls for sibling scripts are based on.
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd -P)"
# voices-config.sh is expected to define the VOICES map used by the commands below.
source "$SCRIPT_DIR/voices-config.sh"

# Pick the .claude directory whose settings files are read and written:
#   1. $CLAUDE_PROJECT_DIR/.claude, when that variable is set and the
#      directory exists (project-specific settings, e.g. set by MCP)
#   2. the parent of this script's directory (direct slash command usage)
#   3. the global ~/.claude, when that parent is not a directory
if [[ -z "$CLAUDE_PROJECT_DIR" || ! -d "$CLAUDE_PROJECT_DIR/.claude" ]]; then
  # Direct usage context: derive the location from where the script lives
  SCRIPT_PATH="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
  CLAUDE_DIR="$(dirname "$SCRIPT_PATH")"

  # Fall back to the global directory if the derived one does not exist
  if [[ ! -d "$CLAUDE_DIR" ]]; then
    CLAUDE_DIR="$HOME/.claude"
  fi
else
  # Project context: use the project directory's .claude folder
  CLAUDE_DIR="$CLAUDE_PROJECT_DIR/.claude"
fi

# File that stores the name of the currently selected voice
VOICE_FILE="$CLAUDE_DIR/tts-voice.txt"

case "$1" in
  list)
    # List the voices available for the active TTS provider and mark the
    # currently selected one with "▶ ... (current)".

    # Provider file: project-level copy first, then the global ~/.claude copy
    PROVIDER_FILE="$CLAUDE_DIR/tts-provider.txt"
    if [[ ! -f "$PROVIDER_FILE" ]]; then
      PROVIDER_FILE="$HOME/.claude/tts-provider.txt"
    fi

    ACTIVE_PROVIDER="elevenlabs"  # default when no provider file exists
    if [[ -f "$PROVIDER_FILE" ]]; then
      ACTIVE_PROVIDER=$(cat "$PROVIDER_FILE")
    fi

    # Falls back to "Cowboy Bob" when the voice file cannot be read
    CURRENT_VOICE=$(cat "$VOICE_FILE" 2>/dev/null || echo "Cowboy Bob")

    if [[ "$ACTIVE_PROVIDER" == "piper" ]]; then
      echo "🎤 Available Piper TTS Voices:"
      echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"

      # List downloaded Piper voices (one .onnx model file per voice)
      if [[ -f "$SCRIPT_DIR/piper-voice-manager.sh" ]]; then
        source "$SCRIPT_DIR/piper-voice-manager.sh"
        VOICE_DIR=$(get_voice_storage_dir)

        # Collect the names in the current shell first. Counting inside a
        # `for ... done | sort` pipeline happens in a subshell, so the count
        # would be lost and the "no voices" hint would always be printed.
        PIPER_VOICES=()
        for onnx_file in "$VOICE_DIR"/*.onnx; do
          # The -f test also skips the literal pattern left by an unmatched glob
          if [[ -f "$onnx_file" ]]; then
            PIPER_VOICES+=("$(basename "$onnx_file" .onnx)")
          fi
        done
        VOICE_COUNT=${#PIPER_VOICES[@]}

        if [[ $VOICE_COUNT -eq 0 ]]; then
          echo "  (No Piper voices downloaded yet)"
          echo ""
          echo "Download voices with: /agent-vibes:provider download <voice-name>"
          echo "Examples: en_US-lessac-medium, en_GB-alba-medium"
        else
          for voice in "${PIPER_VOICES[@]}"; do
            if [[ "$voice" == "$CURRENT_VOICE" ]]; then
              echo "  ▶ $voice (current)"
            else
              echo "    $voice"
            fi
          done | sort
        fi
      fi
    else
      echo "🎤 Available ElevenLabs TTS Voices:"
      echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
      # Voice names are the keys of the VOICES map
      for voice in "${!VOICES[@]}"; do
        if [[ "$voice" == "$CURRENT_VOICE" ]]; then
          echo "  ▶ $voice (current)"
        else
          echo "    $voice"
        fi
      done | sort
    fi

    echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
    echo ""
    echo "Usage: voice-manager.sh switch <name>"
    echo "       voice-manager.sh preview"
    ;;

  preview)
    # Preview voices through play-tts.sh.
    #   preview <voice name>      - speak a sample sentence with that voice
    #   preview [first|last|<N>]  - play the first three voices alphabetically
    #                               (these keywords are accepted but not
    #                               otherwise interpreted here)
    # Exits 0 after a single-voice preview, 1 when the named voice is unknown.

    # Get play-tts.sh path
    SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
    TTS_SCRIPT="$SCRIPT_DIR/play-tts.sh"

    # A second argument that is not a keyword or a number is a voice name
    if [[ -n "$2" ]] && [[ "$2" != "first" ]] && [[ "$2" != "last" ]] && ! [[ "$2" =~ ^[0-9]+$ ]]; then
      VOICE_NAME="$2"

      # Known voice (exact, case-sensitive key of VOICES): play it and stop
      if [[ -n "${VOICES[$VOICE_NAME]}" ]]; then
        echo "🎤 Previewing voice: ${VOICE_NAME}"
        echo ""
        "$TTS_SCRIPT" "Hello, this is ${VOICE_NAME}. How do you like my voice?" "${VOICE_NAME}"
        exit 0
      fi

      echo "❌ Voice not found: ${VOICE_NAME}"
      echo ""
      echo "Available voices:"
      for voice in "${!VOICES[@]}"; do
        echo "  • $voice"
      done | sort
      # Report the failure to callers, as `switch` does for unknown voices
      exit 1
    fi

    echo "🎤 Voice Preview - Playing first 3 voices..."
    echo ""

    # Build the alphabetically sorted list of voice names. Reading line by
    # line avoids the word splitting / globbing of an unquoted $(sort ...)
    # and leaves IFS untouched; the -n test drops the blank line printf
    # emits when VOICES is empty.
    SORTED_VOICES=()
    while IFS= read -r voice; do
      [[ -n "$voice" ]] && SORTED_VOICES+=("$voice")
    done < <(printf '%s\n' "${!VOICES[@]}" | sort)

    # Play at most the first 3 voices.
    # NOTE(review): the single-voice branch passes the voice *name* to
    # play-tts.sh while this loop passes the mapped VOICES value —
    # presumably play-tts.sh accepts both; confirm.
    for voice in "${SORTED_VOICES[@]:0:3}"; do
      echo "🔊 ${voice}..."
      "$TTS_SCRIPT" "Hi, I'm ${voice}" "${VOICES[$voice]}"
      sleep 0.5
    done

    echo ""
    echo "Would you like to hear more? Reply 'yes' to continue."
    ;;

  switch)
    # Switch the active voice and persist it to $VOICE_FILE.
    #   switch                     - print a numbered voice list and exit 0
    #   switch <name|number>       - select by name (case-insensitive) or by
    #                                list number (numbers: non-Piper only)
    #   switch --silent <name>     - same, without the spoken introduction
    #   switch <name> --silent
    # Exits 1 when the requested voice (or multi-speaker model) is not found.
    VOICE_NAME="$2"
    SILENT_MODE=false

    # Check for --silent flag (accepted before or after the voice name)
    if [[ "$2" == "--silent" ]] || [[ "$3" == "--silent" ]]; then
      SILENT_MODE=true
      # If --silent is first arg, voice name is in $3
      [[ "$2" == "--silent" ]] && VOICE_NAME="$3"
    fi

    # Alphabetically sorted names from the VOICES map; used for the numbered
    # menu and for selection by number. Reading line by line avoids the
    # globbing of an unquoted $(sort ...) and leaves IFS untouched; the -n
    # test drops the blank line printf emits when VOICES is empty.
    SORTED_VOICES=()
    while IFS= read -r voice; do
      [[ -n "$voice" ]] && SORTED_VOICES+=("$voice")
    done < <(printf '%s\n' "${!VOICES[@]}" | sort)

    if [[ -z "$VOICE_NAME" ]]; then
      # Show numbered list for selection
      echo "🎤 Select a voice by number:"
      echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"

      # Get current voice
      CURRENT="Cowboy Bob"
      if [[ -f "$VOICE_FILE" ]]; then
        CURRENT=$(cat "$VOICE_FILE")
      fi

      # Display numbered list in two columns for compactness:
      # left column holds entries 1..HALF, right column the remainder
      HALF=$(( (${#SORTED_VOICES[@]} + 1) / 2 ))

      # Arithmetic loop instead of `seq`: runs zero times for an empty list
      # (BSD seq counts downwards when the end is below the start).
      for (( i = 0; i < HALF; i++ )); do
        NUM1=$((i + 1))
        VOICE1="${SORTED_VOICES[$i]}"

        # Format first column
        if [[ "$VOICE1" == "$CURRENT" ]]; then
          COL1=$(printf "%2d. %-20s ✓" "$NUM1" "$VOICE1")
        else
          COL1=$(printf "%2d. %-20s  " "$NUM1" "$VOICE1")
        fi

        # Format second column if it exists
        NUM2=$((i + HALF + 1))
        if [[ $((i + HALF)) -lt ${#SORTED_VOICES[@]} ]]; then
          VOICE2="${SORTED_VOICES[$((i + HALF))]}"
          if [[ "$VOICE2" == "$CURRENT" ]]; then
            COL2=$(printf "%2d. %-20s ✓" "$NUM2" "$VOICE2")
          else
            COL2=$(printf "%2d. %-20s  " "$NUM2" "$VOICE2")
          fi
          echo "  $COL1 $COL2"
        else
          echo "  $COL1"
        fi
      done

      echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
      echo ""
      echo "Enter number (1-${#SORTED_VOICES[@]}) or voice name:"
      echo "Usage: /agent-vibes:switch 5"
      echo "       /agent-vibes:switch \"Northern Terry\""
      exit 0
    fi

    # Detect active TTS provider (project-level file first, then global)
    PROVIDER_FILE=""
    if [[ -f "$CLAUDE_DIR/tts-provider.txt" ]]; then
      PROVIDER_FILE="$CLAUDE_DIR/tts-provider.txt"
    elif [[ -f "$HOME/.claude/tts-provider.txt" ]]; then
      PROVIDER_FILE="$HOME/.claude/tts-provider.txt"
    fi

    ACTIVE_PROVIDER="elevenlabs"  # default
    if [[ -n "$PROVIDER_FILE" ]]; then
      ACTIVE_PROVIDER=$(cat "$PROVIDER_FILE")
    fi

    # Voice lookup strategy depends on active provider
    if [[ "$ACTIVE_PROVIDER" == "piper" ]]; then
      # Piper voice lookup: Scan voice directory for .onnx files
      source "$SCRIPT_DIR/piper-voice-manager.sh"
      VOICE_DIR=$(get_voice_storage_dir)

      # Check if voice file exists (case-insensitive)
      FOUND=""
      shopt -s nullglob
      for onnx_file in "$VOICE_DIR"/*.onnx; do
        if [[ -f "$onnx_file" ]]; then
          voice=$(basename "$onnx_file" .onnx)
          if [[ "${voice,,}" == "${VOICE_NAME,,}" ]]; then
            FOUND="$voice"
            break
          fi
        fi
      done
      shopt -u nullglob

      # If not found, check multi-speaker registry
      if [[ -z "$FOUND" ]] && [[ -f "$SCRIPT_DIR/piper-multispeaker-registry.sh" ]]; then
        source "$SCRIPT_DIR/piper-multispeaker-registry.sh"

        # The registry answers with "<model>:<speaker id>", or nothing
        MULTISPEAKER_INFO=$(get_multispeaker_info "$VOICE_NAME")
        if [[ -n "$MULTISPEAKER_INFO" ]]; then
          MODEL="${MULTISPEAKER_INFO%%:*}"
          SPEAKER_ID="${MULTISPEAKER_INFO#*:}"

          # Verify the model file exists
          if [[ -f "$VOICE_DIR/${MODEL}.onnx" ]]; then
            # Store speaker name in tts-voice.txt
            echo "$VOICE_NAME" > "$VOICE_FILE"

            # Store model and speaker ID separately for play-tts-piper.sh
            echo "$MODEL" > "$CLAUDE_DIR/tts-piper-model.txt"
            echo "$SPEAKER_ID" > "$CLAUDE_DIR/tts-piper-speaker-id.txt"

            DESCRIPTION=$(get_multispeaker_description "$VOICE_NAME")
            echo "✅ Multi-speaker voice switched to: $VOICE_NAME"
            echo "🎤 Model: $MODEL.onnx (Speaker ID: $SPEAKER_ID)"
            if [[ -n "$DESCRIPTION" ]]; then
              echo "📝 Description: $DESCRIPTION"
            fi

            # Have the new voice introduce itself (unless silent mode)
            if [[ "$SILENT_MODE" != "true" ]]; then
              PLAY_TTS="$SCRIPT_DIR/play-tts.sh"
              if [[ -x "$PLAY_TTS" ]]; then
                "$PLAY_TTS" "Hi, I'm $VOICE_NAME. I'll be your voice assistant moving forward." > /dev/null 2>&1 &
              fi

              echo ""
              echo "💡 Tip: To hear automatic TTS narration, enable the Agent Vibes output style:"
              echo "   /output-style Agent Vibes"
            fi
            exit 0
          else
            echo "❌ Multi-speaker model not found: $MODEL.onnx"
            echo ""
            echo "Download it with: /agent-vibes:provider download"
            exit 1
          fi
        fi
      fi

      if [[ -z "$FOUND" ]]; then
        echo "❌ Piper voice not found: $VOICE_NAME"
        echo ""
        echo "Available Piper voices:"
        shopt -s nullglob
        for onnx_file in "$VOICE_DIR"/*.onnx; do
          if [[ -f "$onnx_file" ]]; then
            echo "  - $(basename "$onnx_file" .onnx)"
          fi
        done | sort
        shopt -u nullglob
        echo ""
        if [[ -f "$SCRIPT_DIR/piper-multispeaker-registry.sh" ]]; then
          echo "Multi-speaker voices (requires 16Speakers.onnx):"
          source "$SCRIPT_DIR/piper-multispeaker-registry.sh"
          # The part of each registry entry before the first ':' is the name
          for entry in "${MULTISPEAKER_VOICES[@]}"; do
            name="${entry%%:*}"
            echo "  - $name"
          done | sort
          echo ""
        fi
        echo "Download extra voices with: /agent-vibes:provider download"
        exit 1
      fi
      # NOTE(review): the multi-speaker branch above writes
      # tts-piper-model.txt / tts-piper-speaker-id.txt, but selecting a
      # regular Piper voice here never clears them — confirm that
      # play-tts-piper.sh ignores stale copies of those files.
    else
      # ElevenLabs voice lookup
      # Check if input is a number
      if [[ "$VOICE_NAME" =~ ^[0-9]+$ ]]; then
        # Get voice by number (adjust for 0-based index). The 10# prefix
        # forces base 10 so zero-padded input such as "08" is not rejected
        # as an invalid octal literal.
        INDEX=$((10#$VOICE_NAME - 1))

        if [[ $INDEX -ge 0 && $INDEX -lt ${#SORTED_VOICES[@]} ]]; then
          VOICE_NAME="${SORTED_VOICES[$INDEX]}"
          FOUND="${SORTED_VOICES[$INDEX]}"
        else
          echo "❌ Invalid number. Please choose between 1 and ${#SORTED_VOICES[@]}"
          exit 1
        fi
      else
        # Check if voice exists (case-insensitive)
        FOUND=""
        for voice in "${!VOICES[@]}"; do
          if [[ "${voice,,}" == "${VOICE_NAME,,}" ]]; then
            FOUND="$voice"
            break
          fi
        done
      fi

      if [[ -z "$FOUND" ]]; then
        echo "❌ Unknown voice: $VOICE_NAME"
        echo ""
        echo "Available voices:"
        for voice in "${!VOICES[@]}"; do
          echo "  - $voice"
        done | sort
        exit 1
      fi
    fi

    # Persist the canonical (correctly cased) voice name
    echo "$FOUND" > "$VOICE_FILE"
    echo "✅ Voice switched to: $FOUND"

    # Show voice ID only for ElevenLabs voices
    if [[ "$ACTIVE_PROVIDER" != "piper" ]] && [[ -n "${VOICES[$FOUND]}" ]]; then
      echo "🎤 Voice ID: ${VOICES[$FOUND]}"
    fi

    # Have the new voice introduce itself (unless silent mode)
    if [[ "$SILENT_MODE" != "true" ]]; then
      SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
      PLAY_TTS="$SCRIPT_DIR/play-tts.sh"
      if [[ -x "$PLAY_TTS" ]]; then
        # Runs in the background with output discarded so the command returns immediately
        "$PLAY_TTS" "Hi, I'm $FOUND. I'll be your voice assistant moving forward." "$FOUND" > /dev/null 2>&1 &
      fi

      echo ""
      echo "💡 Tip: To hear automatic TTS narration, enable the Agent Vibes output style:"
      echo "   /output-style Agent Vibes"
    fi
    ;;

  get)
    # Print the stored voice name, or the default "Cowboy Bob" when no
    # voice file exists yet.
    if [[ ! -f "$VOICE_FILE" ]]; then
      echo "Cowboy Bob"
    else
      cat "$VOICE_FILE"
    fi
    ;;

  whoami)
    # Print a summary of the active provider, voice, sentiment and personality.
    echo "🎤 Current Voice Configuration"
    echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"

    # Provider: prefer the project-level file, otherwise the global one
    PROVIDER_FILE="$CLAUDE_DIR/tts-provider.txt"
    [[ -f "$PROVIDER_FILE" ]] || PROVIDER_FILE="$HOME/.claude/tts-provider.txt"

    if [[ ! -f "$PROVIDER_FILE" ]]; then
      # No provider file anywhere: report the ElevenLabs default
      echo "Provider: ElevenLabs (Premium AI)"
    else
      ACTIVE_PROVIDER=$(cat "$PROVIDER_FILE")
      case "$ACTIVE_PROVIDER" in
        elevenlabs)
          echo "Provider: ElevenLabs (Premium AI)"
          ;;
        piper)
          echo "Provider: Piper TTS (Free, Offline)"
          ;;
        *)
          # Unrecognised value: show it verbatim
          echo "Provider: $ACTIVE_PROVIDER"
          ;;
      esac
    fi

    # Voice: stored name, or the default when nothing has been saved
    CURRENT_VOICE="Cowboy Bob"
    if [[ -f "$VOICE_FILE" ]]; then
      CURRENT_VOICE=$(cat "$VOICE_FILE")
    fi
    echo "Voice: $CURRENT_VOICE"

    # Sentiment and personality are read from the global ~/.claude directory.
    # A sentiment, when present, takes priority over the personality.
    SENTIMENT_FILE="$HOME/.claude/tts-sentiment.txt"
    PERSONALITY_FILE="$HOME/.claude/tts-personality.txt"

    if [[ -f "$SENTIMENT_FILE" ]]; then
      SENTIMENT=$(cat "$SENTIMENT_FILE")
      echo "Sentiment: $SENTIMENT (active)"
      PERSONALITY_STATE="overridden by sentiment"
    else
      PERSONALITY_STATE="active"
    fi

    if [[ -f "$PERSONALITY_FILE" ]]; then
      PERSONALITY=$(cat "$PERSONALITY_FILE")
      echo "Personality: $PERSONALITY ($PERSONALITY_STATE)"
    elif [[ "$PERSONALITY_STATE" == "active" ]]; then
      # Neither sentiment nor personality is configured
      echo "Personality: normal"
    fi

    echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
    ;;

  list-simple)
    # Plain, sorted, one-name-per-line voice list for the active provider
    # (no decoration, so it is easy to parse).

    # Locate the provider file: project-level first, then global
    PROVIDER_FILE="$CLAUDE_DIR/tts-provider.txt"
    if [[ ! -f "$PROVIDER_FILE" ]]; then
      PROVIDER_FILE="$HOME/.claude/tts-provider.txt"
    fi

    # ElevenLabs is assumed unless a provider file says otherwise
    if [[ -f "$PROVIDER_FILE" ]]; then
      ACTIVE_PROVIDER=$(cat "$PROVIDER_FILE")
    else
      ACTIVE_PROVIDER="elevenlabs"
    fi

    case "$ACTIVE_PROVIDER" in
      piper)
        # Piper: one voice per downloaded .onnx model file
        if [[ -f "$SCRIPT_DIR/piper-voice-manager.sh" ]]; then
          source "$SCRIPT_DIR/piper-voice-manager.sh"
          VOICE_DIR=$(get_voice_storage_dir)
          for model_path in "$VOICE_DIR"/*.onnx; do
            # Skips the literal pattern left behind by an unmatched glob
            if [[ -f "$model_path" ]]; then
              basename "$model_path" .onnx
            fi
          done | sort
        fi
        ;;
      *)
        # Any other provider: the keys of the VOICES map
        for voice_name in "${!VOICES[@]}"; do
          echo "$voice_name"
        done | sort
        ;;
    esac
    ;;

  replay)
    # Replay the Nth most recent TTS audio file from history.
    #   $2 - N, 1..10 (default 1 = most recent)
    # Exits 1 on an invalid N, a missing audio directory, or when fewer
    # than N files exist.

    # Start from a known-empty value so an AUDIO_DIR inherited from the
    # environment cannot short-circuit the fallback logic below.
    AUDIO_DIR=""
    if [[ -n "$CLAUDE_PROJECT_DIR" ]]; then
      AUDIO_DIR="$CLAUDE_PROJECT_DIR/.claude/audio"
    else
      # Fallback: walk up from the current directory looking for .claude
      CURRENT_DIR="$PWD"
      while [[ "$CURRENT_DIR" != "/" ]]; do
        if [[ -d "$CURRENT_DIR/.claude" ]]; then
          AUDIO_DIR="$CURRENT_DIR/.claude/audio"
          break
        fi
        CURRENT_DIR=$(dirname "$CURRENT_DIR")
      done
      # Final fallback to global if no project .claude found
      if [[ -z "$AUDIO_DIR" ]]; then
        AUDIO_DIR="$HOME/.claude/audio"
      fi
    fi

    # Default to replay last audio (N=1)
    N="${2:-1}"

    # Validate N is a number
    if ! [[ "$N" =~ ^[0-9]+$ ]]; then
      echo "❌ Invalid argument. Please use a number (1-10)"
      echo "Usage: /agent-vibes:replay [N]"
      echo "  N=1 - Last audio (default)"
      echo "  N=2 - Second-to-last"
      echo "  N=3 - Third-to-last"
      exit 1
    fi

    # Normalise to base 10 so zero-padded input ("08", "09") is not parsed
    # as an invalid octal literal by the numeric comparisons below.
    N=$((10#$N))

    # Check bounds
    if [[ $N -lt 1 || $N -gt 10 ]]; then
      echo "❌ Number out of range. Please choose 1-10"
      exit 1
    fi

    if [[ ! -d "$AUDIO_DIR" ]]; then
      echo "❌ No audio history found"
      echo "Audio files are stored in: $AUDIO_DIR"
      exit 1
    fi

    # Get list of audio files sorted by time (newest first), read once
    # into an array so both the lookup and the total use the same listing.
    # NOTE(review): only tts-*.mp3 files are considered — confirm whether
    # any provider writes its history with a different extension.
    AUDIO_FILES=()
    while IFS= read -r audio_path; do
      AUDIO_FILES+=("$audio_path")
    done < <(ls -t "$AUDIO_DIR"/tts-*.mp3 2>/dev/null)
    TOTAL=${#AUDIO_FILES[@]}

    if [[ $N -gt $TOTAL ]]; then
      echo "❌ Audio #$N not found in history"
      echo "Total audio files available: $TOTAL"
      exit 1
    fi

    # Get the Nth most recent file (array is 0-based)
    AUDIO_FILE="${AUDIO_FILES[$((N - 1))]}"

    echo "🔊 Replaying audio #$N:"
    echo "   File: $(basename "$AUDIO_FILE")"
    echo "   Path: $AUDIO_FILE"

    # Play the audio file in background, trying each player until one succeeds
    (paplay "$AUDIO_FILE" 2>/dev/null || aplay "$AUDIO_FILE" 2>/dev/null || mpg123 "$AUDIO_FILE" 2>/dev/null) &
    ;;

  *)
    # Unknown or missing command: print usage for every implemented
    # subcommand and exit non-zero.
    echo "Usage: voice-manager.sh [list|list-simple|preview|switch|get|replay|whoami] [voice_name]"
    echo ""
    echo "Commands:"
    echo "  list                    - List all available voices"
    echo "  list-simple             - List voice names only, one per line"
    echo "  preview [voice_name]    - Preview a voice (default: first 3 voices)"
    echo "  switch <voice_name>     - Switch to a different voice"
    echo "                            (add --silent to skip the spoken intro)"
    echo "  get                     - Get current voice name"
    echo "  replay [N]              - Replay Nth most recent audio (default: 1)"
    echo "  whoami                  - Show current voice and personality"
    exit 1
    ;;
esac