Files
vibeline/transcribe.sh
2025-04-07 16:15:05 +01:00

74 lines
2.0 KiB
Bash
Executable File

#!/bin/bash
#
# Transcribe a single audio file with the `whisper` command-line tool.
#
# Usage: transcribe.sh [-f] <audio_file>
#   -f  Re-transcribe even if a transcript for this file already exists.
#
# Environment (may be supplied by a .env file in the current directory):
#   VOICE_MEMOS_DIR  Base directory; transcripts are written to
#                    $VOICE_MEMOS_DIR/transcripts (default: VoiceMemos).
#   WHISPER_MODEL    Value passed to whisper's --model option. When unset or
#                    empty the option is omitted and whisper picks its default.
#
# Exit status: 0 on success (or when the transcript already exists and -f was
# not given), non-zero on usage errors or when transcription fails.

# Print the usage line.
usage() {
  echo "Usage: $0 [-f] <audio_file>"
}

# Parse arguments
force_flag=""
while getopts "f" opt; do
  case "$opt" in
    f) force_flag="--force" ;;
    # getopts has already printed a diagnostic for the unknown option;
    # stop here instead of silently carrying on.
    *)
      usage >&2
      exit 1
      ;;
  esac
done
shift $((OPTIND - 1))

# Load environment variables
[ -f .env ] && source .env

# Check if a file argument was provided
if [ $# -ne 1 ]; then
  usage >&2
  exit 1
fi

# Get the input file
input_file="$1"

# Check if the input file exists
if [ ! -f "$input_file" ]; then
  echo "Error: File $input_file does not exist" >&2
  exit 1
fi

# A name starting with '-' would be parsed as an option by ffprobe/whisper.
case "$input_file" in
  -*) input_file="./$input_file" ;;
esac

# Set the directory paths
VOICE_MEMOS_DIR="${VOICE_MEMOS_DIR:-VoiceMemos}"
TRANSCRIPT_DIR="$VOICE_MEMOS_DIR/transcripts"

# Create transcripts directory if it doesn't exist
if ! mkdir -p "$TRANSCRIPT_DIR"; then
  echo "Error: Could not create directory $TRANSCRIPT_DIR" >&2
  exit 1
fi

# Get the filename without the path and without its last extension.
# whisper names its output after the input's basename minus the final
# extension, so stripping only ".m4a" would point at the wrong transcript
# for .mp3/.wav/... inputs. A leading dot alone is not treated as an extension.
filename="${input_file##*/}"
case "$filename" in
  ?*.*) filename="${filename%.*}" ;;
esac
transcript_file="$TRANSCRIPT_DIR/$filename.txt"

# Check if transcript already exists
if [ -f "$transcript_file" ] && [ -z "$force_flag" ]; then
  echo "Transcript already exists: $transcript_file (use -f to overwrite)"
  exit 0
fi

echo "Processing file: $input_file"
echo "Transcribing audio..."

# Activate the virtual environment; remember whether it actually happened so
# that we only call `deactivate` when that function was really defined.
venv_active=""
if [ -f "vibenv/bin/activate" ] && source vibenv/bin/activate; then
  venv_active="yes"
fi

# Get the duration of the audio file in seconds using ffprobe
duration=$(ffprobe -v error -show_entries format=duration \
  -of default=noprint_wrappers=1:nokey=1 "$input_file")

# Build the whisper command line as an array so every value stays one word.
whisper_args=("$input_file")
if [ -n "$WHISPER_MODEL" ]; then
  whisper_args+=(--model "$WHISPER_MODEL")
fi
whisper_args+=(--output_dir "$TRANSCRIPT_DIR")

# Files longer than 21 minutes get every output format; shorter ones (and
# files whose duration could not be determined) get txt only.
all_formats=""
numeric_re='^[0-9]+(\.[0-9]+)?$'
if [[ "$duration" =~ $numeric_re ]]; then
  # Convert duration to minutes (floating point)
  duration_minutes=$(echo "$duration / 60" | bc -l)
  if (( $(echo "$duration_minutes > 21" | bc -l) )); then
    all_formats="yes"
  fi
else
  echo "Warning: could not determine duration of $input_file; producing txt only" >&2
fi
if [ -z "$all_formats" ]; then
  whisper_args+=(--output_format txt)
fi

whisper "${whisper_args[@]}"
whisper_status=$?

# Deactivate the virtual environment
[ -n "$venv_active" ] && deactivate

# Do not claim success unless whisper succeeded and the transcript exists.
if [ "$whisper_status" -ne 0 ]; then
  echo "Error: whisper failed with exit code $whisper_status" >&2
  exit "$whisper_status"
fi
if [ ! -f "$transcript_file" ]; then
  echo "Error: whisper did not produce $transcript_file" >&2
  exit 1
fi

echo "Transcription saved to: $transcript_file"
echo "----------------------------------------"