Add audio resampling utility and scipy dependency

- Created resample_audio.py utility script - Automatically reads target sample rate from config.json - Resamples all WAV files in sounds directory - Creates .backup files before modifying originals - Handles both mono and stereo audio - Uses scipy.signal.resample for high-quality resampling - Added scipy>=1.7.0 dependency to pyproject.toml - Updated Makefile sync command to include scipy - Updated README.md with sample rate troubleshooting section - Updated config example in README to show 48kHz default - Added beep_sound configuration to README system section This resolves sample rate mismatch errors when audio files don't match the configured rate in config.json. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com>
2025-10-27 13:02:39 +07:00
parent 52b8348a03
commit 30ac7e89e9
4 changed files with 190 additions and 2 deletions
--- a/2
+++ b/2
@@ -13,7 +13,7 @@ test:
 sync:
 	@echo "Installing/syncing dependencies..."
-	uv pip install flask numpy pyaudio RPi.GPIO waitress
+	uv pip install flask numpy pyaudio RPi.GPIO waitress scipy
 install: sync
 	@echo "Dependencies installed!"
--- a/README.md
+++ b/README.md
@@ -97,6 +97,7 @@ Web interface available at: `http://<raspberry-pi-ip>:8080`
  - pyaudio>=0.2.13
  - RPi.GPIO>=0.7.1
  - waitress>=2.1.0 (production WSGI server)
  - scipy>=1.7.0 (audio resampling utility)
 ## Installation
@@ -506,7 +507,7 @@ The `config.json` file contains all system settings:
    "chunk_size": 1024,                    // Audio buffer size
    "format": "paInt16",                   // Audio format (16-bit)
    "channels": 1,                         // Mono audio
-    "sample_rate": 44100,                  // 44.1kHz sample rate
+    "sample_rate": 48000,                  // 48kHz sample rate
    "max_record_seconds": 300              // Max recording time (5 minutes)
  },
  "paths": {
@@ -527,6 +528,8 @@ The `config.json` file contains all system settings:
  "system": {
    "active_greeting": "dialtone.wav",     // Default greeting
    "extra_button_sound": "button_sound.wav", // Default button sound
    "beep_sound": "beep.wav",              // Recording start beep
    "beep_enabled": true,                  // Enable beep before recording
    "greeting_delay_seconds": 0,           // Delay before greeting plays (0-10)
    "volume": 70                           // Default volume (0-100)
  }
@@ -597,6 +600,39 @@ Look for your HiFiBerry device and note its index number, then set it in `config
 4. Check IP address: `hostname -I`
 5. Try localhost: `http://127.0.0.1:8080`
 ### Audio Sample Rate Mismatch
 If you see errors like `Expression 'paInvalidSampleRate' failed` or warnings about sample rate mismatches:
 1. **Check your config.json sample rate** (default is 48000Hz):
   ```json
   "audio": {
     "sample_rate": 48000
   }
   ```
 2. **Resample your audio files** to match the configured rate:
   ```bash
   # Using the provided resampling script
   python3 resample_audio.py
   # Or manually with ffmpeg
   ffmpeg -i input.wav -ar 48000 output.wav
   ```
 3. **Delete default sounds** to regenerate at correct rate:
   ```bash
   rm rotary_phone_data/sounds/dialtone.wav
   rm rotary_phone_data/sounds/beep.wav
   # These will be regenerated at startup
   ```
 The `resample_audio.py` utility will:
 - Automatically detect the target sample rate from `config.json`
 - Create `.backup` files before modifying originals
 - Resample all WAV files in the sounds directory
 - Preserve stereo/mono and bit depth
 ### Configuration Errors
 If the script won't start:
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -10,6 +10,7 @@ dependencies = [
    "pyaudio>=0.2.13",
    "RPi.GPIO>=0.7.1",
    "waitress>=2.1.0",
    "scipy>=1.7.0",
 ]
 [project.scripts]
--- a/resample_audio.py
+++ b/resample_audio.py
@@ -0,0 +1,151 @@
 #!/usr/bin/env python3
 """
 Audio Resampling Utility for Wedding Phone
 Resamples all WAV files in sounds directory to match configured sample rate
 """
 import wave
 import numpy as np
 import os
 import json
 from scipy import signal
 def load_config():
    """Load sample rate from config.json"""
    config_path = 'config.json'
    if not os.path.exists(config_path):
        print("config.json not found, using 48000Hz as default")
        return 48000
    with open(config_path, 'r') as f:
        config = json.load(f)
        return config['audio']['sample_rate']
 def resample_wav(input_file, output_file, target_rate):
    """Resample a WAV file to target sample rate"""
    try:
        # Open source file
        with wave.open(input_file, 'rb') as wf:
            n_channels = wf.getnchannels()
            sampwidth = wf.getsampwidth()
            source_rate = wf.getframerate()
            n_frames = wf.getnframes()
            # Read audio data
            audio_data = wf.readframes(n_frames)
            # Convert to numpy array
            if sampwidth == 1:
                dtype = np.uint8
            elif sampwidth == 2:
                dtype = np.int16
            elif sampwidth == 4:
                dtype = np.int32
            else:
                print(f"Unsupported sample width: {sampwidth}")
                return False
            audio_array = np.frombuffer(audio_data, dtype=dtype)
            # Handle stereo
            if n_channels == 2:
                audio_array = audio_array.reshape(-1, 2)
            # Resample
            if source_rate != target_rate:
                print(f"  Resampling from {source_rate}Hz to {target_rate}Hz...")
                num_samples = int(len(audio_array) * target_rate / source_rate)
                if n_channels == 1:
                    resampled = signal.resample(audio_array, num_samples)
                else:
                    # Resample each channel separately
                    left = signal.resample(audio_array[:, 0], num_samples)
                    right = signal.resample(audio_array[:, 1], num_samples)
                    resampled = np.column_stack((left, right))
                # Convert back to original dtype
                resampled = np.clip(resampled, np.iinfo(dtype).min, np.iinfo(dtype).max)
                audio_array = resampled.astype(dtype)
            # Write output file
            with wave.open(output_file, 'wb') as wf_out:
                wf_out.setnchannels(n_channels)
                wf_out.setsampwidth(sampwidth)
                wf_out.setframerate(target_rate)
                wf_out.writeframes(audio_array.tobytes())
            return True
    except Exception as e:
        print(f"  Error: {e}")
        return False
 def main():
    """Main resampling function"""
    print("Wedding Phone Audio Resampler")
    print("=" * 50)
    # Load target sample rate
    target_rate = load_config()
    print(f"\nTarget sample rate: {target_rate}Hz")
    # Check sounds directory
    sounds_dir = './rotary_phone_data/sounds'
    if not os.path.exists(sounds_dir):
        print(f"\nSounds directory not found: {sounds_dir}")
        return
    # Get all WAV files
    wav_files = [f for f in os.listdir(sounds_dir) if f.endswith('.wav')]
    if not wav_files:
        print("\nNo WAV files found in sounds directory")
        return
    print(f"\nFound {len(wav_files)} WAV file(s)")
    print("-" * 50)
    # Process each file
    for filename in wav_files:
        input_path = os.path.join(sounds_dir, filename)
        print(f"\nProcessing: {filename}")
        # Check current sample rate
        try:
            with wave.open(input_path, 'rb') as wf:
                current_rate = wf.getframerate()
                print(f"  Current rate: {current_rate}Hz")
                if current_rate == target_rate:
                    print(f"  ✓ Already at {target_rate}Hz, skipping")
                    continue
        except Exception as e:
            print(f"  Error reading file: {e}")
            continue
        # Create backup
        backup_path = input_path + '.backup'
        if not os.path.exists(backup_path):
            os.rename(input_path, backup_path)
            print(f"  Backup created: {filename}.backup")
        else:
            input_path = backup_path
            print(f"  Using existing backup")
        # Resample
        output_path = os.path.join(sounds_dir, filename)
        if resample_wav(input_path, output_path, target_rate):
            print(f"  ✓ Successfully resampled to {target_rate}Hz")
        else:
            print(f"  ✗ Failed to resample, restoring backup")
            if os.path.exists(backup_path):
                os.rename(backup_path, output_path)
    print("\n" + "=" * 50)
    print("Resampling complete!")
    print("\nBackup files (.backup) have been created.")
    print("If everything works, you can delete them.")
 if __name__ == "__main__":
    main()