fariedalfarizi committed on
Commit
96d8d72
·
1 Parent(s): 0d19baf

Fix torchcodec error: Replace torchaudio.load with librosa.load for better stability

Browse files
Files changed (2) hide show
  1. core/scoring_engine.py +3 -5
  2. requirements.txt +0 -1
core/scoring_engine.py CHANGED
@@ -5,7 +5,6 @@
5
  # =======================================
6
 
7
  import torch
8
- import torchaudio
9
  import numpy as np
10
  import librosa
11
  from transformers import (
@@ -145,11 +144,10 @@ class AdvancedVocalScoringSystem:
145
  Returns:
146
  ScoreResult dengan semua metrik
147
  """
148
- # Load audio
149
- waveform, sr = torchaudio.load(audio_path)
150
 
151
- # Convert to numpy for librosa
152
- audio_np = waveform.numpy()
153
  if audio_np.ndim > 1:
154
  audio_np = audio_np[0]
155
 
 
5
  # =======================================
6
 
7
  import torch
 
8
  import numpy as np
9
  import librosa
10
  from transformers import (
 
144
  Returns:
145
  ScoreResult dengan semua metrik
146
  """
147
+ # Load audio using librosa (more stable than torchaudio)
148
+ audio_np, sr = librosa.load(audio_path, sr=16000) # 16kHz for Whisper
149
 
150
+ # Ensure mono
 
151
  if audio_np.ndim > 1:
152
  audio_np = audio_np[0]
153
 
requirements.txt CHANGED
@@ -3,7 +3,6 @@
3
 
4
  # Core ML Libraries
5
  torch>=2.0.0
6
- torchaudio>=2.0.0
7
  transformers>=4.35.0
8
 
9
  # Audio Processing
 
3
 
4
  # Core ML Libraries
5
  torch>=2.0.0
 
6
  transformers>=4.35.0
7
 
8
  # Audio Processing