Spaces:
Running
on
Zero
Running
on
Zero
Commit
·
96d8d72
1
Parent(s):
0d19baf
Fix torchcodec error: Replace torchaudio.load with librosa.load for better stability
Browse files
- core/scoring_engine.py +3 -5
- requirements.txt +0 -1
core/scoring_engine.py
CHANGED
|
@@ -5,7 +5,6 @@
|
|
| 5 |
# =======================================
|
| 6 |
|
| 7 |
import torch
|
| 8 |
-
import torchaudio
|
| 9 |
import numpy as np
|
| 10 |
import librosa
|
| 11 |
from transformers import (
|
|
@@ -145,11 +144,10 @@ class AdvancedVocalScoringSystem:
|
|
| 145 |
Returns:
|
| 146 |
ScoreResult dengan semua metrik
|
| 147 |
"""
|
| 148 |
-
# Load audio
|
| 149 |
-
|
| 150 |
|
| 151 |
-
#
|
| 152 |
-
audio_np = waveform.numpy()
|
| 153 |
if audio_np.ndim > 1:
|
| 154 |
audio_np = audio_np[0]
|
| 155 |
|
|
|
|
| 5 |
# =======================================
|
| 6 |
|
| 7 |
import torch
|
|
|
|
| 8 |
import numpy as np
|
| 9 |
import librosa
|
| 10 |
from transformers import (
|
|
|
|
| 144 |
Returns:
|
| 145 |
ScoreResult dengan semua metrik
|
| 146 |
"""
|
| 147 |
+
# Load audio using librosa (more stable than torchaudio)
|
| 148 |
+
audio_np, sr = librosa.load(audio_path, sr=16000) # 16kHz for Whisper
|
| 149 |
|
| 150 |
+
# Ensure mono
|
|
|
|
| 151 |
if audio_np.ndim > 1:
|
| 152 |
audio_np = audio_np[0]
|
| 153 |
|
requirements.txt
CHANGED
|
@@ -3,7 +3,6 @@
|
|
| 3 |
|
| 4 |
# Core ML Libraries
|
| 5 |
torch>=2.0.0
|
| 6 |
-
torchaudio>=2.0.0
|
| 7 |
transformers>=4.35.0
|
| 8 |
|
| 9 |
# Audio Processing
|
|
|
|
| 3 |
|
| 4 |
# Core ML Libraries
|
| 5 |
torch>=2.0.0
|
|
|
|
| 6 |
transformers>=4.35.0
|
| 7 |
|
| 8 |
# Audio Processing
|