ItsukiNakano
Eternal Poster
Mga master baka po may alam pano pwede gawin dito, pag uupload sana ng audio files para itrain sa deeplearning. Kaso yung problem napaka rami at napaka laki, hindi kinakaya ng ram ng google colab.
baka po may makatulong
Code:
def load_audio_data(dataset_dir):
audio_data = []
labels = []
supported_extensions = ['mp3', 'wav', 'm4a']
print(f"Loading data from: {dataset_dir}")
def process_directory(directory, label):
for root, _, files in os.walk(directory):
for audio_file in files:
if audio_file.split('.')[-1].lower() in supported_extensions:
audio_path = os.path.join(root, audio_file)
try:
audio, sr = librosa.load(audio_path, sr=None, duration=5)
audio_data.append((audio, sr))
labels.append(label)
print(f"Loaded {audio_path}")
except Exception as e:
print(f"Error loading file {audio_path}: {e}")
for label in tqdm(os.listdir(dataset_dir), desc="Loading labels"):
label_dir = os.path.join(dataset_dir, label)
if os.path.isdir(label_dir):
print(f"Entering directory: {label_dir} (Label: {label})")
process_directory(label_dir, label)
total_data = len(audio_data)
print(f"Total Data Samples: {total_data}")
if audio_data:
print(f"First audio file data: {audio_data[0]}")
print(f"Label of the first audio file: {labels[0]}")
unique_labels = set(labels)
print(f"Unique labels found: {unique_labels}")
for label in unique_labels:
print(f"Number of files for {label}: {labels.count(label)}")
return audio_data, labels
baka po may makatulong