musikalkemist · dhunstack · Dec 22, 2024
diff --git a/.gitignore b/.gitignore
@@ -127,3 +127,6 @@ dmypy.json
 
 # Pyre type checker
 .pyre/
+
+# json files
+*.json
diff --git a/12- Music genre classification: Preparing the dataset/code/extract_data.py b/12- Music genre classification: Preparing the dataset/code/extract_data.py
@@ -3,7 +3,7 @@
 import math
 import librosa
 
-DATASET_PATH = "path/to/marsyas/dataset"
+DATASET_PATH = "path/to/gtzan/dataset"  # can be downloaded from 'https://huggingface.co/datasets/marsyas/gtzan/resolve/main/data/genres.tar.gz'
 JSON_PATH = "data_10.json"
 SAMPLE_RATE = 22050
 TRACK_DURATION = 30 # measured in seconds
@@ -48,7 +48,10 @@ def save_mfcc(dataset_path, json_path, num_mfcc=13, n_fft=2048, hop_length=512,
 
 		# load audio file
                 file_path = os.path.join(dirpath, f)
-                signal, sample_rate = librosa.load(file_path, sr=SAMPLE_RATE)
+                try:
+                    signal, sample_rate = librosa.load(file_path, sr=SAMPLE_RATE)
+                except Exception:
+                    continue
 
                 # process all segments of audio file
                 for d in range(num_segments):
@@ -58,7 +61,7 @@ def save_mfcc(dataset_path, json_path, num_mfcc=13, n_fft=2048, hop_length=512,
                     finish = start + samples_per_segment
 
                     # extract mfcc
-                    mfcc = librosa.feature.mfcc(signal[start:finish], sample_rate, n_mfcc=num_mfcc, n_fft=n_fft, hop_length=hop_length)
+                    mfcc = librosa.feature.mfcc(y=signal[start:finish], sr=sample_rate, n_mfcc=num_mfcc, n_fft=n_fft, hop_length=hop_length)
                     mfcc = mfcc.T
 
                     # store only mfcc feature with expected number of vectors
-Original file line number
+Diff line change
@@ Expand Up / @@ -127,3 +127,6 @@ dmypy.json @@
     # Pyre type checker
     .pyre/
+    # json files
+    *.json