yl4579 · netlinux-ai · May 9, 2026
diff --git a/meldataset.py b/meldataset.py
@@ -18,7 +18,8 @@
 logger = logging.getLogger(__name__)
 logger.setLevel(logging.DEBUG)
 
-import pandas as pd
+# pandas is no longer required: its only use was the speaker_id filter in
+# __getitem__, which is now a plain list comprehension over self.data_list.
 
 _pad = "$"
 _punctuation = ';:,.!?¡¿—…"«»“” '
@@ -84,7 +85,6 @@ def __init__(self,
         self.text_cleaner = TextCleaner()
         self.sr = sr
 
-        self.df = pd.DataFrame(self.data_list)
 
         self.to_melspec = torchaudio.transforms.MelSpectrogram(**MEL_PARAMS)
 
@@ -116,7 +116,8 @@ def __getitem__(self, idx):
         acoustic_feature = acoustic_feature[:, :(length_feature - length_feature % 2)]
 
         # get reference sample
-        ref_data = (self.df[self.df[2] == str(speaker_id)]).sample(n=1).iloc[0].tolist()
+        matching = [r for r in self.data_list if r[2] == str(speaker_id)]
+        ref_data = random.choice(matching)
         ref_mel_tensor, ref_label = self._load_data(ref_data[:3])
 
         # get OOD text