feat(inference): add `_parse_list_file` to handle default values for `ref_audio_path` and `ref_text`

- Parse the first line of `asr_opt/slicer_opt.list` (under the experiment directory) to supply default `ref_audio_path` and `ref_text` values when either one is not provided in the config.

Files changed (1) hide show

training_pipeline/stages/inference.py CHANGED Viewed

@@ -165,10 +165,38 @@ class InferenceStage(BaseStage):
         sovits_paths = self.config.sovits_paths()
         return len(gpt_paths) > 0 and len(sovits_paths) > 0
     def run(self) -> Generator[Dict[str, Any], None, None]:
         self._status = StageStatus.RUNNING
         cfg = self.config
         # 确保输出目录存在
         os.makedirs(cfg.output_dir, exist_ok=True)

         sovits_paths = self.config.sovits_paths()
         return len(gpt_paths) > 0 and len(sovits_paths) > 0
+    def _parse_list_file(self) -> tuple[str, str]:
+        """Read default reference audio/text from the first line of the ASR list file.
+
+        The file is looked up at ``<exp_dir>/asr_opt/slicer_opt.list``. Each line
+        is expected to have the form
+        ``{audio path}|{folder name}|{language}|{recognized text}``.
+
+        Returns:
+            A ``(ref_audio_path, ref_text)`` tuple taken from the first line, or
+            ``("", "")`` when the file is missing, unreadable, empty, or its
+            first line has fewer than four ``|``-separated fields.
+        """
+        list_path = os.path.join(self.config.exp_dir, 'asr_opt', 'slicer_opt.list')
+        try:
+            # utf-8-sig drops a leading BOM, which would otherwise end up
+            # glued to the front of the audio path on the first line.
+            with open(list_path, 'r', encoding='utf-8-sig') as f:
+                first_line = f.readline().strip()
+        except (OSError, UnicodeDecodeError):
+            # Best-effort lookup: a missing or unreadable file yields no defaults.
+            return "", ""
+        # Split at most three times so a '|' inside the recognized text is
+        # kept as part of the text instead of truncating it.
+        parts = first_line.split('|', 3)
+        if len(parts) < 4:
+            # Also covers an empty first line, which splits into a single field.
+            return "", ""
+        return parts[0], parts[3]
     def run(self) -> Generator[Dict[str, Any], None, None]:
         self._status = StageStatus.RUNNING
         cfg = self.config
+        # 如果 ref_text 或 ref_audio_path 为空，从 .list 文件解析默认值
+        if not cfg.ref_text or not cfg.ref_audio_path:
+            parsed_audio, parsed_text = self._parse_list_file()
+            cfg.ref_audio_path = parsed_audio
+            cfg.ref_text = parsed_text
         # 确保输出目录存在
         os.makedirs(cfg.output_dir, exist_ok=True)