timerring · timerring · Dec 12, 2024 · Dec 12, 2024
diff --git a/README.md b/README.md
@@ -86,7 +86,7 @@ graph TD
 
 ### Installation(有 GPU 版本)
 
-> 是否有 GPU 以 `nvidia-smi` 显示驱动以及 `CUDA` 检查通过为准。如果未配置显卡驱动或未安装 `CUDA`，即使有 GPU 也无法使用。
+> 是否有 GPU 以 `nvidia-smi` 显示 nvidia GPU 驱动以及 `nvcc -V` 显示 `CUDA` 版本号为准。如果未配置显卡驱动或未安装 `CUDA`，即使有 GPU 也无法使用，而会使用 CPU 推理（不推荐，可根据自身硬件条件判断是否尝试 CPU 推理）。
 
 > [!TIP]
 > 如果你是 windows 用户，请不要使用命令提示符（Command Prompt）或 Windows PowerShell，请使用 [PowerShell](https://learn.microsoft.com/en-us/powershell/scripting/install/installing-powershell-on-windows?view=powershell-7.4) 或 WSL 或 **Git Bash**(推荐)。
@@ -178,7 +178,7 @@ logs # 日志文件夹
 ### Installation(无 GPU 版本)
 无 GPU 版本过程基本同上，可以跳过步骤 3，需要注意在执行步骤 5 **之前**完成以下设置将确保完全用 CPU 渲染视频弹幕。
 
-1. 请将 `src/allconfig.py` 文件中的 `GPU_EXIST` 参数设置为 `False`
+1. 请将 `src/allconfig.py` 文件中的 `GPU_EXIST` 参数设置为 `False`。（若不置为 `False`，则会使用 CPU 推理，不推荐，可自行根据硬件条件进行尝试。）
 2. 将 `MODEL_TYPE` 调整为 `merge` 或者 `append`。
 
 > [!TIP]

diff --git a/docs/installation.md b/docs/installation.md
@@ -14,7 +14,7 @@
 
 ## Installation(有 GPU 版本)
 
-> 是否有 GPU 以 `nvidia-smi` 显示驱动以及 `CUDA` 检查通过为准。如果未配置显卡驱动或未安装 `CUDA`，即使有 GPU 也无法使用。
+> 是否有 GPU 以 `nvidia-smi` 显示 nvidia GPU 驱动以及 `nvcc -V` 显示 `CUDA` 版本号为准。如果未配置显卡驱动或未安装 `CUDA`，即使有 GPU 也无法使用，而会使用 CPU 推理（不推荐，可根据自身硬件条件判断是否尝试 CPU 推理）。
 
 > [!TIP]
 > 如果你是 windows 用户，请不要使用命令提示符（Command Prompt）或 Windows PowerShell，请使用 [PowerShell](https://learn.microsoft.com/en-us/powershell/scripting/install/installing-powershell-on-windows?view=powershell-7.4) 或 WSL 或 **Git Bash**(推荐)。
@@ -107,5 +107,5 @@ logs # 日志文件夹
 ## Installation(无 GPU 版本)
 无 GPU 版本过程基本同上，可以跳过步骤 3，需要注意在执行步骤 5 **之前**完成以下设置将确保完全用 CPU 渲染视频弹幕。
 
-1. 请将 `src/allconfig.py` 文件中的 `GPU_EXIST` 参数设置为 `False`
+1. 请将 `src/allconfig.py` 文件中的 `GPU_EXIST` 参数设置为 `False`。（若不置为 `False`，则会使用 CPU 推理，不推荐，可自行根据硬件条件进行尝试。）
 2. 将 `MODEL_TYPE` 调整为 `merge` 或者 `append`。
diff --git a/src/subtitle/config.py b/src/subtitle/config.py
@@ -43,10 +43,6 @@ def init_settings_config():
 
 init_settings_config()
 
-ffmpeg_bin = os.path.join('linux_x64', 'ffmpeg')
-FFMPEG_PATH = os.path.join(BASE_DIR, '', ffmpeg_bin)
-os.chmod(FFMPEG_PATH, stat.S_IRWXU+stat.S_IRWXG+stat.S_IRWXO)
-
 SILENCE_THRESH = -70           # silence below -70dBFS is considered silence
 MIN_SILENCE_LEN = 700          # if silence is longer than 700ms, split
 LENGTH_LIMIT = 60 * 1000       # split into segments no longer than 1 minute

diff --git a/src/subtitle/generate.py b/src/subtitle/generate.py
@@ -111,7 +111,7 @@ def __call__(self, region):
             start = max(0, start - self.include_before)
             end += self.include_after
             temp = tempfile.NamedTemporaryFile(suffix='.flac', delete=False)
-            command = [config.FFMPEG_PATH, "-ss", str(start), "-t", str(end - start),
+            command = ["ffmpeg", "-ss", str(start), "-t", str(end - start),
                        "-y", "-i", self.source_path,
                        "-loglevel", "error", temp.name]
             use_shell = True if os.name == "nt" else False
@@ -170,10 +170,7 @@ def extract_audio(self, rate=16000):
         if not os.path.isfile(self.filename):
             print("The given file does not exist: {}".format(self.filename))
             raise Exception("Invalid filepath: {}".format(self.filename))
-        if not self.which(config.FFMPEG_PATH):
-            print("ffmpeg: Executable not found on machine.")
-            raise Exception("Dependency not found: ffmpeg")
-        command = [config.FFMPEG_PATH, "-y", "-i", self.filename,
+        command = ["ffmpeg", "-y", "-i", self.filename,
                    "-ac", '1', "-ar", str(rate),
                    "-loglevel", "error", temp.name]
         use_shell = True if os.name == "nt" else False
@@ -252,7 +249,7 @@ def run(self, output=None):
         """
         audio_filename, audio_rate = self.extract_audio()
         regions = self.find_speech_regions(audio_filename)
-        pool = multiprocessing.Pool(10)
+        pool = multiprocessing.Pool(12)
         converter = FLACConverter(source_path=audio_filename)
         recognizer = AudioRecogniser(language=self.language)
         transcripts = []

diff --git a/src/subtitle/linux_x64/ffmpeg b/src/subtitle/linux_x64/ffmpeg