abogen
Advanced tools
@@ -5,5 +5,3 @@ from abogen.utils import get_version | ||
| PROGRAM_NAME = "abogen" | ||
| PROGRAM_DESCRIPTION = ( | ||
| "Generate audiobooks from EPUBs, PDFs and text with synchronized captions." | ||
| ) | ||
| PROGRAM_DESCRIPTION = "Generate audiobooks from EPUBs, PDFs, text and subtitles with synchronized captions." | ||
| GITHUB_URL = "https://github.com/denizsafak/abogen" | ||
@@ -48,2 +46,3 @@ VERSION = get_version() | ||
| "ass", | ||
| "vtt", | ||
| ] | ||
@@ -56,2 +55,5 @@ | ||
| "txt", | ||
| "srt", | ||
| "ass", | ||
| "vtt", | ||
| ] | ||
@@ -58,0 +60,0 @@ |
@@ -17,2 +17,4 @@ # Special thanks to @geo38 from Reddit, who provided this Dockerfile: | ||
| espeak-ng \ | ||
| libxcb-cursor0 \ | ||
| libgl1 \ | ||
| && apt-get clean \ | ||
@@ -19,0 +21,0 @@ && rm -rf /var/lib/apt/lists/* |
+18
-1
@@ -7,2 +7,19 @@ import os | ||
| # Fix PyTorch DLL loading issue ([WinError 1114]) on Windows before importing PyQt6 | ||
| if platform.system() == "Windows": | ||
| import ctypes | ||
| from importlib.util import find_spec | ||
| try: | ||
| if ( | ||
| (spec := find_spec("torch")) | ||
| and spec.origin | ||
| and os.path.exists( | ||
| dll_path := os.path.join(os.path.dirname(spec.origin), "lib", "c10.dll") | ||
| ) | ||
| ): | ||
| ctypes.CDLL(os.path.normpath(dll_path)) | ||
| except Exception: | ||
| pass | ||
| # Qt platform plugin detection (fixes #59) | ||
@@ -138,3 +155,3 @@ try: | ||
| try: | ||
| app.setDesktopFileName("abogen.desktop") | ||
| app.setDesktopFileName("abogen") | ||
| except AttributeError: | ||
@@ -141,0 +158,0 @@ pass |
@@ -90,3 +90,7 @@ # a simple window with a list of items in the queue, no checkboxes | ||
| for url in event.mimeData().urls(): | ||
| if url.isLocalFile() and url.toLocalFile().lower().endswith(".txt"): | ||
| file_path = url.toLocalFile().lower() | ||
| if url.isLocalFile() and ( | ||
| file_path.endswith(".txt") | ||
| or file_path.endswith((".srt", ".ass", ".vtt")) | ||
| ): | ||
| self.drag_overlay.resize(self.size()) | ||
@@ -102,3 +106,7 @@ self.drag_overlay.setVisible(True) | ||
| for url in event.mimeData().urls(): | ||
| if url.isLocalFile() and url.toLocalFile().lower().endswith(".txt"): | ||
| file_path = url.toLocalFile().lower() | ||
| if url.isLocalFile() and ( | ||
| file_path.endswith(".txt") | ||
| or file_path.endswith((".srt", ".ass", ".vtt")) | ||
| ): | ||
| event.acceptProposedAction() | ||
@@ -118,3 +126,7 @@ return | ||
| for url in event.mimeData().urls() | ||
| if url.isLocalFile() and url.toLocalFile().lower().endswith(".txt") | ||
| if url.isLocalFile() | ||
| and ( | ||
| url.toLocalFile().lower().endswith(".txt") | ||
| or url.toLocalFile().lower().endswith((".srt", ".ass", ".vtt")) | ||
| ) | ||
| ] | ||
@@ -157,3 +169,3 @@ if file_paths: | ||
| "<h2>How Queue Works?</h2>" | ||
| "You can add text files (.txt) directly using the '<b>Add files</b>' button below. " | ||
| "You can add text and subtitle files (.txt, .srt, .ass, .vtt) directly using the '<b>Add files</b>' button below. " | ||
| "To add PDF, EPUB or markdown files, use the input box in the main window and click the <b>'Add to Queue'</b> button. " | ||
@@ -170,3 +182,3 @@ "Each file in the queue keeps the configuration settings active when it was added. " | ||
| self.empty_overlay = QLabel( | ||
| "Drag and drop your text files here or use the 'Add files' button.", | ||
| "Drag and drop your text or subtitle files here or use the 'Add files' button.", | ||
| self.listwidget, | ||
@@ -298,3 +310,5 @@ ) | ||
| f"<b>Characters:</b> {getattr(item, 'total_char_count', '')}<br>" | ||
| f"<b>Replace Single Newlines:</b> {getattr(item, 'replace_single_newlines', False)}" | ||
| f"<b>Replace Single Newlines:</b> {getattr(item, 'replace_single_newlines', False)}<br>" | ||
| f"<b>Use Silent Gaps:</b> {getattr(item, 'use_silent_gaps', False)}<br>" | ||
| f"<b>Speed Method:</b> {getattr(item, 'subtitle_speed_method', 'tts')}" | ||
| ) | ||
@@ -412,2 +426,8 @@ # Add book handler options if present | ||
| ) | ||
| # use_silent_gaps | ||
| attrs["use_silent_gaps"] = getattr(parent, "use_silent_gaps", False) | ||
| # subtitle_speed_method | ||
| attrs["subtitle_speed_method"] = getattr( | ||
| parent, "subtitle_speed_method", "tts" | ||
| ) | ||
| # book handler options | ||
@@ -459,2 +479,5 @@ attrs["save_chapters_separately"] = getattr( | ||
| setattr(item, attr, value) | ||
| # Override subtitle_mode to "Disabled" for subtitle files | ||
| if file_path.lower().endswith((".srt", ".ass", ".vtt")): | ||
| item.subtitle_mode = "Disabled" | ||
| # Read file content and calculate total_char_count using calculate_text_length | ||
@@ -491,2 +514,6 @@ try: | ||
| == getattr(item, "replace_single_newlines", False) | ||
| and getattr(queued_item, "use_silent_gaps", False) | ||
| == getattr(item, "use_silent_gaps", False) | ||
| and getattr(queued_item, "subtitle_speed_method", "tts") | ||
| == getattr(item, "subtitle_speed_method", "tts") | ||
| and getattr(queued_item, "save_base_path", None) | ||
@@ -518,5 +545,8 @@ == getattr(item, "save_base_path", None) | ||
| # Only allow .txt files | ||
| # Allow .txt, .srt, .ass, and .vtt files | ||
| files, _ = QFileDialog.getOpenFileNames( | ||
| self, "Select .txt files", "", "Text Files (*.txt)" | ||
| self, | ||
| "Select text or subtitle files", | ||
| "", | ||
| "Supported Files (*.txt *.srt *.ass *.vtt)", | ||
| ) | ||
@@ -523,0 +553,0 @@ if not files: |
@@ -17,4 +17,6 @@ # represents a queued item - book, chapters, voice, etc. | ||
| replace_single_newlines: bool = False | ||
| use_silent_gaps: bool = False | ||
| subtitle_speed_method: str = "tts" | ||
| save_base_path: str = None | ||
| save_chapters_separately: bool = None | ||
| merge_chapters_at_end: bool = None |
+6
-0
@@ -260,2 +260,8 @@ import os | ||
| def get_gpu_acceleration(enabled): | ||
| """ | ||
| Check GPU acceleration availability. | ||
| Note: On Windows, torch DLLs must be pre-loaded in main.py before PyQt6 | ||
| to avoid DLL initialization errors. | ||
| """ | ||
| try: | ||
@@ -262,0 +268,0 @@ import torch |
+1
-1
@@ -1,1 +0,1 @@ | ||
| 1.2.1 | ||
| 1.2.2 |
@@ -281,3 +281,3 @@ import json | ||
| self._slider_style_applied = True | ||
| # Fix slider in Windows | ||
@@ -307,3 +307,3 @@ if platform.system() == "Windows": | ||
| parent_window = parent_window.parent() | ||
| if theme == "light": | ||
@@ -310,0 +310,0 @@ self.slider.setStyleSheet( |
+12
-1
@@ -1,2 +0,13 @@ | ||
| # 1.2.1 (pre-release) | ||
| # 1.2.2 | ||
| - **You can now voice your subtitle files!** Simply add `.srt`, `.ass` or `.vtt` files to generate timed audio. Alternatively, add a text file with timestamps in `HH:MM:SS` or `HH:MM:SS,ms` format to generate audio that matches the timestamps. See [here](https://github.com/denizsafak/abogen?tab=readme-ov-file#about-timestamp-based-text-files) for detailed instructions. | ||
| - New option: **"Use silent gaps between subtitles"**: Prevents unnecessary audio speed-up by letting speech continue into the silent gaps between subtitles. | ||
| - New option: **"Subtitle speed adjustment method"**: Choose how to speed up audio when needed: | ||
| - **TTS Regeneration (better quality):** Re-generates the audio at a faster speed for more natural sound. | ||
| - **FFmpeg Time-stretch (better speed):** Quickly speeds up the generated audio. | ||
| - Added support for embedding cover images in M4B files. Abogen now automatically extracts cover images from EPUB and PDF files. You can also manually specify a cover image using the `<<METADATA_COVER_PATH:path>>` tag in your text file. (To prevent MPV from showing the cover image, you can add `audio-display=no` to your MPV config file.) | ||
| - Fixed the `[WinError 1114] A dynamic link library (DLL) initialization routine failed` error on Windows by pre-loading PyTorch DLLs before initializing PyQt6, as reported in #98 by @ephr0n. | |
| - Potential fix for `CUDA GPU is not available` issue, by ensuring PyTorch is installed correctly with CUDA support on Windows using the installer script. | ||
| - Improvements in code and documentation. | ||
| # 1.2.1 | ||
| - Upgraded Abogen's interface from PyQt5 to PyQt6 for better compatibility and long-term support. | ||
@@ -3,0 +14,0 @@ - Added tooltip indicators in queue manager to display book handler options (`Save chapters separately` and `Merge chapters at the end`) for queued items. |
+43
-10
| Metadata-Version: 2.4 | ||
| Name: abogen | ||
| Version: 1.2.1 | ||
| Version: 1.2.2 | ||
| Summary: Generate audiobooks from EPUBs, PDFs and text with synchronized captions. | ||
@@ -49,3 +49,3 @@ Project-URL: Homepage, https://github.com/denizsafak/abogen | ||
| Abogen is a powerful text-to-speech conversion tool that makes it easy to turn ePub, PDF, text or markdown files into high-quality audio with matching subtitles in seconds. Use it for audiobooks, voiceovers for Instagram, YouTube, TikTok, or any project that needs natural-sounding text-to-speech, using [Kokoro-82M](https://huggingface.co/hexgrad/Kokoro-82M). | ||
| Abogen is a powerful text-to-speech conversion tool that makes it easy to turn ePub, PDF, text, markdown, or subtitle files into high-quality audio with matching subtitles in seconds. Use it for audiobooks, voiceovers for Instagram, YouTube, TikTok, or any project that needs natural-sounding text-to-speech, using [Kokoro-82M](https://huggingface.co/hexgrad/Kokoro-82M). | ||
@@ -83,3 +83,4 @@ <img title="Abogen Main" src='https://raw.githubusercontent.com/denizsafak/abogen/refs/heads/main/demo/abogen.png' width="380"> <img title="Abogen Processing" src='https://raw.githubusercontent.com/denizsafak/abogen/refs/heads/main/demo/abogen2.png' width="380"> | ||
| # For NVIDIA GPUs: | ||
| pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu128 | ||
| # We need to use an older version of PyTorch (2.8.0) until this issue is fixed: https://github.com/pytorch/pytorch/issues/166628 | ||
| pip install torch==2.8.0+cu128 torchvision==0.23.0+cu128 torchaudio==2.8.0 --index-url https://download.pytorch.org/whl/cu128 | ||
@@ -156,3 +157,3 @@ # For AMD GPUs: | ||
| ## `How to use?` | ||
| 1) Drag and drop any ePub, PDF, text or markdown file (or use the built-in text editor) | ||
| 1) Drag and drop any ePub, PDF, text, markdown, or subtitle file (or use the built-in text editor) | ||
| 2) Configure the settings: | ||
@@ -175,3 +176,3 @@ - Set speech speed | ||
| |---------|-------------| | ||
| | **Input Box** | Drag and drop `ePub`, `PDF`, `.TXT` or `.MD` files (or use built-in text editor) | | ||
| | **Input Box** | Drag and drop `ePub`, `PDF`, `.TXT`, `.MD`, `.SRT`, `.ASS` or `.VTT` files (or use built-in text editor) | | ||
| | **Queue options** | Add multiple files to a queue and process them in batch, with individual settings for each file. See [Queue mode](#queue-mode) for more details. | | ||
@@ -212,2 +213,4 @@ | **Speed** | Adjust speech rate from `0.1x` to `2.0x` | | ||
| | **Clear cache files** | Deletes cache files created during the conversion or preview. | | ||
| | **Use silent gaps between subtitles** | Prevents unnecessary audio speed-up by letting speech continue into the silent gaps between subtitle entries. In short, it ignores the end times in subtitle entries and uses the silent space until the beginning of the next subtitle entry. When disabled, it speeds up the audio to fit the exact time interval specified in the subtitle. (For subtitle files.) | | |
| | **Subtitle speed adjustment method** | Choose how to speed up audio when needed: `TTS Regeneration (better quality)` re-generates the audio at a faster speed, while `FFmpeg Time-stretch (better speed)` quickly speeds up the generated audio. (for subtitle files). | | ||
| | **Check for updates at startup** | Automatically checks for updates when the program starts. | | ||
@@ -272,4 +275,27 @@ | **Disable Kokoro's internet access** | Prevents Kokoro from downloading models or voices from HuggingFace Hub, useful for offline use. | | ||
| <<METADATA_GENRE:Audiobook>> | ||
| <<METADATA_COVER_PATH:path/to/cover.jpg>> | ||
| ``` | ||
| > Note: `METADATA_COVER_PATH` is used to embed a cover image into the generated M4B file. Abogen automatically extracts the cover from EPUB and PDF files and adds this tag for you. | ||
| ## `About Timestamp-based Text Files` | ||
| Similar to converting subtitle files to audio, Abogen can automatically detect text files that contain timestamps in `HH:MM:SS` or `HH:MM:SS,ms` format. When timestamps are found inside your text file, Abogen will ask if you want to use them for audio timing. This is useful for creating timed narrations, scripts, or transcripts where you need exact control over when each segment is spoken. | ||
| Format your text file like this: | ||
| ``` | ||
| 00:00:00 | ||
| This is the first segment of text. | ||
| 00:00:15 | ||
| This is the second segment, starting at 15 seconds. | ||
| 00:00:45 | ||
| And this is the third segment, starting at 45 seconds. | ||
| ``` | ||
| **Important notes:** | ||
| - Timestamps must be in `HH:MM:SS` or `HH:MM:SS,ms` format (e.g., `00:05:30` for 5 minutes 30 seconds, or `00:05:30,500` for 5 minutes 30.5 seconds) | ||
| - Milliseconds are optional and provide precision up to 1/1000th of a second | ||
| - Text before the first timestamp (if any) will automatically start at `00:00:00` | ||
| - When using timestamps, the subtitle generation mode setting is ignored | ||
| ## `Supported Languages` | ||
@@ -296,2 +322,3 @@ ``` | ||
| keep-open=yes | ||
| audio-display=no | ||
| # --- Subtitle --- | ||
@@ -392,3 +419,3 @@ sub-ass-override=no | ||
| > This message means PyTorch couldn't use your GPU. On Windows, Abogen supports NVIDIA GPUs with CUDA. AMD GPUs are supported only on Linux. Abogen will still run on the CPU, but it will be slower. | ||
| > This message means PyTorch could not use your GPU and has fallen back to the CPU. On Windows, Abogen only supports NVIDIA GPUs with CUDA. AMD GPUs are not supported on Windows (they are only supported on Linux with ROCm). Abogen will still work on the CPU, but processing will be slower compared to a supported GPU. | ||
| > | ||
@@ -398,5 +425,11 @@ > If you have a compatible NVIDIA GPU on Windows and still see this warning: | ||
| > ```bash | ||
| > python_embedded\python.exe -m pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu128 | ||
| > python_embedded\python.exe -m pip install --force-reinstall torch==2.8.0+cu128 torchvision==0.23.0+cu128 torchaudio==2.8.0 --index-url https://download.pytorch.org/whl/cu128 | ||
| > ``` | ||
| > If you have an AMD GPU, use Linux and follow the Linux/ROCm [instructions](#how-to-install-). If you want to keep running on CPU, no action is required, but performance will just be reduced. See [#32](https://github.com/denizsafak/abogen/issues/32) for more details. | ||
| > | ||
| > If this does not resolve the issue and you are using an older NVIDIA GPU that does not support CUDA 12.8, you can try installing an older version of PyTorch that supports your GPU. For example, for CUDA 12.6, run: | ||
| > ```bash | ||
| > python_embedded\python.exe -m pip install --force-reinstall torch==2.8.0+cu126 torchvision==0.23.0+cu126 torchaudio==2.8.0 --index-url https://download.pytorch.org/whl/cu126 | ||
| > ``` | ||
| > | ||
| > If you have an AMD GPU, you need to use Linux and follow the Linux/ROCm [instructions](#linux). If you want to keep running on the CPU, no action is required, but performance will be reduced. See [#32](https://github.com/denizsafak/abogen/issues/32) for more details. | |
@@ -431,3 +464,3 @@ </details> | ||
| > ```bash | ||
| > python_embedded\python.exe -m pip install torch==2.8.0 torchaudio==2.8.0 torchvision==0.23.0 | ||
| > python_embedded\python.exe -m pip install --force-reinstall torch==2.8.0+cu128 torchvision==0.23.0+cu128 torchaudio==2.8.0 --index-url https://download.pytorch.org/whl/cu128 | ||
| > ``` | ||
@@ -508,2 +541,2 @@ > If you installed Abogen using pip, open your terminal in the virtual environment and run: | ||
| > Tags: audiobook, kokoro, text-to-speech, TTS, audiobook generator, audiobooks, text to speech, audiobook maker, audiobook creator, audiobook generator, voice-synthesis, text to audio, text to audio converter, text to speech converter, text to speech generator, text to speech software, text to speech app, epub to audio, pdf to audio, markdown to audio, content-creation, media-generation | ||
| > Tags: audiobook, kokoro, text-to-speech, TTS, audiobook generator, audiobooks, text to speech, audiobook maker, audiobook creator, audiobook generator, voice-synthesis, text to audio, text to audio converter, text to speech converter, text to speech generator, text to speech software, text to speech app, epub to audio, pdf to audio, markdown to audio, subtitle to audio, srt to audio, ass to audio, vtt to audio, webvtt to audio, content-creation, media-generation |
+42
-9
@@ -12,3 +12,3 @@ # abogen <img width="40px" title="abogen icon" src="https://raw.githubusercontent.com/denizsafak/abogen/refs/heads/main/abogen/assets/icon.ico" align="right" style="padding-left: 10px; padding-top:5px;"> | ||
| Abogen is a powerful text-to-speech conversion tool that makes it easy to turn ePub, PDF, text or markdown files into high-quality audio with matching subtitles in seconds. Use it for audiobooks, voiceovers for Instagram, YouTube, TikTok, or any project that needs natural-sounding text-to-speech, using [Kokoro-82M](https://huggingface.co/hexgrad/Kokoro-82M). | ||
| Abogen is a powerful text-to-speech conversion tool that makes it easy to turn ePub, PDF, text, markdown, or subtitle files into high-quality audio with matching subtitles in seconds. Use it for audiobooks, voiceovers for Instagram, YouTube, TikTok, or any project that needs natural-sounding text-to-speech, using [Kokoro-82M](https://huggingface.co/hexgrad/Kokoro-82M). | ||
@@ -46,3 +46,4 @@ <img title="Abogen Main" src='https://raw.githubusercontent.com/denizsafak/abogen/refs/heads/main/demo/abogen.png' width="380"> <img title="Abogen Processing" src='https://raw.githubusercontent.com/denizsafak/abogen/refs/heads/main/demo/abogen2.png' width="380"> | ||
| # For NVIDIA GPUs: | ||
| pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu128 | ||
| # We need to use an older version of PyTorch (2.8.0) until this issue is fixed: https://github.com/pytorch/pytorch/issues/166628 | ||
| pip install torch==2.8.0+cu128 torchvision==0.23.0+cu128 torchaudio==2.8.0 --index-url https://download.pytorch.org/whl/cu128 | ||
@@ -119,3 +120,3 @@ # For AMD GPUs: | ||
| ## `How to use?` | ||
| 1) Drag and drop any ePub, PDF, text or markdown file (or use the built-in text editor) | ||
| 1) Drag and drop any ePub, PDF, text, markdown, or subtitle file (or use the built-in text editor) | ||
| 2) Configure the settings: | ||
@@ -138,3 +139,3 @@ - Set speech speed | ||
| |---------|-------------| | ||
| | **Input Box** | Drag and drop `ePub`, `PDF`, `.TXT` or `.MD` files (or use built-in text editor) | | ||
| | **Input Box** | Drag and drop `ePub`, `PDF`, `.TXT`, `.MD`, `.SRT`, `.ASS` or `.VTT` files (or use built-in text editor) | | ||
| | **Queue options** | Add multiple files to a queue and process them in batch, with individual settings for each file. See [Queue mode](#queue-mode) for more details. | | ||
@@ -175,2 +176,4 @@ | **Speed** | Adjust speech rate from `0.1x` to `2.0x` | | ||
| | **Clear cache files** | Deletes cache files created during the conversion or preview. | | ||
| | **Use silent gaps between subtitles** | Prevents unnecessary audio speed-up by letting speech continue into the silent gaps between subtitle entries. In short, it ignores the end times in subtitle entries and uses the silent space until the beginning of the next subtitle entry. When disabled, it speeds up the audio to fit the exact time interval specified in the subtitle. (For subtitle files.) | | |
| | **Subtitle speed adjustment method** | Choose how to speed up audio when needed: `TTS Regeneration (better quality)` re-generates the audio at a faster speed, while `FFmpeg Time-stretch (better speed)` quickly speeds up the generated audio. (for subtitle files). | | ||
| | **Check for updates at startup** | Automatically checks for updates when the program starts. | | ||
@@ -235,4 +238,27 @@ | **Disable Kokoro's internet access** | Prevents Kokoro from downloading models or voices from HuggingFace Hub, useful for offline use. | | ||
| <<METADATA_GENRE:Audiobook>> | ||
| <<METADATA_COVER_PATH:path/to/cover.jpg>> | ||
| ``` | ||
| > Note: `METADATA_COVER_PATH` is used to embed a cover image into the generated M4B file. Abogen automatically extracts the cover from EPUB and PDF files and adds this tag for you. | ||
| ## `About Timestamp-based Text Files` | ||
| Similar to converting subtitle files to audio, Abogen can automatically detect text files that contain timestamps in `HH:MM:SS` or `HH:MM:SS,ms` format. When timestamps are found inside your text file, Abogen will ask if you want to use them for audio timing. This is useful for creating timed narrations, scripts, or transcripts where you need exact control over when each segment is spoken. | ||
| Format your text file like this: | ||
| ``` | ||
| 00:00:00 | ||
| This is the first segment of text. | ||
| 00:00:15 | ||
| This is the second segment, starting at 15 seconds. | ||
| 00:00:45 | ||
| And this is the third segment, starting at 45 seconds. | ||
| ``` | ||
| **Important notes:** | ||
| - Timestamps must be in `HH:MM:SS` or `HH:MM:SS,ms` format (e.g., `00:05:30` for 5 minutes 30 seconds, or `00:05:30,500` for 5 minutes 30.5 seconds) | ||
| - Milliseconds are optional and provide precision up to 1/1000th of a second | ||
| - Text before the first timestamp (if any) will automatically start at `00:00:00` | ||
| - When using timestamps, the subtitle generation mode setting is ignored | ||
| ## `Supported Languages` | ||
@@ -259,2 +285,3 @@ ``` | ||
| keep-open=yes | ||
| audio-display=no | ||
| # --- Subtitle --- | ||
@@ -355,3 +382,3 @@ sub-ass-override=no | ||
| > This message means PyTorch couldn't use your GPU. On Windows, Abogen supports NVIDIA GPUs with CUDA. AMD GPUs are supported only on Linux. Abogen will still run on the CPU, but it will be slower. | ||
| > This message means PyTorch could not use your GPU and has fallen back to the CPU. On Windows, Abogen only supports NVIDIA GPUs with CUDA. AMD GPUs are not supported on Windows (they are only supported on Linux with ROCm). Abogen will still work on the CPU, but processing will be slower compared to a supported GPU. | ||
| > | ||
@@ -361,5 +388,11 @@ > If you have a compatible NVIDIA GPU on Windows and still see this warning: | ||
| > ```bash | ||
| > python_embedded\python.exe -m pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu128 | ||
| > python_embedded\python.exe -m pip install --force-reinstall torch==2.8.0+cu128 torchvision==0.23.0+cu128 torchaudio==2.8.0 --index-url https://download.pytorch.org/whl/cu128 | ||
| > ``` | ||
| > If you have an AMD GPU, use Linux and follow the Linux/ROCm [instructions](#how-to-install-). If you want to keep running on CPU, no action is required, but performance will just be reduced. See [#32](https://github.com/denizsafak/abogen/issues/32) for more details. | ||
| > | ||
| > If this does not resolve the issue and you are using an older NVIDIA GPU that does not support CUDA 12.8, you can try installing an older version of PyTorch that supports your GPU. For example, for CUDA 12.6, run: | ||
| > ```bash | ||
| > python_embedded\python.exe -m pip install --force-reinstall torch==2.8.0+cu126 torchvision==0.23.0+cu126 torchaudio==2.8.0 --index-url https://download.pytorch.org/whl/cu126 | ||
| > ``` | ||
| > | ||
| > If you have an AMD GPU, you need to use Linux and follow the Linux/ROCm [instructions](#linux). If you want to keep running on the CPU, no action is required, but performance will be reduced. See [#32](https://github.com/denizsafak/abogen/issues/32) for more details. | |
@@ -394,3 +427,3 @@ </details> | ||
| > ```bash | ||
| > python_embedded\python.exe -m pip install torch==2.8.0 torchaudio==2.8.0 torchvision==0.23.0 | ||
| > python_embedded\python.exe -m pip install --force-reinstall torch==2.8.0+cu128 torchvision==0.23.0+cu128 torchaudio==2.8.0 --index-url https://download.pytorch.org/whl/cu128 | ||
| > ``` | ||
@@ -471,2 +504,2 @@ > If you installed Abogen using pip, open your terminal in the virtual environment and run: | ||
| > Tags: audiobook, kokoro, text-to-speech, TTS, audiobook generator, audiobooks, text to speech, audiobook maker, audiobook creator, audiobook generator, voice-synthesis, text to audio, text to audio converter, text to speech converter, text to speech generator, text to speech software, text to speech app, epub to audio, pdf to audio, markdown to audio, content-creation, media-generation | ||
| > Tags: audiobook, kokoro, text-to-speech, TTS, audiobook generator, audiobooks, text to speech, audiobook maker, audiobook creator, audiobook generator, voice-synthesis, text to audio, text to audio converter, text to speech converter, text to speech generator, text to speech software, text to speech app, epub to audio, pdf to audio, markdown to audio, subtitle to audio, srt to audio, ass to audio, vtt to audio, webvtt to audio, content-creation, media-generation |
Sorry, the diff of this file is too big to display
Sorry, the diff of this file is too big to display
Sorry, the diff of this file is too big to display
Alert delta unavailable
Currently unable to show alert delta for PyPI packages.
785478
7.77%10882
10.63%