From 0e5aca7138d12668b84a7c3f50a2ec540a21bb03 Mon Sep 17 00:00:00 2001
From: Azis <azuolas.krusna@yahoo.com>
Date: Thu, 19 Feb 2026 23:24:54 +0100
Subject: [PATCH 1/2] Add support for epub

---
 AGENTS.md    |   2 +
 README.md    |   9 +-
 ROADMAP.md   |  16 +--
 reed.py      | 225 +++++++++++++++++++++++++++++++--
 test_reed.py | 341 ++++++++++++++++++++++++++++++++++++++++++++++++++-
 5 files changed, 570 insertions(+), 23 deletions(-)

diff --git a/AGENTS.md b/AGENTS.md
index 88d6f89..3b6621a 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -10,6 +10,7 @@ This is `reed`, a convenient CLI for text-to-speech using piper-tts.
 - Python 3.14+
 - piper-tts (dependency in pyproject.toml, run via `uv run reed`)
 - pypdf (PDF text extraction)
+- stdlib `zipfile` + `xml.etree` (EPUB reading — no external dependency)
 - macOS `afplay` for audio playback, `pbpaste` for clipboard access
 - Linux: `paplay`/`aplay`/`ffplay` for audio, `wl-paste`/`xclip`/`xsel` for clipboard
 - Windows: `powershell`/`ffplay` for audio, `powershell Get-Clipboard` for clipboard
@@ -24,6 +25,7 @@ This is `reed`, a convenient CLI for text-to-speech using piper-tts.
 
 - Run: `reed 'text'`
 - Read PDF: `reed -f doc.pdf` or `reed -f doc.pdf --pages 1,3-5`
+- Read EPUB: `reed -f book.epub` or `reed -f book.epub --pages 1,3-5`
 - Interactive mode: `reed` (launches automatically when no input provided)
 - List voices: `reed voices`
 - Download voice: `reed download en_US-amy-medium`
diff --git a/README.md b/README.md
index 3c70969..2b90da0 100644
--- a/README.md
+++ b/README.md
@@ -6,6 +6,7 @@ A CLI that reads text aloud using [piper-tts](https://github.com/rhasspy/piper).
 
 - **Multiple input sources** — text argument, file (`-f`), clipboard (`-c`), or stdin
 - **PDF support** — read full PDFs or selected pages with `--pages`
+- **EPUB support** — read EPUB e-books, select chapters with `--pages`
 - **Pipe-friendly** — reads from stdin, works anywhere in a shell pipeline
 - **Interactive mode** — conversational TTS with `/replay`, `/help`, `/clear`, tab completion, and history
 - **Adjustable speech** — control speed (`-s`), volume (`-v`), and sentence silence (`--silence`)
@@ -79,6 +80,12 @@ reed -f book.pdf
 # Read selected pages from a PDF (1-based)
 reed -f book.pdf --pages 1,3-5
 
+# Read an EPUB e-book
+reed -f book.epub
+
+# Read selected chapters from an EPUB
+reed -f book.epub --pages 1,3-5
+
 # Read from clipboard
 reed -c
 
@@ -183,7 +190,7 @@ All voice models are hosted on Hugging Face: [https://huggingface.co/rhasspy/pip
 | Flag | Description | Default |
 |------|-------------|---------|
 | `-f`, `--file` | Read text from a file | — |
-| `--pages` | PDF pages to read (1-based), e.g. `1,3-5` | — |
+| `--pages` | PDF pages or EPUB chapters to read (1-based), e.g. `1,3-5` | — |
 | `-c`, `--clipboard` | Read text from clipboard | — |
 | `-m`, `--model` | Voice name or path to voice model | `en_US-kristin-medium` |
 | `-s`, `--speed` | Speech speed (lower = slower) | `1.0` |
diff --git a/ROADMAP.md b/ROADMAP.md
index 52a24d4..38aebfc 100644
--- a/ROADMAP.md
+++ b/ROADMAP.md
@@ -37,15 +37,17 @@ Currently `speak_text()` blocks on `subprocess.run()` for playback. All interact
 
 ## Phase 2 — File Format Support
 
-### 2.1 EPUB File Reading
+### 2.1 EPUB File Reading ✅
 **Effort:** Medium · **Priority:** High
 **Dependencies:** None
+**Status:** Done
 
-- Add `ebooklib` (or `epub2txt`) as an optional dependency in `pyproject.toml`
-- Create `_iter_epub_chapters()` yielding `(chapter_number, total_chapters, text)` — mirror the existing `_iter_pdf_pages()` pattern
-- Wire into `get_text()` / `main()` with `.epub` suffix detection alongside the existing `.pdf` path
-- Support `--pages` reinterpreted as `--chapters` for EPUBs (or add a `--chapters` flag)
-- Strip HTML tags from EPUB XHTML content (use `html.parser` from stdlib)
+- ✅ Create `_iter_epub_chapters()` yielding `(chapter_number, total_chapters, text)` — mirrors `_iter_pdf_pages()`
+- ✅ Wire into `main()` with `.epub` suffix detection alongside the existing `.pdf` path
+- ✅ `--pages` flag selects chapters for EPUBs
+- ✅ Strip HTML tags from EPUB XHTML content (stdlib `html.parser`)
+- ✅ Navigation documents filtered out via the manifest `nav` property
+- ✅ Zero external dependencies — uses stdlib `zipfile` + `xml.etree.ElementTree`
 
 ---
 
@@ -119,7 +121,7 @@ No Lithuanian piper voice model exists yet — this requires training one from s
 | 1.1 | Command autocomplete | Small | — |
 | 1.2 | Non-blocking playback controller | Medium | — |
 | 1.3 | Pause / play / stop commands | Small | 1.2 |
-| 2.1 | EPUB reading | Medium | — |
+| 2.1 | ✅ EPUB reading | Medium | — |
 | 3.1 | Save & resume position | Medium | 1.2, 2.1 |
 | 4.1 | Streaming audio | Large | 1.2 |
 | 5.1 | Lithuanian voice model training | Large | — |
diff --git a/reed.py b/reed.py
index 40c4d86..1f03aad 100755
--- a/reed.py
+++ b/reed.py
@@ -10,9 +10,12 @@
 import tempfile
 import time
 import urllib.request
+import xml.etree.ElementTree as ET
+import zipfile
+from html.parser import HTMLParser
 from dataclasses import dataclass
 from pathlib import Path
-from typing import TYPE_CHECKING, Callable, Iterator, Optional, TextIO
+from typing import TYPE_CHECKING, Callable, Iterator, Optional, Sequence, TextIO
 
 if TYPE_CHECKING:
     from prompt_toolkit import PromptSession
@@ -20,7 +23,7 @@
 try:
     from pypdf import PdfReader
 except ImportError:  # pragma: no cover - validated in runtime error path
-    PdfReader = None
+    PdfReader = None  # type: ignore[assignment,misc]
 
 from rich.console import Console
 from rich.markup import escape
@@ -164,7 +167,7 @@ def get_text(
     if args.file:
         file_path = Path(args.file)
         if args.pages:
-            raise ReedError("--pages can only be used with PDF files")
+            raise ReedError("--pages can only be used with PDF or EPUB files")
         return file_path.read_text()
 
     if not stdin.isatty():
@@ -176,8 +179,10 @@ def get_text(
     raise ReedError("No input provided. Use --help for usage.")
 
 
-def _parse_pdf_pages(page_selection: str, total_pages: int) -> list[int]:
-    selection = page_selection.strip()
+def _parse_range_selection(
+    selection_str: str, total: int, label: str = "page"
+) -> list[int]:
+    selection = selection_str.strip()
     if not selection:
         raise ReedError("Invalid page selection")
 
@@ -196,7 +201,7 @@ def _parse_pdf_pages(page_selection: str, total_pages: int) -> list[int]:
             end = int(bounds[1])
             if start < 1 or end < 1 or end < start:
                 raise ReedError("Invalid page selection")
-            pages = range(start, end + 1)
+            pages: Sequence[int] = range(start, end + 1)
         else:
             if not token.isdigit():
                 raise ReedError("Invalid page selection")
@@ -206,9 +211,9 @@ def _parse_pdf_pages(page_selection: str, total_pages: int) -> list[int]:
             pages = [page]
 
         for page in pages:
-            if page > total_pages:
+            if page > total:
                 raise ReedError(
-                    f"Page {page} is out of range (PDF has {total_pages} pages)"
+                    f"{label.title()} {page} is out of range (total: {total})"
                 )
             index = page - 1
             if index not in seen:
@@ -237,7 +242,9 @@ def _iter_pdf_pages(
         raise ReedError("PDF has no pages")
 
     if page_selection:
-        page_indices = _parse_pdf_pages(page_selection, total_pages)
+        page_indices: Sequence[int] = _parse_range_selection(
+            page_selection, total_pages
+        )
     else:
         page_indices = range(total_pages)
 
@@ -253,6 +260,149 @@ def _iter_pdf_pages(
         raise ReedError("No extractable text found in PDF")
 
 
+_BLOCK_TAGS = frozenset(
+    "p div br h1 h2 h3 h4 h5 h6 li tr blockquote section article".split()
+)
+_SKIP_TAGS = frozenset({"script", "style", "title"})
+
+
+class _HTMLTextExtractor(HTMLParser):
+    """Collect the readable text of an HTML document, discarding all markup.
+
+    Tags in ``_BLOCK_TAGS`` start a new line. Text inside ``_SKIP_TAGS`` is
+    dropped: ``HTMLParser`` passes ``<style>``/``<script>`` bodies to
+    ``handle_data`` like ordinary text, so CSS would otherwise be read aloud.
+    """
+
+    def __init__(self) -> None:
+        super().__init__()
+        self._parts: list[str] = []
+        self._skip_depth = 0  # > 0 while inside a ``_SKIP_TAGS`` element
+
+    def handle_starttag(self, tag: str, attrs: list[tuple[str, str | None]]) -> None:
+        if tag in _SKIP_TAGS:
+            self._skip_depth += 1
+        elif tag in _BLOCK_TAGS:
+            self._parts.append("\n")
+
+    def handle_endtag(self, tag: str) -> None:
+        if tag in _SKIP_TAGS and self._skip_depth:
+            self._skip_depth -= 1
+
+    def handle_data(self, data: str) -> None:
+        if not self._skip_depth:
+            self._parts.append(data)
+
+    def get_text(self) -> str:
+        """Return the text with whitespace collapsed within each line."""
+        lines = "".join(self._parts).split("\n")
+        return "\n".join(" ".join(line.split()) for line in lines).strip()
+
+
+def _strip_html(html_bytes: bytes) -> str:
+    """Decode UTF-8 *html_bytes* (bad bytes are replaced) and return its text."""
+    extractor = _HTMLTextExtractor()
+    extractor.feed(html_bytes.decode("utf-8", errors="replace"))
+    extractor.close()
+    return extractor.get_text()
+
+
+def _load_epub_spine(path: Path) -> list[tuple[str, zipfile.ZipFile]]:
+    """Parse EPUB spine and return ``(href, zip_file)`` pairs in reading order.
+
+    Reads only the container and OPF documents; chapters stay compressed so
+    callers can read them lazily with ``zf.read(href)``. The shared ``ZipFile``
+    is returned open and is closed here only when loading fails.
+
+    Raises:
+        ReedError: the archive cannot be opened, its metadata is missing or
+            malformed, or the spine references no XHTML content documents.
+    """
+    from urllib.parse import unquote
+
+    try:
+        zf = zipfile.ZipFile(str(path), "r")
+    except Exception as e:
+        raise ReedError(f"Failed to open EPUB: {e}") from e
+
+    try:
+        try:
+            container = ET.fromstring(zf.read("META-INF/container.xml"))
+        except KeyError:
+            raise ReedError("Invalid EPUB: missing META-INF/container.xml") from None
+        ns = {"c": "urn:oasis:names:tc:opendocument:xmlns:container"}
+        rootfile_el = container.find(".//c:rootfile", ns)
+        if rootfile_el is None:
+            raise ReedError("Invalid EPUB: no rootfile in container.xml")
+        opf_path = rootfile_el.get("full-path", "")
+        try:
+            opf = ET.fromstring(zf.read(opf_path))
+        except KeyError:
+            raise ReedError(f"Invalid EPUB: missing {opf_path}") from None
+        opf_ns = opf.tag.split("}")[0] + "}" if "}" in opf.tag else ""
+        opf_dir = opf_path.rsplit("/", 1)[0] + "/" if "/" in opf_path else ""
+        manifest: dict[str, str] = {}
+        for item in opf.findall(f".//{opf_ns}manifest/{opf_ns}item"):
+            # ``properties`` is a space-separated token list; match ``nav`` exactly.
+            is_nav = "nav" in item.get("properties", "").split()
+            if item.get("media-type", "") == "application/xhtml+xml" and not is_nav:
+                # hrefs are percent-encoded URLs; ZIP member names are not.
+                manifest[item.get("id", "")] = opf_dir + unquote(item.get("href", ""))
+
+        spine_hrefs: list[tuple[str, zipfile.ZipFile]] = [
+            (manifest[ref.get("idref", "")], zf)
+            for ref in opf.findall(f".//{opf_ns}spine/{opf_ns}itemref")
+            if ref.get("idref", "") in manifest
+        ]
+        if not spine_hrefs:
+            raise ReedError("No chapters found in EPUB")
+    except (ET.ParseError, zipfile.BadZipFile) as e:
+        zf.close()
+        raise ReedError(f"Invalid EPUB: malformed archive or XML ({e})") from e
+    except Exception:
+        zf.close()
+        raise
+    return spine_hrefs
+
+
+def _read_epub_chapter(chapter: tuple[str, zipfile.ZipFile]) -> str:
+    """Return one chapter's plain text; a spine entry missing from the ZIP yields ``""``."""
+    member, archive = chapter
+    try:
+        markup = archive.read(member)
+    except KeyError:
+        return ""
+    return _strip_html(markup).strip()
+
+
+def _split_paragraphs(text: str) -> list[str]:
+    """Break *text* into one chunk per non-blank line.
+
+    Surrounding whitespace is trimmed from every chunk and blank lines are
+    dropped, so each chunk can be handed to the speech engine on its own.
+    """
+    return [chunk for chunk in map(str.strip, text.splitlines()) if chunk]
+
+
+def _iter_epub_chapters(
+    path: Path, chapter_selection: Optional[str]
+) -> Iterator[tuple[int, int, str]]:
+    """Yield ``(chapter_number, total_chapters, text)`` per selected chapter.
+
+    ``chapter_selection`` uses the same ``1,3-5`` syntax as PDF pages; a falsy
+    value selects every spine entry. Chapters without text are yielded as ``""``.
+    """
+    spine = _load_epub_spine(path)
+    count = len(spine)
+    wanted: Sequence[int] = (
+        _parse_range_selection(chapter_selection, count, label="chapter")
+        if chapter_selection
+        else range(count)
+    )
+    for position in wanted:
+        yield position + 1, count, _read_epub_chapter(spine[position])
+
+
 def build_piper_cmd(
     model: Path,
     speed: float,
@@ -506,10 +656,10 @@ def main(
     args = parser.parse_args(argv)
     if args.pages:
         if not args.file:
-            print_error("--pages requires --file <PDF>", print_fn)
+            print_error("--pages requires --file <PDF or EPUB>", print_fn)
             return 1
-        if Path(args.file).suffix.lower() != ".pdf":
-            print_error("--pages can only be used with PDF files", print_fn)
+        if Path(args.file).suffix.lower() not in (".pdf", ".epub"):
+            print_error("--pages can only be used with PDF or EPUB files", print_fn)
             return 1
 
     # Resolve model: None → default, short name → data dir path
@@ -605,6 +755,57 @@ def main(
                 )
             return 0
 
+        if args.file and Path(args.file).suffix.lower() == ".epub":
+            epub_path = Path(args.file)
+
+            def _speak_chapter(ch_text: str) -> None:
+                paragraphs = _split_paragraphs(ch_text)
+                for para in paragraphs:
+                    speak_text(
+                        para, config, run=run, print_fn=print_fn, play_cmd=play_cmd
+                    )
+
+            chapters = _load_epub_spine(epub_path)
+            total = len(chapters)
+            spoken: set[int] = set()
+
+            for ch_num, total_chapters, text in _iter_epub_chapters(
+                epub_path, args.pages
+            ):
+                if ch_num in spoken:
+                    continue
+                if text:
+                    spoken.add(ch_num)
+                    print_fn(
+                        f"\n[bold cyan]📖 Chapter {ch_num}/{total_chapters}[/bold cyan]"
+                    )
+                    _speak_chapter(text)
+                    continue
+
+                # Chapter is empty — skip to next chapter with text
+                for next_index in range(ch_num, total):
+                    next_num = next_index + 1
+                    if next_num in spoken:
+                        continue
+                    next_text = _read_epub_chapter(chapters[next_index])
+                    if next_text:
+                        spoken.add(next_num)
+                        print_fn(
+                            f"\n[yellow]⏭ Chapter {ch_num}/{total_chapters} has no text, "
+                            f"skipping to chapter {next_num}[/yellow]"
+                        )
+                        print_fn(
+                            f"\n[bold cyan]📖 Chapter {next_num}/{total_chapters}[/bold cyan]"
+                        )
+                        _speak_chapter(next_text)
+                        break
+                else:
+                    print_fn(
+                        f"\n[yellow]⏭ Chapter {ch_num}/{total_chapters} has no text "
+                        f"(no subsequent chapter with text found)[/yellow]"
+                    )
+            return 0
+
         text = get_text(args, stdin, run=run)
 
         if not text:
diff --git a/test_reed.py b/test_reed.py
index 2cfd8a6..a403118 100644
--- a/test_reed.py
+++ b/test_reed.py
@@ -713,15 +713,350 @@ def __init__(self, path):
         with pytest.raises(ReedError, match="Invalid page selection"):
             list(_iter_pdf_pages(Path("book.pdf"), "1,a"))
 
-    def test_pages_flag_with_non_pdf_file_raises(self):
+    def test_pages_flag_with_non_pdf_epub_file_raises(self):
         from reed import ReedError, get_text
 
         txt = io.StringIO("file content")
         args = _make_args(file="notes.txt", pages="1")
-        with pytest.raises(ReedError, match="only be used with PDF files"):
+        with pytest.raises(ReedError, match="only be used with PDF or EPUB files"):
             get_text(args, stdin=txt)
 
 
+# ─── _strip_html tests ───────────────────────────────────────────────
+
+
+class TestStripHtml:
+    def test_strips_basic_tags(self):
+        from reed import _strip_html
+
+        assert _strip_html(b"<p>Hello <b>world</b></p>") == "Hello world"
+
+    def test_preserves_paragraph_breaks(self):
+        from reed import _strip_html
+
+        result = _strip_html(b"<p>First</p><p>Second</p>")
+        assert result == "First\nSecond"
+
+    def test_empty_input(self):
+        from reed import _strip_html
+
+        assert _strip_html(b"") == ""
+
+    def test_plain_text_passthrough(self):
+        from reed import _strip_html
+
+        assert _strip_html(b"no tags here") == "no tags here"
+
+    def test_handles_entities(self):
+        from reed import _strip_html
+
+        result = _strip_html(b"<p>A &amp; B</p>")
+        assert "A & B" in result
+
+    def test_block_elements_add_breaks(self):
+        from reed import _strip_html
+
+        result = _strip_html(b"<div>One</div><div>Two</div>")
+        assert result == "One\nTwo"
+
+    def test_br_adds_break(self):
+        from reed import _strip_html
+
+        result = _strip_html(b"Line one<br/>Line two")
+        assert result == "Line one\nLine two"
+
+    def test_headings_add_breaks(self):
+        from reed import _strip_html
+
+        result = _strip_html(b"<h1>Title</h1><p>Body text</p>")
+        assert result == "Title\nBody text"
+
+
+# ─── _split_paragraphs tests ─────────────────────────────────────────
+
+
+class TestSplitParagraphs:
+    def test_splits_on_blank_lines(self):
+        from reed import _split_paragraphs
+
+        result = _split_paragraphs("First paragraph.\n\nSecond paragraph.")
+        assert result == ["First paragraph.", "Second paragraph."]
+
+    def test_single_paragraph(self):
+        from reed import _split_paragraphs
+
+        result = _split_paragraphs("Just one line.")
+        assert result == ["Just one line."]
+
+    def test_each_line_separate(self):
+        from reed import _split_paragraphs
+
+        result = _split_paragraphs("Line one\nLine two\n\nLine three")
+        assert result == ["Line one", "Line two", "Line three"]
+
+    def test_empty_string(self):
+        from reed import _split_paragraphs
+
+        assert _split_paragraphs("") == []
+
+    def test_only_whitespace(self):
+        from reed import _split_paragraphs
+
+        assert _split_paragraphs("  \n  \n  ") == []
+
+
+# ─── _iter_epub_chapters tests ───────────────────────────────────────
+
+
+class TestIterEpubChapters:
+    def _fake_spine(self, html_list):
+        """Create a fake spine: list of (href, FakeZf) from HTML byte strings."""
+
+        class FakeZf:
+            def __init__(self, data_map):
+                self._data = data_map
+
+            def read(self, href):
+                return self._data[href]
+
+        data = {f"ch{i}.xhtml": html for i, html in enumerate(html_list)}
+        zf = FakeZf(data)
+        return [(href, zf) for href in data]
+
+    def test_reads_all_chapters(self, monkeypatch):
+        from reed import _iter_epub_chapters
+
+        spine = self._fake_spine([b"<p>Chapter one</p>", b"<p>Chapter two</p>"])
+        monkeypatch.setattr("reed._load_epub_spine", lambda p: spine)
+
+        result = list(_iter_epub_chapters(Path("book.epub"), None))
+        assert len(result) == 2
+        assert result[0] == (1, 2, "Chapter one")
+        assert result[1] == (2, 2, "Chapter two")
+
+    def test_selected_chapters(self, monkeypatch):
+        from reed import _iter_epub_chapters
+
+        spine = self._fake_spine(
+            [b"<p>Ch one</p>", b"<p>Ch two</p>", b"<p>Ch three</p>", b"<p>Ch four</p>"]
+        )
+        monkeypatch.setattr("reed._load_epub_spine", lambda p: spine)
+
+        result = list(_iter_epub_chapters(Path("book.epub"), "2,4"))
+        assert result == [(2, 4, "Ch two"), (4, 4, "Ch four")]
+
+    def test_chapter_out_of_range_raises(self, monkeypatch):
+        from reed import ReedError, _iter_epub_chapters
+
+        spine = self._fake_spine([b"<p>Only one</p>"])
+        monkeypatch.setattr("reed._load_epub_spine", lambda p: spine)
+
+        with pytest.raises(ReedError, match="Chapter 5 is out of range"):
+            list(_iter_epub_chapters(Path("book.epub"), "5"))
+
+    def test_yields_empty_chapters(self, monkeypatch):
+        from reed import _iter_epub_chapters
+
+        spine = self._fake_spine([b"<p>Has text</p>", b"  ", b"<p>Also text</p>"])
+        monkeypatch.setattr("reed._load_epub_spine", lambda p: spine)
+
+        result = list(_iter_epub_chapters(Path("book.epub"), None))
+        assert len(result) == 3
+        assert result[0] == (1, 3, "Has text")
+        assert result[1] == (2, 3, "")
+        assert result[2] == (3, 3, "Also text")
+
+    def test_empty_text_still_yielded(self, monkeypatch):
+        from reed import _iter_epub_chapters
+
+        spine = self._fake_spine([b"  "])
+        monkeypatch.setattr("reed._load_epub_spine", lambda p: spine)
+
+        result = list(_iter_epub_chapters(Path("book.epub"), None))
+        assert result == [(1, 1, "")]
+
+
+# ─── main EPUB integration tests ────────────────────────────────────
+
+
+class TestMainEpub:
+    def _capture_main(self, **kwargs):
+        from rich.console import Console as RichConsole
+
+        cap_console = RichConsole(file=io.StringIO(), force_terminal=False)
+        code = _reed.main(print_fn=cap_console.print, **kwargs)
+        output = cap_console.file.getvalue()
+        return code, output
+
+    def _fake_spine(self, html_list):
+        """Create a fake spine: list of (href, FakeZf) from HTML byte strings."""
+
+        class FakeZf:
+            def __init__(self, data_map):
+                self._data = data_map
+
+            def read(self, href):
+                return self._data[href]
+
+        data = {f"ch{i}.xhtml": html for i, html in enumerate(html_list)}
+        zf = FakeZf(data)
+        return [(href, zf) for href in data]
+
+    def test_epub_file_reads_chapters(self, monkeypatch, tmp_path):
+        epub_file = tmp_path / "book.epub"
+        epub_file.touch()
+
+        spoken: list[str] = []
+
+        def fake_speak(text, config, *, run, print_fn, play_cmd):
+            spoken.append(text)
+
+        monkeypatch.setattr("reed.speak_text", fake_speak)
+        monkeypatch.setattr(
+            "reed._load_epub_spine",
+            lambda p: self._fake_spine(
+                [b"<p>Chapter one text</p>", b"<p>Chapter two text</p>"]
+            ),
+        )
+
+        code, output = self._capture_main(
+            argv=["-f", str(epub_file), "-m", __file__],
+            run=lambda *a, **k: types.SimpleNamespace(returncode=0, stderr=""),
+            stdin=io.StringIO(""),
+        )
+        assert code == 0
+        assert "Chapter 1/2" in output
+        assert "Chapter one text" in spoken
+        assert "Chapter two text" in spoken
+
+    def test_epub_skips_to_next_chapter_with_text(self, monkeypatch, tmp_path):
+        epub_file = tmp_path / "book.epub"
+        epub_file.touch()
+
+        spoken: list[str] = []
+
+        def fake_speak(text, config, *, run, print_fn, play_cmd):
+            spoken.append(text)
+
+        monkeypatch.setattr("reed.speak_text", fake_speak)
+        monkeypatch.setattr(
+            "reed._load_epub_spine",
+            lambda p: self._fake_spine([b"  ", b"<p>Real content</p>", b"  "]),
+        )
+
+        code, output = self._capture_main(
+            argv=["-f", str(epub_file), "--pages", "1", "-m", __file__],
+            run=lambda *a, **k: types.SimpleNamespace(returncode=0, stderr=""),
+            stdin=io.StringIO(""),
+        )
+        assert code == 0
+        assert "has no text, skipping to chapter 2" in output
+        assert "Chapter 2/3" in output
+        assert spoken == ["Real content"]
+
+    def test_epub_skip_no_subsequent_text(self, monkeypatch, tmp_path):
+        epub_file = tmp_path / "book.epub"
+        epub_file.touch()
+
+        spoken: list[str] = []
+
+        def fake_speak(text, config, *, run, print_fn, play_cmd):
+            spoken.append(text)
+
+        monkeypatch.setattr("reed.speak_text", fake_speak)
+        monkeypatch.setattr(
+            "reed._load_epub_spine",
+            lambda p: self._fake_spine([b"<p>Content</p>", b"  "]),
+        )
+
+        code, output = self._capture_main(
+            argv=["-f", str(epub_file), "--pages", "2", "-m", __file__],
+            run=lambda *a, **k: types.SimpleNamespace(returncode=0, stderr=""),
+            stdin=io.StringIO(""),
+        )
+        assert code == 0
+        assert "no subsequent chapter with text found" in output
+        assert spoken == []
+
+    def test_epub_all_chapters_skips_empty(self, monkeypatch, tmp_path):
+        epub_file = tmp_path / "book.epub"
+        epub_file.touch()
+
+        spoken: list[str] = []
+
+        def fake_speak(text, config, *, run, print_fn, play_cmd):
+            spoken.append(text)
+
+        monkeypatch.setattr("reed.speak_text", fake_speak)
+        monkeypatch.setattr(
+            "reed._load_epub_spine",
+            lambda p: self._fake_spine([b"  ", b"<p>Real content</p>", b"  "]),
+        )
+
+        code, output = self._capture_main(
+            argv=["-f", str(epub_file), "-m", __file__],
+            run=lambda *a, **k: types.SimpleNamespace(returncode=0, stderr=""),
+            stdin=io.StringIO(""),
+        )
+        assert code == 0
+        assert "Chapter 2/3" in output
+        assert spoken == ["Real content"]
+
+    def test_epub_speaks_paragraph_by_paragraph(self, monkeypatch, tmp_path):
+        epub_file = tmp_path / "book.epub"
+        epub_file.touch()
+
+        spoken: list[str] = []
+
+        def fake_speak(text, config, *, run, print_fn, play_cmd):
+            spoken.append(text)
+
+        monkeypatch.setattr("reed.speak_text", fake_speak)
+        monkeypatch.setattr(
+            "reed._load_epub_spine",
+            lambda p: self._fake_spine(
+                [b"<p>First paragraph.</p><p>Second paragraph.</p>"]
+            ),
+        )
+
+        code, output = self._capture_main(
+            argv=["-f", str(epub_file), "-m", __file__],
+            run=lambda *a, **k: types.SimpleNamespace(returncode=0, stderr=""),
+            stdin=io.StringIO(""),
+        )
+        assert code == 0
+        assert spoken == ["First paragraph.", "Second paragraph."]
+
+    def test_pages_flag_works_with_epub(self, monkeypatch, tmp_path):
+        epub_file = tmp_path / "book.epub"
+        epub_file.touch()
+
+        spoken: list[str] = []
+
+        def fake_speak(text, config, *, run, print_fn, play_cmd):
+            spoken.append(text)
+
+        monkeypatch.setattr("reed.speak_text", fake_speak)
+        monkeypatch.setattr(
+            "reed._load_epub_spine",
+            lambda p: self._fake_spine(
+                [
+                    b"<p>First chapter</p>",
+                    b"<p>Second chapter</p>",
+                    b"<p>Third chapter</p>",
+                ]
+            ),
+        )
+
+        code, output = self._capture_main(
+            argv=["-f", str(epub_file), "--pages", "1,3", "-m", __file__],
+            run=lambda *a, **k: types.SimpleNamespace(returncode=0, stderr=""),
+            stdin=io.StringIO(""),
+        )
+        assert code == 0
+        assert spoken == ["First chapter", "Third chapter"]
+
+
 # ─── main error path tests ───────────────────────────────────────────
 
 
@@ -770,7 +1105,7 @@ def test_pages_without_file_returns_1(self):
             stdin=io.StringIO(""),
         )
         assert code == 1
-        assert "--pages requires --file <PDF>" in output
+        assert "--pages requires --file" in output
 
 
 # ─── _data_dir tests ─────────────────────────────────────────────────

From b1d102078b2895b394f54b24641f592b1e8a1765 Mon Sep 17 00:00:00 2001
From: Azis <azuolas.krusna@yahoo.com>
Date: Thu, 19 Feb 2026 23:39:46 +0100
Subject: [PATCH 2/2] Resolve playback command lazily; switch CI to ubuntu-slim

---
 .github/workflows/tests.yml |  2 +-
 reed.py                     |  4 +++-
 test_reed.py                | 19 ++++++++++++++++---
 3 files changed, 20 insertions(+), 5 deletions(-)

diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml
index dd05394..d7942e9 100644
--- a/.github/workflows/tests.yml
+++ b/.github/workflows/tests.yml
@@ -19,7 +19,7 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        os: [ubuntu-latest, macos-latest, windows-latest]
+        os: [ubuntu-slim, macos-latest, windows-latest]
         python-version: ["3.14"]
 
     env:
diff --git a/reed.py b/reed.py
index 1f03aad..7ec9ba1 100755
--- a/reed.py
+++ b/reed.py
@@ -730,7 +730,9 @@ def main(
         print_error(str(e), print_fn)
         return 1
 
-    play_cmd = _default_play_cmd() if not config.output else None
+    # Resolve playback command lazily in speak_text so non-playback flows
+    # (e.g., empty input, mocked speak_text in tests) don't fail early.
+    play_cmd = None
 
     if _should_enter_interactive(args, stdin):
         loop_fn = interactive_loop_fn or interactive_loop
diff --git a/test_reed.py b/test_reed.py
index a403118..f340079 100644
--- a/test_reed.py
+++ b/test_reed.py
@@ -332,8 +332,8 @@ def fake_run(cmd, **kwargs):
 
 
 class TestMainInteractiveFlag:
-    def test_no_input_defaults_to_interactive(self):
-        from reed import main
+    def test_no_input_defaults_to_interactive(self, monkeypatch):
+        from reed import ReedError, main
 
         loop_called = []
 
@@ -351,6 +351,11 @@ def fake_loop(**kwargs):
             loop_called.append(True)
             return 0
 
+        def no_player() -> list[str]:
+            raise ReedError("No supported audio player found")
+
+        monkeypatch.setattr("reed._default_play_cmd", no_player)
+
         code = main(
             argv=["-m", __file__],
             interactive_loop_fn=fake_loop,
@@ -1078,13 +1083,21 @@ def test_missing_model_returns_1(self):
         assert code == 1
         assert "Model not found" in output
 
-    def test_empty_text_returns_1(self):
+    def test_empty_text_returns_1(self, monkeypatch):
+        from reed import ReedError
+
+        def no_player() -> list[str]:
+            raise ReedError("No supported audio player found")
+
+        monkeypatch.setattr("reed._default_play_cmd", no_player)
+
         code, output = self._capture_main(
             argv=[],
             run=lambda *a, **k: types.SimpleNamespace(returncode=0, stderr=""),
             stdin=io.StringIO(""),
         )
         assert code == 1
+        assert "No text to read." in output
 
     def test_reed_error_returns_1(self):
         def failing_run(cmd, **kwargs):