From 7879a51fe36605767edfb7cd0b6ba4a008444e9c Mon Sep 17 00:00:00 2001 From: Admin Date: Sun, 1 Mar 2026 12:25:16 +0500 Subject: [PATCH] feat: add Kokoro TTS, ranking page, direct HTTP strategy, and chapter-number fix - Add Kokoro-FastAPI TTS integration to the chapter reader UI: - Browser-side MSE streaming with paragraph-level click-to-start - Voice selector, speed slider, auto-next with prefetch of the next chapter - New GET /ui/chapter-text endpoint that strips Markdown and serves plain text - Add ranking page (novelfire /ranking scraper, WriteRanking/ReadRankingItems in writer, GET /ranking + POST /ranking/refresh + GET /ranking/view routes) with local-library annotation and one-click scrape buttons - Add StrategyDirect (plain HTTP client) as a new browser strategy; the default strategy is now 'direct' for chapter fetching and 'content' for chapter-list URL retrieval (split via BROWSERLESS_URL_STRATEGY) - Fix chapter numbering bug: numbers are now derived from the URL path (/chapter-N) rather than list position, correcting newest-first ordering - Add 'refresh ' CLI sub-command to re-scrape a book from its saved source_url without knowing the original URL - Extend NovelScraper interface with RankingProvider (ScrapeRanking) - Tune scraper timeouts: wait-for-selector reduced to 5 s, GotoOptions timeout set to 60 s, content/scrape client defaults raised to 90 s - Add cover extraction fix (figure.cover > img rather than bare img.cover) - Add AGENTS.md and .aiignore for AI tooling context - Add integration tests for browser client and novelfire scraper (build tag: integration) and unit tests for chapterNumberFromURL and pagination --- .aiignore | 20 + .env.example | 22 +- .gitignore | 4 - AGENTS.md | 89 ++ docker-compose.yml | 29 +- scraper/cmd/scraper/main.go | 55 +- scraper/internal/browser/content_scrape.go | 4 +- scraper/internal/browser/http.go | 68 + scraper/internal/browser/integration_test.go | 152 ++ scraper/internal/browser/interface.go | 19 +- 
.../internal/novelfire/integration_test.go | 344 +++++ scraper/internal/novelfire/scraper.go | 277 +++- scraper/internal/novelfire/scraper_test.go | 217 +++ scraper/internal/scraper/interfaces.go | 10 + scraper/internal/server/server.go | 57 +- scraper/internal/server/ui.go | 1331 +++++++++++++++++ scraper/internal/writer/writer.go | 206 ++- 17 files changed, 2816 insertions(+), 88 deletions(-) create mode 100644 .aiignore create mode 100644 AGENTS.md create mode 100644 scraper/internal/browser/http.go create mode 100644 scraper/internal/browser/integration_test.go create mode 100644 scraper/internal/novelfire/integration_test.go create mode 100644 scraper/internal/novelfire/scraper_test.go create mode 100644 scraper/internal/server/ui.go diff --git a/.aiignore b/.aiignore new file mode 100644 index 0000000..10b81d0 --- /dev/null +++ b/.aiignore @@ -0,0 +1,20 @@ +# AI Indexing Ignore +# These directories/files are excluded from AI context indexing for speed + +# Generated/scraped content +scraper/static/ + +# Build artifacts +scraper/bin/ +*.exe + +# Dependencies (if using Go modules, the AI doesn't need vendor/) +# vendor/ + +# IDE +.idea/ +.vscode/ +*.swp + +# OS +.DS_Store diff --git a/.env.example b/.env.example index 2120f62..d1e4792 100644 --- a/.env.example +++ b/.env.example @@ -13,11 +13,29 @@ BROWSERLESS_QUEUED=100 # Per-session timeout in ms BROWSERLESS_TIMEOUT=60000 -# Which Browserless strategy the scraper uses: content | scrape | cdp -BROWSERLESS_STRATEGY=content +# Optional webhook URL for Browserless error alerts (leave empty to disable) +ERROR_ALERT_URL= + +# Which Browserless strategy the scraper uses: content | scrape | cdp | direct +BROWSERLESS_STRATEGY=direct + +# Strategy for URL retrieval (chapter list). Uses browserless content strategy by default. +# Set to direct to use plain HTTP, or content/scrape/cdp for browserless. 
+BROWSERLESS_URL_STRATEGY=content # Chapter worker goroutines (0 = NumCPU inside the container) SCRAPER_WORKERS=0 # Host path to mount as the static output directory STATIC_ROOT=./static/books + +# ── Kokoro-FastAPI TTS ──────────────────────────────────────────────────────── +# Base URL for the Kokoro-FastAPI service. When running via docker-compose the +# default (http://kokoro:8880) is wired in automatically; override here only if +# you are pointing at an external or GPU instance. +KOKORO_URL=http://kokoro:8880 + +# Default voice used for chapter narration. +# Single voices: af_bella, af_sky, af_heart, am_adam, … +# Mixed voices: af_bella+af_sky or af_bella(2)+af_sky(1) (weighted blend) +KOKORO_VOICE=af_bella diff --git a/.gitignore b/.gitignore index 9286c12..4f6ca69 100644 --- a/.gitignore +++ b/.gitignore @@ -1,7 +1,3 @@ -# ── Compiled binary ──────────────────────────────────────────────────────────── -/scraper -/scraper-* - # ── Go toolchain ─────────────────────────────────────────────────────────────── *.test *.out diff --git a/AGENTS.md b/AGENTS.md new file mode 100644 index 0000000..74ad802 --- /dev/null +++ b/AGENTS.md @@ -0,0 +1,89 @@ +# libnovel Project + +Go web scraper for novelfire.net with TTS support via Kokoro-FastAPI. 
+ +## Architecture + +``` +scraper/ +├── cmd/scraper/main.go # Entry point: 'run' (one-shot) and 'serve' (HTTP server) +├── internal/ +│ ├── orchestrator/orchestrator.go # Coordinates catalogue walk, metadata extraction, chapter scraping +│ ├── browser/ # Browser client (content/scrape/cdp strategies) via Browserless +│ ├── novelfire/scraper.go # novelfire.net specific scraping logic +│ ├── server/server.go # HTTP API (POST /scrape, POST /scrape/book) +│ ├── writer/writer.go # File writer (metadata.yaml, chapter .md files) +│ └── scraper/interfaces.go # NovelScraper interface definition +└── static/books/ # Output directory for scraped content +``` + +## Key Concepts + +- **Orchestrator**: Manages concurrency - catalogue streaming → per-book metadata goroutines → chapter worker pool +- **Browser Client**: 3 strategies (content/scrape/cdp) via Browserless Chrome container +- **Writer**: Writes metadata.yaml and chapter markdown files to `static/books/{slug}/vol-0/1-50/` +- **Server**: HTTP API with async scrape jobs, UI for browsing books/chapters, chapter-text endpoint for TTS + +## Commands + +```bash +# Build +cd scraper && go build -o bin/scraper ./cmd/scraper + +# One-shot scrape (full catalogue) +./bin/scraper run + +# Single book +./bin/scraper run --url https://novelfire.net/book/xxx + +# HTTP server +./bin/scraper serve + +# Tests +cd scraper && go test ./... 
+``` + +## Environment Variables + +| Variable | Description | Default | +|----------|-------------|---------| +| BROWSERLESS_URL | Browserless Chrome endpoint | http://localhost:3000 | +| BROWSERLESS_STRATEGY | content \| scrape \| cdp | content | +| SCRAPER_WORKERS | Chapter goroutines | NumCPU | +| SCRAPER_STATIC_ROOT | Output directory | ./static/books | +| SCRAPER_HTTP_ADDR | HTTP listen address | :8080 | +| KOKORO_URL | Kokoro TTS endpoint | http://localhost:8880 | +| KOKORO_VOICE | Default TTS voice | af_bella | +| LOG_LEVEL | debug \| info \| warn \| error | info | + +## Docker + +```bash +docker-compose up -d # Starts browserless, kokoro, scraper +``` + +## Code Patterns + +- Uses `log/slog` for structured logging +- Context-based cancellation throughout +- Worker pool pattern in orchestrator (channel + goroutines) +- Mutex for single async job (409 on concurrent scrape requests) + +## AI Context Tips + +- Primary files to modify: `orchestrator.go`, `server.go`, `scraper.go`, `browser/*.go` +- To add new source: implement `NovelScraper` interface from `internal/scraper/interfaces.go` +- Skip `static/` directory - generated content, not source + +## Speed Up AI Sessions (Optional) + +For faster AI context loading, use **Context7** (free, local indexing): + +```bash +# Install and index once +npx @context7/cli@latest index --path . --ignore .aiignore + +# After first run, AI tools will query the index instead of re-scanning files +``` + +VSCode extension: https://marketplace.visualstudio.com/items?itemName=context7.context7 diff --git a/docker-compose.yml b/docker-compose.yml index 0f549db..0cddbcd 100644 --- a/docker-compose.yml +++ b/docker-compose.yml @@ -16,6 +16,8 @@ services: QUEUED: "${BROWSERLESS_QUEUED:-100}" # Per-session timeout in ms. TIMEOUT: "${BROWSERLESS_TIMEOUT:-60000}" + # Optional webhook URL for Browserless error alerts. + ERROR_ALERT_URL: "${ERROR_ALERT_URL:-}" ports: - "3000:3000" # Shared memory is required for Chrome. 
@@ -26,6 +28,21 @@ services: timeout: 5s retries: 5 + # ─── Kokoro-FastAPI (TTS) ──────────────────────────────────────────────────── + # CPU image; swap for ghcr.io/remsky/kokoro-fastapi-gpu:latest on NVIDIA hosts. + # Models are baked in — no volume mount required for the default voice set. + kokoro: + image: ghcr.io/remsky/kokoro-fastapi-cpu:latest + container_name: libnovel-kokoro + restart: unless-stopped + ports: + - "8880:8880" + healthcheck: + test: ["CMD", "curl", "-f", "http://localhost:8880/health"] + interval: 15s + timeout: 5s + retries: 5 + # ─── Scraper ───────────────────────────────────────────────────────────────── scraper: build: @@ -34,17 +51,23 @@ services: container_name: libnovel-scraper restart: unless-stopped depends_on: - browserless: + kokoro: condition: service_healthy environment: BROWSERLESS_URL: "http://browserless:3000" BROWSERLESS_TOKEN: "${BROWSERLESS_TOKEN:-}" - # content | scrape | cdp — swap to test different strategies. - BROWSERLESS_STRATEGY: "${BROWSERLESS_STRATEGY:-content}" + # content | scrape | cdp | direct — swap to test different strategies. + BROWSERLESS_STRATEGY: "${BROWSERLESS_STRATEGY:-direct}" + # Strategy for URL retrieval (chapter list). Default: content (browserless) + BROWSERLESS_URL_STRATEGY: "${BROWSERLESS_URL_STRATEGY:-content}" # 0 → defaults to NumCPU inside the container. SCRAPER_WORKERS: "${SCRAPER_WORKERS:-0}" SCRAPER_STATIC_ROOT: "/app/static/books" SCRAPER_HTTP_ADDR: ":8080" + LOG_LEVEL: "debug" + # Kokoro-FastAPI TTS endpoint. 
+ KOKORO_URL: "${KOKORO_URL:-http://localhost:8880}" + KOKORO_VOICE: "${KOKORO_VOICE:-af_bella}" ports: - "8080:8080" volumes: diff --git a/scraper/cmd/scraper/main.go b/scraper/cmd/scraper/main.go index fee9203..02c4099 100644 --- a/scraper/cmd/scraper/main.go +++ b/scraper/cmd/scraper/main.go @@ -17,6 +17,8 @@ // SCRAPER_WORKERS Chapter goroutine count (default: NumCPU) // SCRAPER_STATIC_ROOT Output directory (default: ./static/books) // SCRAPER_HTTP_ADDR HTTP listen address (default: :8080) +// KOKORO_URL Kokoro-FastAPI base URL (default: "") +// KOKORO_VOICE Default TTS voice (default: af_bella) // LOG_LEVEL debug | info | warn | error (default: info) package main @@ -30,11 +32,13 @@ import ( "strconv" "strings" "syscall" + "time" "github.com/libnovel/scraper/internal/browser" "github.com/libnovel/scraper/internal/novelfire" "github.com/libnovel/scraper/internal/orchestrator" "github.com/libnovel/scraper/internal/server" + "github.com/libnovel/scraper/internal/writer" ) func main() { @@ -73,11 +77,18 @@ func run(log *slog.Logger) error { browserCfg.MaxConcurrent = n } } + if s := os.Getenv("BROWSERLESS_TIMEOUT"); s != "" { + if n, err := strconv.Atoi(s); err == nil && n > 0 { + browserCfg.Timeout = time.Duration(n) * time.Second + } + } - strategy := browser.Strategy(strings.ToLower(envOr("BROWSERLESS_STRATEGY", string(browser.StrategyContent)))) + strategy := browser.Strategy(strings.ToLower(envOr("BROWSERLESS_STRATEGY", string(browser.StrategyDirect)))) + urlStrategy := browser.Strategy(strings.ToLower(envOr("BROWSERLESS_URL_STRATEGY", string(browser.StrategyContent)))) bc := newBrowserClient(strategy, browserCfg) + urlClient := newBrowserClient(urlStrategy, browserCfg) - nf := novelfire.New(bc, log) + nf := novelfire.New(bc, log, urlClient) workers := 0 if s := os.Getenv("SCRAPER_WORKERS"); s != "" { @@ -114,15 +125,44 @@ func run(log *slog.Logger) error { o := orchestrator.New(oCfg, nf, log) return o.Run(ctx) + case "refresh": + // refresh - re-scrape a 
book from its saved source_url + if len(args) < 2 { + return fmt.Errorf("refresh command requires a book slug argument") + } + slug := args[1] + w := writer.New(oCfg.StaticRoot) + meta, ok, err := w.ReadMetadata(slug) + if err != nil { + return fmt.Errorf("failed to read metadata for %s: %w", slug, err) + } + if !ok { + return fmt.Errorf("book %q not found in %s", slug, oCfg.StaticRoot) + } + if meta.SourceURL == "" { + return fmt.Errorf("book %q has no source_url in metadata", slug) + } + oCfg.SingleBookURL = meta.SourceURL + log.Info("refreshing book from source_url", + "slug", slug, + "source_url", meta.SourceURL, + ) + o := orchestrator.New(oCfg, nf, log) + return o.Run(ctx) + case "serve": addr := envOr("SCRAPER_HTTP_ADDR", ":8080") + kokoroURL := envOr("KOKORO_URL", "") + kokoroVoice := envOr("KOKORO_VOICE", "af_bella") log.Info("starting HTTP server", "addr", addr, "strategy", strategy, "workers", workers, "max_concurrent", browserCfg.MaxConcurrent, + "kokoro_url", kokoroURL, + "kokoro_voice", kokoroVoice, ) - srv := server.New(addr, oCfg, nf, log) + srv := server.New(addr, oCfg, nf, log, kokoroURL, kokoroVoice) return srv.ListenAndServe(ctx) default: @@ -136,6 +176,8 @@ func newBrowserClient(strategy browser.Strategy, cfg browser.Config) browser.Bro return browser.NewScrapeClient(cfg) case browser.StrategyCDP: return browser.NewCDPClient(cfg) + case browser.StrategyDirect: + return browser.NewDirectHTTPClient(cfg) default: return browser.NewContentClient(cfg) } @@ -153,16 +195,21 @@ func printUsage() { Commands: run [--url ] One-shot: scrape full catalogue, or a single book + refresh Re-scrape a book from its saved source_url serve Start HTTP server (POST /scrape, POST /scrape/book) Environment variables: BROWSERLESS_URL Browserless base URL (default: http://localhost:3000) BROWSERLESS_TOKEN API token (default: "") - BROWSERLESS_STRATEGY content | scrape | cdp (default: content) + BROWSERLESS_STRATEGY content|scrape|cdp|direct (default: direct) + 
BROWSERLESS_URL_STRATEGY Strategy for URL retrieval (default: content) BROWSERLESS_MAX_CONCURRENT Max simultaneous sessions (default: 5) + BROWSERLESS_TIMEOUT HTTP request timeout sec (default: 90) SCRAPER_WORKERS Chapter goroutines (default: NumCPU = %d) SCRAPER_STATIC_ROOT Output directory (default: ./static/books) SCRAPER_HTTP_ADDR HTTP listen address (default: :8080) + KOKORO_URL Kokoro-FastAPI base URL (default: "", TTS disabled) + KOKORO_VOICE Default TTS voice (default: af_bella) LOG_LEVEL debug|info|warn|error (default: info) `, runtime.NumCPU()) } diff --git a/scraper/internal/browser/content_scrape.go b/scraper/internal/browser/content_scrape.go index 35eab3c..3e2a38c 100644 --- a/scraper/internal/browser/content_scrape.go +++ b/scraper/internal/browser/content_scrape.go @@ -65,7 +65,7 @@ type contentClient struct { // NewContentClient returns a BrowserClient that uses POST /content. func NewContentClient(cfg Config) BrowserClient { if cfg.Timeout == 0 { - cfg.Timeout = 60 * time.Second + cfg.Timeout = 90 * time.Second } return &contentClient{ cfg: cfg, @@ -135,7 +135,7 @@ type scrapeClient struct { // NewScrapeClient returns a BrowserClient that uses POST /scrape. 
func NewScrapeClient(cfg Config) BrowserClient { if cfg.Timeout == 0 { - cfg.Timeout = 60 * time.Second + cfg.Timeout = 90 * time.Second } return &scrapeClient{ cfg: cfg, diff --git a/scraper/internal/browser/http.go b/scraper/internal/browser/http.go new file mode 100644 index 0000000..5b9c374 --- /dev/null +++ b/scraper/internal/browser/http.go @@ -0,0 +1,68 @@ +package browser + +import ( + "context" + "fmt" + "io" + "net/http" + "time" +) + +type httpClient struct { + cfg Config + http *http.Client + sem chan struct{} +} + +func NewDirectHTTPClient(cfg Config) BrowserClient { + if cfg.Timeout == 0 { + cfg.Timeout = 30 * time.Second + } + return &httpClient{ + cfg: cfg, + http: &http.Client{Timeout: cfg.Timeout}, + sem: makeSem(cfg.MaxConcurrent), + } +} + +func (c *httpClient) Strategy() Strategy { return StrategyDirect } + +func (c *httpClient) GetContent(ctx context.Context, req ContentRequest) (string, error) { + if err := acquire(ctx, c.sem); err != nil { + return "", fmt.Errorf("http: semaphore: %w", err) + } + defer release(c.sem) + + httpReq, err := http.NewRequestWithContext(ctx, http.MethodGet, req.URL, nil) + if err != nil { + return "", fmt.Errorf("http: build request: %w", err) + } + httpReq.Header.Set("User-Agent", "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36") + httpReq.Header.Set("Accept", "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8") + httpReq.Header.Set("Accept-Language", "en-US,en;q=0.5") + + resp, err := c.http.Do(httpReq) + if err != nil { + return "", fmt.Errorf("http: do request: %w", err) + } + defer resp.Body.Close() + + if resp.StatusCode != http.StatusOK { + b, _ := io.ReadAll(resp.Body) + return "", fmt.Errorf("http: unexpected status %d: %s", resp.StatusCode, b) + } + + raw, err := io.ReadAll(resp.Body) + if err != nil { + return "", fmt.Errorf("http: read body: %w", err) + } + return string(raw), nil +} + +func (c *httpClient) ScrapePage(_ 
context.Context, _ ScrapeRequest) (ScrapeResponse, error) { + return ScrapeResponse{}, fmt.Errorf("http client does not support ScrapePage; use browserless") +} + +func (c *httpClient) CDPSession(_ context.Context, _ string, _ CDPSessionFunc) error { + return fmt.Errorf("http client does not support CDP; use browserless") +} diff --git a/scraper/internal/browser/integration_test.go b/scraper/internal/browser/integration_test.go new file mode 100644 index 0000000..e008803 --- /dev/null +++ b/scraper/internal/browser/integration_test.go @@ -0,0 +1,152 @@ +//go:build integration + +// Integration tests for the Browserless /content API. +// +// These tests require a live Browserless instance and are gated behind the +// "integration" build tag so they never run in normal `go test ./...` passes. +// +// Run them with: +// +// BROWSERLESS_URL=http://localhost:3000 \ +// BROWSERLESS_TOKEN=your-token \ # omit if auth is disabled +// go test -v -tags integration -timeout 120s \ +// github.com/libnovel/scraper/internal/browser +package browser_test + +import ( + "context" + "os" + "strings" + "testing" + "time" + + "github.com/libnovel/scraper/internal/browser" +) + +// chapterURL is the novelfire chapter used in every integration sub-test. +const chapterURL = "https://novelfire.net/book/a-dragon-against-the-whole-world/chapter-1" + +// newIntegrationClient reads BROWSERLESS_URL / BROWSERLESS_TOKEN from the +// environment and returns a configured contentClient. +// The test is skipped when BROWSERLESS_URL is not set. +func newIntegrationClient(t *testing.T) browser.BrowserClient { + t.Helper() + baseURL := os.Getenv("BROWSERLESS_URL") + if baseURL == "" { + t.Skip("BROWSERLESS_URL not set — skipping integration test") + } + return browser.NewContentClient(browser.Config{ + BaseURL: baseURL, + Token: os.Getenv("BROWSERLESS_TOKEN"), + // Use a generous per-request HTTP timeout so the wait-for-selector + // (75 s) doesn't get cut off by the transport layer. 
+ Timeout: 120 * time.Second, + MaxConcurrent: 1, + }) +} + +// TestIntegration_ChapterContent_ReturnsHTML verifies that a POST /content +// request with the production wait-for-selector settings succeeds and that the +// returned HTML contains the #content div expected on novelfire chapter pages. +func TestIntegration_ChapterContent_ReturnsHTML(t *testing.T) { + client := newIntegrationClient(t) + + ctx, cancel := context.WithTimeout(context.Background(), 110*time.Second) + defer cancel() + + req := browser.ContentRequest{ + URL: chapterURL, + WaitFor: &browser.WaitForSelector{ + Selector: "#content", + Timeout: 5000, + }, + RejectResourceTypes: productionRejectTypes(), + } + + html, err := client.GetContent(ctx, req) + if err != nil { + t.Fatalf("GetContent failed: %v", err) + } + + // The #content div must not be empty; presence of
<p>
tags inside it is a + // reliable indicator that chapter paragraphs were rendered. + contentIdx := strings.Index(html, `id="content"`) + if contentIdx == -1 { + t.Fatalf("id=\"content\" not found in response (%d bytes)", len(html)) + } + + // Look for
<p>
tags after the #content marker — the chapter text lives there. + afterContent := html[contentIdx:] + if !strings.Contains(afterContent, " tags; JS rendering may have failed.\nSection preview:\n%s", + truncate(afterContent, 1000)) + } + + t.Logf("chapter content section starts at byte %d (total response: %d bytes)", contentIdx, len(html)) +} + +// TestIntegration_ChapterContent_TimeoutSurfacedCorrectly verifies that a +// deliberately too-short timeout returns an error containing "TimeoutError" (the +// Browserless error string seen in the failing log entry). This ensures our +// error-classification logic in retryGetContent matches real Browserless output. +func TestIntegration_ChapterContent_TimeoutSurfacedCorrectly(t *testing.T) { + client := newIntegrationClient(t) + + ctx, cancel := context.WithTimeout(context.Background(), 40*time.Second) + defer cancel() + + req := browser.ContentRequest{ + URL: chapterURL, + WaitFor: &browser.WaitForSelector{ + Selector: "#content", + Timeout: 500, // intentionally too short (500 ms) → Browserless will time out + }, + RejectResourceTypes: productionRejectTypes(), + } + + _, err := client.GetContent(ctx, req) + if err == nil { + t.Fatal("expected a timeout error from Browserless, but GetContent succeeded — " + + "the page may now load very fast; adjust the timeout threshold") + } + + t.Logf("got expected error: %v", err) + + // Browserless wraps navigation timeouts in a 500 response with + // "TimeoutError: Navigation timeout" in the body — this is the exact + // error that is triggering retries in production. + if !strings.Contains(err.Error(), "500") { + t.Errorf("expected HTTP 500 status in error, got: %v", err) + } +} + +// ── helpers ─────────────────────────────────────────────────────────────────── + +// productionRejectTypes returns the same resource-type block-list the +// novelfire scraper uses in production, so integration tests exercise the +// identical request shape. 
+func productionRejectTypes() []string { + return []string{ + "cspviolationreport", + "eventsource", + "fedcm", + "font", + "image", + "manifest", + "media", + "other", + "ping", + "signedexchange", + "stylesheet", + "texttrack", + "websocket", + } +} + +// truncate returns the first n bytes of s as a string. +func truncate(s string, n int) string { + if len(s) <= n { + return s + } + return s[:n] + "…" +} diff --git a/scraper/internal/browser/interface.go b/scraper/internal/browser/interface.go index aa78212..c2c8fd4 100644 --- a/scraper/internal/browser/interface.go +++ b/scraper/internal/browser/interface.go @@ -21,6 +21,10 @@ const ( // DevTools Protocol). Most powerful; required for complex interactions // (clicking, scrolling, waiting for network idle, etc.). StrategyCDP Strategy = "cdp" + + // StrategyDirect uses a plain HTTP client to fetch HTML directly. + // Suitable for sites that don't require JavaScript rendering. + StrategyDirect Strategy = "direct" ) // WaitForSelector describes the waitForSelector option sent to Browserless. @@ -29,12 +33,20 @@ type WaitForSelector struct { Timeout int `json:"timeout,omitempty"` // ms } +// GotoOptions controls page navigation behavior. +type GotoOptions struct { + Timeout int `json:"timeout,omitempty"` // ms + WaitUntil string `json:"waitUntil,omitempty"` // e.g., "networkidle2", "load" +} + // ContentRequest is the body sent to POST /content. type ContentRequest struct { URL string `json:"url"` WaitFor *WaitForSelector `json:"waitForSelector,omitempty"` WaitForTimeout int `json:"waitForTimeout,omitempty"` // ms RejectResourceTypes []string `json:"rejectResourceTypes,omitempty"` // e.g. ["image","stylesheet"] + GotoOptions *GotoOptions `json:"gotoOptions,omitempty"` + BestAttempt bool `json:"bestAttempt,omitempty"` // return partial content on timeout/error } // ScrapeElement is one element descriptor inside a ScrapeRequest. 
@@ -45,9 +57,10 @@ type ScrapeElement struct { // ScrapeRequest is the body sent to POST /scrape. type ScrapeRequest struct { - URL string `json:"url"` - Elements []ScrapeElement `json:"elements"` - WaitFor *WaitForSelector `json:"waitForSelector,omitempty"` + URL string `json:"url"` + Elements []ScrapeElement `json:"elements"` + WaitFor *WaitForSelector `json:"waitForSelector,omitempty"` + GotoOptions *GotoOptions `json:"gotoOptions,omitempty"` } // ScrapeResult is one entry in the response from POST /scrape. diff --git a/scraper/internal/novelfire/integration_test.go b/scraper/internal/novelfire/integration_test.go new file mode 100644 index 0000000..98af698 --- /dev/null +++ b/scraper/internal/novelfire/integration_test.go @@ -0,0 +1,344 @@ +//go:build integration + +// Integration tests for the novelfire.net Scraper against a live Browserless instance. +// +// These tests exercise the full scraping stack — Browserless → raw HTML → +// novelfire HTML parser — for the book: +// +// https://novelfire.net/book/a-dragon-against-the-whole-world +// +// They are gated behind the "integration" build tag so they never run in a +// normal `go test ./...` pass. +// +// Run with: +// +// BROWSERLESS_URL=http://localhost:3000 \ +// BROWSERLESS_TOKEN=your-token \ # omit if auth is disabled +// go test -v -tags integration -timeout 600s \ +// github.com/libnovel/scraper/internal/novelfire +package novelfire + +import ( + "context" + "fmt" + "os" + "strings" + "testing" + "time" + + "github.com/libnovel/scraper/internal/browser" + "github.com/libnovel/scraper/internal/scraper" +) + +const ( + integrationBookURL = "https://novelfire.net/book/a-dragon-against-the-whole-world" + integrationBookSlug = "a-dragon-against-the-whole-world" + integrationBookTitle = "A Dragon against the Whole World" +) + +// newIntegrationScraper reads BROWSERLESS_URL / BROWSERLESS_TOKEN from the +// environment, constructs a real contentClient, and returns a novelfire Scraper +// wired to it. 
The test is skipped when BROWSERLESS_URL is not set. +func newIntegrationScraper(t *testing.T) *Scraper { + t.Helper() + baseURL := os.Getenv("BROWSERLESS_URL") + if baseURL == "" { + t.Skip("BROWSERLESS_URL not set — skipping integration test") + } + client := browser.NewContentClient(browser.Config{ + BaseURL: baseURL, + Token: os.Getenv("BROWSERLESS_TOKEN"), + Timeout: 120 * time.Second, + MaxConcurrent: 1, + }) + return New(client, nil) +} + +// ── Metadata ────────────────────────────────────────────────────────────────── + +// TestIntegration_Novelfire_ScrapeMetadata_ReturnsTitle verifies that +// ScrapeMetadata fetches the book page and correctly parses at minimum +// the slug, title, and source URL. +func TestIntegration_Novelfire_ScrapeMetadata_ReturnsTitle(t *testing.T) { + s := newIntegrationScraper(t) + + ctx, cancel := context.WithTimeout(context.Background(), 30*time.Second) + defer cancel() + + meta, err := s.ScrapeMetadata(ctx, integrationBookURL) + if err != nil { + t.Fatalf("ScrapeMetadata failed: %v", err) + } + + t.Logf("slug: %s", meta.Slug) + t.Logf("title: %s", meta.Title) + t.Logf("author: %s", meta.Author) + t.Logf("status: %s", meta.Status) + t.Logf("genres: %v", meta.Genres) + t.Logf("total_chapters: %d", meta.TotalChapters) + t.Logf("source_url: %s", meta.SourceURL) + + if meta.Slug != integrationBookSlug { + t.Errorf("slug = %q, want %q", meta.Slug, integrationBookSlug) + } + if meta.Title == "" { + t.Error("title is empty") + } + if !strings.EqualFold(meta.Title, integrationBookTitle) { + // Warn rather than hard-fail — the site may reword the title. + t.Logf("WARN: title = %q, expected something like %q", meta.Title, integrationBookTitle) + } + if meta.SourceURL != integrationBookURL { + t.Errorf("source_url = %q, want %q", meta.SourceURL, integrationBookURL) + } +} + +// TestIntegration_Novelfire_ScrapeMetadata_ReturnsFullFields verifies that +// every optional field (author, status, genres, summary, total_chapters) is +// populated. 
A missing field is a warning, not a hard failure, because the +// site may change its HTML structure. +func TestIntegration_Novelfire_ScrapeMetadata_ReturnsFullFields(t *testing.T) { + s := newIntegrationScraper(t) + + ctx, cancel := context.WithTimeout(context.Background(), 30*time.Second) + defer cancel() + + meta, err := s.ScrapeMetadata(ctx, integrationBookURL) + if err != nil { + t.Fatalf("ScrapeMetadata failed: %v", err) + } + + type check struct { + field string + empty bool + } + checks := []check{ + {"author", meta.Author == ""}, + {"status", meta.Status == ""}, + {"summary", meta.Summary == ""}, + {"genres", len(meta.Genres) == 0}, + {"total_chapters", meta.TotalChapters == 0}, + } + for _, c := range checks { + if c.empty { + t.Errorf("field %q is empty — HTML selector may have broken", c.field) + } + } + + // total_chapters must be a positive integer. + if meta.TotalChapters < 1 { + t.Errorf("total_chapters = %d, want >= 1", meta.TotalChapters) + } +} + +// ── Chapter list ────────────────────────────────────────────────────────────── + +// TestIntegration_Novelfire_ScrapeChapterList_ReturnsRefs verifies that +// ScrapeChapterList returns a non-empty slice of chapter references with +// valid URLs and numbers parsed from those URLs (not list position). +func TestIntegration_Novelfire_ScrapeChapterList_ReturnsRefs(t *testing.T) { + s := newIntegrationScraper(t) + + ctx, cancel := context.WithTimeout(context.Background(), 60*time.Second) + defer cancel() + + refs, err := s.ScrapeChapterList(ctx, integrationBookURL) + if err != nil { + t.Fatalf("ScrapeChapterList failed: %v", err) + } + + t.Logf("total refs returned: %d", len(refs)) + + if len(refs) == 0 { + t.Fatal("ScrapeChapterList returned 0 refs") + } + + // Every ref must have a non-empty URL pointing at the correct book. 
+ for i, ref := range refs { + if ref.URL == "" { + t.Errorf("refs[%d].URL is empty", i) + } + if !strings.Contains(ref.URL, integrationBookSlug) { + t.Errorf("refs[%d].URL %q does not contain book slug", i, ref.URL) + } + if ref.Number <= 0 { + t.Errorf("refs[%d].Number = %d, want > 0 (URL: %s)", i, ref.Number, ref.URL) + } + if ref.Title == "" { + t.Errorf("refs[%d].Title is empty (URL: %s)", i, ref.URL) + } + } +} + +// TestIntegration_Novelfire_ScrapeChapterList_NumbersMatchURLs verifies the +// fix for the newest-first ordering bug: each ref's Number must equal the +// chapter number embedded in its URL, not its position in the list. +func TestIntegration_Novelfire_ScrapeChapterList_NumbersMatchURLs(t *testing.T) { + s := newIntegrationScraper(t) + + ctx, cancel := context.WithTimeout(context.Background(), 60*time.Second) + defer cancel() + + refs, err := s.ScrapeChapterList(ctx, integrationBookURL) + if err != nil { + t.Fatalf("ScrapeChapterList failed: %v", err) + } + if len(refs) == 0 { + t.Fatal("ScrapeChapterList returned 0 refs") + } + + mismatches := 0 + for i, ref := range refs { + wantNum := chapterNumberFromURL(ref.URL) + if wantNum <= 0 { + // URL has no parseable number — skip this entry. + continue + } + if ref.Number != wantNum { + t.Errorf("refs[%d]: Number=%d but URL %q implies number=%d (position-based bug?)", + i, ref.Number, ref.URL, wantNum) + mismatches++ + if mismatches >= 5 { + t.Log("… (further mismatches suppressed)") + break + } + } + } + + // Log the first few refs so failures are easy to diagnose. + limit := 5 + if len(refs) < limit { + limit = len(refs) + } + for i := 0; i < limit; i++ { + t.Logf("refs[%d]: Number=%d Title=%q URL=%s", i, refs[i].Number, refs[i].Title, refs[i].URL) + } +} + +// ── Chapters ────────────────────────────────────────────────────────────────── + +// TestIntegration_Novelfire_ScrapeFirst3Chapters scrapes chapters 1, 2, and 3 +// via ScrapeChapterText and verifies each returns non-empty markdown text. 
+// Chapters are run as sub-tests so a single failure does not abort the others. +func TestIntegration_Novelfire_ScrapeFirst3Chapters(t *testing.T) { + s := newIntegrationScraper(t) + + chapters := []scraper.ChapterRef{ + { + Number: 1, + Title: "Chapter 1", + URL: integrationBookURL + "/chapter-1", + }, + { + Number: 2, + Title: "Chapter 2", + URL: integrationBookURL + "/chapter-2", + }, + { + Number: 3, + Title: "Chapter 3", + URL: integrationBookURL + "/chapter-3", + }, + } + + for _, ref := range chapters { + ref := ref // capture + t.Run(fmt.Sprintf("chapter-%d", ref.Number), func(t *testing.T) { + // Sequential: each chapter needs its own generous timeout. + ctx, cancel := context.WithTimeout(context.Background(), 110*time.Second) + defer cancel() + + ch, err := s.ScrapeChapterText(ctx, ref) + if err != nil { + t.Fatalf("ScrapeChapterText failed: %v", err) + } + + t.Logf("chapter %d: %d bytes of markdown", ref.Number, len(ch.Text)) + t.Logf("first 300 chars:\n%s", truncateStr(ch.Text, 300)) + + // Ref fields must be echoed back unchanged. + if ch.Ref.Number != ref.Number { + t.Errorf("Ref.Number = %d, want %d", ch.Ref.Number, ref.Number) + } + if ch.Ref.URL != ref.URL { + t.Errorf("Ref.URL = %q, want %q", ch.Ref.URL, ref.URL) + } + + // Text must be non-trivially long. + if len(ch.Text) < 100 { + t.Errorf("Text too short (%d bytes) — likely empty or parsing failed:\n%s", + len(ch.Text), ch.Text) + } + + // Text must not contain raw HTML tags — NodeToMarkdown should have + // stripped them. + for _, tag := range []string{"Author Name author := htmlutil.ExtractFirst(root, scraper.Selector{Tag: "span", Class: "author"}) - // - cover := htmlutil.ExtractFirst(root, scraper.Selector{Tag: "img", Class: "cover", Attr: "src"}) + //

+ var cover string + if figureCover := htmlutil.FindFirst(root, scraper.Selector{Tag: "figure", Class: "cover"}); figureCover != nil { + cover = htmlutil.ExtractFirst(figureCover, scraper.Selector{Tag: "img", Attr: "src"}) + } // Ongoing status := htmlutil.ExtractFirst(root, scraper.Selector{Tag: "span", Class: "status"}) @@ -245,32 +252,41 @@ func (s *Scraper) ScrapeMetadata(ctx context.Context, bookURL string) (scraper.B func (s *Scraper) ScrapeChapterList(ctx context.Context, bookURL string) ([]scraper.ChapterRef, error) { var refs []scraper.ChapterRef - // Chapter list URL: {bookURL}/chapters - pageURL := strings.TrimRight(bookURL, "/") + "/chapters" + // Chapter list URL: {bookURL}/chapters?page=N + baseChapterURL := strings.TrimRight(bookURL, "/") + "/chapters" page := 1 - for pageURL != "" { + for { select { case <-ctx.Done(): return refs, ctx.Err() default: } + pageURL := fmt.Sprintf("%s?page=%d", baseChapterURL, page) s.log.Info("scraping chapter list", "page", page, "url", pageURL) s.log.Debug("chapter list fetch starting", "page", page, "payload_url", pageURL, "payload_wait_selector", ".chapter-list", - "payload_wait_selector_timeout_ms", 10000, - "payload_wait_for_timeout_ms", 10000, + "payload_wait_selector_timeout_ms", 15000, + "payload_wait_timeout_ms", 2000, + "strategy", s.urlClient.Strategy(), ) - raw, err := s.client.GetContent(ctx, browser.ContentRequest{ - URL: pageURL, - WaitFor: &browser.WaitForSelector{Selector: ".chapter-list", Timeout: 10000}, - WaitForTimeout: 10000, + raw, err := s.urlClient.GetContent(ctx, browser.ContentRequest{ + URL: pageURL, + // Wait up to 15 s for the chapter list container to appear in the DOM. + WaitFor: &browser.WaitForSelector{Selector: ".chapter-list", Timeout: 15000}, + // After the selector is found, wait an additional 2 s for any + // deferred JS rendering (lazy-loaded links, infinite-scroll hydration). 
+ WaitForTimeout: 2000, RejectResourceTypes: rejectResourceTypes, + GotoOptions: &browser.GotoOptions{Timeout: 60000}, + // Do NOT use BestAttempt — we want a complete page or a clear error, + // not silently partial HTML that looks like "no more chapters". + BestAttempt: false, }) if err != nil { s.log.Debug("chapter list fetch failed", @@ -293,10 +309,27 @@ func (s *Scraper) ScrapeChapterList(ctx context.Context, bookURL string) ([]scra chapterList := htmlutil.FindFirst(root, scraper.Selector{Class: "chapter-list"}) if chapterList == nil { + // No chapter list container on this page — we've gone past the last page. + s.log.Debug("chapter list container not found, stopping pagination", "page", page) break } + // Each chapter row:
  • Title
  • items := htmlutil.FindAll(chapterList, scraper.Selector{Tag: "li"}) + + s.log.Debug("chapter list page parsed", + "page", page, + "url", pageURL, + "chapters_on_page", len(items), + "total_refs_so_far", len(refs), + ) + + // Zero items on this page means we've gone past the last page. + if len(items) == 0 { + s.log.Debug("no chapters on page, stopping pagination", "page", page) + break + } + for _, item := range items { linkNode := htmlutil.FindFirst(item, scraper.Selector{Tag: "a"}) if linkNode == nil { @@ -308,7 +341,15 @@ func (s *Scraper) ScrapeChapterList(ctx context.Context, bookURL string) ([]scra continue } chURL := resolveURL(baseURL, href) - num := len(refs) + 1 + num := chapterNumberFromURL(chURL) + if num <= 0 { + // Fall back to position if the URL has no parseable number. + num = len(refs) + 1 + s.log.Warn("chapter number not parseable from URL, falling back to position", + "url", chURL, + "position", num, + ) + } refs = append(refs, scraper.ChapterRef{ Number: num, Title: strings.TrimSpace(chTitle), @@ -316,30 +357,134 @@ func (s *Scraper) ScrapeChapterList(ctx context.Context, bookURL string) ([]scra }) } - s.log.Debug("chapter list page parsed", - "page", page, - "url", pageURL, - "chapters_on_page", len(items), - "total_refs_so_far", len(refs), - ) - - // Next page:
    + var cover string + if fig := htmlutil.FindFirst(item, scraper.Selector{Tag: "figure", Class: "cover"}); fig != nil { + cover = htmlutil.ExtractFirst(fig, scraper.Selector{Tag: "img", Attr: "data-src"}) + if cover != "" { + cover = baseURL + cover + } + } + + // Title and URL:

    Title

    + titleNode := htmlutil.FindFirst(item, scraper.Selector{Tag: "h2", Class: "title"}) + var title, bookURL string + if titleNode != nil { + linkNode := htmlutil.FindFirst(titleNode, scraper.Selector{Tag: "a"}) + if linkNode != nil { + title = htmlutil.ExtractText(linkNode, scraper.Selector{}) + href := htmlutil.ExtractText(linkNode, scraper.Selector{Attr: "href"}) + bookURL = resolveURL(baseURL, href) + } + } + + // Status: Ongoing/Completed + status := htmlutil.ExtractFirst(item, scraper.Selector{Tag: "span", Class: "status"}) + + // Genres:
    Genre1Genre2...
    + var genres []string + categoriesNode := htmlutil.FindFirst(item, scraper.Selector{Tag: "div", Class: "categories"}) + if categoriesNode != nil { + genres = htmlutil.ExtractAll(categoriesNode, scraper.Selector{Tag: "span", Multiple: true}) + } + + slug := slugFromURL(bookURL) + + meta := scraper.BookMeta{ + Slug: slug, + Title: title, + Cover: cover, + Status: strings.TrimSpace(status), + Genres: genres, + SourceURL: bookURL, + Ranking: rank, + } + rank++ + + select { + case <-ctx.Done(): + return + case entries <- meta: + } + } + + // Next page - ranking pages use different pagination, just get first page for now + break + } + }() + + return entries, errs +} + // ─── ChapterTextProvider ───────────────────────────────────────────────────── // retryGetContent calls client.GetContent up to maxAttempts times, backing off // exponentially between retries. Only errors that look like transient Browserless -// 5xx responses (navigation timeouts, etc.) are retried; context cancellation and +// failures (timeouts, 5xx responses) are retried; context cancellation and // permanent errors are returned immediately. func retryGetContent( ctx context.Context, @@ -363,11 +508,6 @@ func retryGetContent( return "", err } - // Only retry on Browserless 5xx responses. 
- if !strings.Contains(err.Error(), "unexpected status 5") { - return "", err - } - if attempt < maxAttempts { log.Warn("chapter fetch failed, retrying", "url", req.URL, @@ -393,15 +533,15 @@ func (s *Scraper) ScrapeChapterText(ctx context.Context, ref scraper.ChapterRef) "title", ref.Title, "payload_url", ref.URL, "payload_wait_selector", "#content", - "payload_wait_selector_timeout_ms", 75000, - "payload_wait_for_timeout_ms", 75000, + "payload_wait_selector_timeout_ms", 5000, ) raw, err := retryGetContent(ctx, s.log, s.client, browser.ContentRequest{ URL: ref.URL, - WaitFor: &browser.WaitForSelector{Selector: "#content", Timeout: 75000}, - WaitForTimeout: 75000, + WaitFor: &browser.WaitForSelector{Selector: "#content", Timeout: 5000}, RejectResourceTypes: rejectResourceTypes, + GotoOptions: &browser.GotoOptions{Timeout: 60000}, + BestAttempt: true, }, 9, 6*time.Second) if err != nil { s.log.Debug("chapter text fetch failed", @@ -411,6 +551,18 @@ func (s *Scraper) ScrapeChapterText(ctx context.Context, ref scraper.ChapterRef) ) return scraper.Chapter{}, fmt.Errorf("chapter %d fetch: %w", ref.Number, err) } + if len(raw) > 0 { + preview := raw + if len(preview) > 500 { + preview = preview[:500] + } + s.log.Debug("chapter text fetch partial content", + "chapter", ref.Number, + "url", ref.URL, + "response_bytes", len(raw), + "preview", preview, + ) + } s.log.Debug("chapter text fetch completed", "chapter", ref.Number, "url", ref.URL, @@ -484,3 +636,30 @@ func parseChapterCount(s string) int { n, _ := strconv.Atoi(fields[0]) return n } + +// chapterNumberFromURL extracts the chapter number from a novelfire chapter URL. +// +// URL pattern: https://novelfire.net/book/{book-slug}/chapter-{N} +// The last path segment is expected to be "chapter-{N}" or "{N}". +// Returns 0 if no number can be parsed. +func chapterNumberFromURL(chapterURL string) int { + u, err := url.Parse(chapterURL) + if err != nil { + return 0 + } + seg := path.Base(u.Path) // e.g. 
"chapter-42" or "42" + // Strip a "chapter-" prefix if present. + seg = strings.TrimPrefix(seg, "chapter-") + // Also handle "chap-", "ch-" variants used by some sites. + seg = strings.TrimPrefix(seg, "chap-") + seg = strings.TrimPrefix(seg, "ch-") + // Take only the leading digits (handles slugs like "42-title-text"). + digits := strings.FieldsFunc(seg, func(r rune) bool { + return r < '0' || r > '9' + }) + if len(digits) == 0 { + return 0 + } + n, _ := strconv.Atoi(digits[0]) + return n +} diff --git a/scraper/internal/novelfire/scraper_test.go b/scraper/internal/novelfire/scraper_test.go new file mode 100644 index 0000000..7d94e6b --- /dev/null +++ b/scraper/internal/novelfire/scraper_test.go @@ -0,0 +1,217 @@ +package novelfire + +import ( + "context" + "strings" + "testing" + + "github.com/libnovel/scraper/internal/browser" + "github.com/libnovel/scraper/internal/scraper" +) + +// ── stub browser client ─────────────────────────────────────────────────────── + +// stubClient is a BrowserClient that returns a fixed HTML string for every +// GetContent call. ScrapePage and CDPSession are not used by these tests. +type stubClient struct { + html string +} + +func (s *stubClient) Strategy() browser.Strategy { return browser.StrategyContent } + +func (s *stubClient) GetContent(_ context.Context, _ browser.ContentRequest) (string, error) { + return s.html, nil +} + +func (s *stubClient) ScrapePage(_ context.Context, _ browser.ScrapeRequest) (browser.ScrapeResponse, error) { + return browser.ScrapeResponse{}, nil +} + +func (s *stubClient) CDPSession(_ context.Context, _ string, _ browser.CDPSessionFunc) error { + return nil +} + +// pagedStubClient returns a different HTML response for each successive call. +// Once all pages are exhausted it returns an empty page (no chapter-list), +// simulating the paginated chapter-list endpoint terminating correctly. 
+type pagedStubClient struct { + pages []string + call int +} + +func (c *pagedStubClient) Strategy() browser.Strategy { return browser.StrategyContent } + +func (c *pagedStubClient) GetContent(_ context.Context, _ browser.ContentRequest) (string, error) { + if c.call < len(c.pages) { + html := c.pages[c.call] + c.call++ + return html, nil + } + // Past the last page — return a page with no chapter-list to stop pagination. + return `
    `, nil +} + +func (c *pagedStubClient) ScrapePage(_ context.Context, _ browser.ScrapeRequest) (browser.ScrapeResponse, error) { + return browser.ScrapeResponse{}, nil +} + +func (c *pagedStubClient) CDPSession(_ context.Context, _ string, _ browser.CDPSessionFunc) error { + return nil +} + +// ── helpers ─────────────────────────────────────────────────────────────────── + +func newScraper(html string) *Scraper { + return New(&stubClient{html: html}, nil, &stubClient{html: html}) +} + +func newPagedScraper(pages ...string) *Scraper { + urlClient := &pagedStubClient{pages: pages} + return New(&stubClient{}, nil, urlClient) +} + +// ── ScrapeChapterText ───────────────────────────────────────────────────────── + +func TestScrapeChapterText_ExtractsInnerText(t *testing.T) { + html := ` +
    +

    It was a dark and stormy night.

    +

    The hero stepped forward.

    +
    + ` + + s := newScraper(html) + ref := scraper.ChapterRef{Number: 1, Title: "Chapter 1", URL: "https://novelfire.net/book/test-novel/chapter-1"} + + ch, err := s.ScrapeChapterText(context.Background(), ref) + if err != nil { + t.Fatalf("unexpected error: %v", err) + } + if ch.Ref.Number != 1 { + t.Errorf("expected chapter number 1, got %d", ch.Ref.Number) + } + if !strings.Contains(ch.Text, "dark and stormy") { + t.Errorf("expected chapter text to contain 'dark and stormy', got: %q", ch.Text) + } + if !strings.Contains(ch.Text, "hero stepped forward") { + t.Errorf("expected chapter text to contain 'hero stepped forward', got: %q", ch.Text) + } +} + +func TestScrapeChapterText_MissingContainer(t *testing.T) { + html := `
    nothing here
    ` + + s := newScraper(html) + ref := scraper.ChapterRef{Number: 2, Title: "Chapter 2", URL: "https://novelfire.net/book/test-novel/chapter-2"} + + _, err := s.ScrapeChapterText(context.Background(), ref) + if err == nil { + t.Fatal("expected an error when #content container is missing, got nil") + } +} + +// ── chapterNumberFromURL ────────────────────────────────────────────────────── + +func TestChapterNumberFromURL(t *testing.T) { + cases := []struct { + url string + want int + }{ + // Standard novelfire pattern. + {"https://novelfire.net/book/a-dragon-against-the-whole-world/chapter-1", 1}, + {"https://novelfire.net/book/a-dragon-against-the-whole-world/chapter-26", 26}, + {"https://novelfire.net/book/a-dragon-against-the-whole-world/chapter-58", 58}, + // Large chapter numbers. + {"https://novelfire.net/book/some-novel/chapter-1000", 1000}, + // Path segment with trailing slash. + {"https://novelfire.net/book/some-novel/chapter-5/", 5}, + // Slug with title appended after the number (hypothetical future format). + {"https://novelfire.net/book/some-novel/chapter-42-the-battle", 42}, + // Unparseable — should return 0 so the caller can fall back. + {"https://novelfire.net/book/some-novel/prologue", 0}, + {"https://novelfire.net/book/some-novel/", 0}, + {"not-a-url", 0}, + } + + for _, tc := range cases { + got := chapterNumberFromURL(tc.url) + if got != tc.want { + t.Errorf("chapterNumberFromURL(%q) = %d, want %d", tc.url, got, tc.want) + } + } +} + +// ── ScrapeChapterList (position vs URL numbering) ───────────────────────────── + +// TestScrapeChapterList_NumbersFromURL verifies that when the chapter list HTML +// is served newest-first (as novelfire.net does), chapter numbers are still +// assigned from the URL — not from list position — so that a re-run correctly +// identifies which chapters are already on disk. +func TestScrapeChapterList_NumbersFromURL(t *testing.T) { + // Simulate a newest-first chapter list with 5 chapters on a single page. 
+ // Positions 1..5 correspond to chapters 5,4,3,2,1 in the site HTML. + page1 := ` + + ` + + s := newPagedScraper(page1) + refs, err := s.ScrapeChapterList(context.Background(), "https://novelfire.net/book/test") + if err != nil { + t.Fatalf("unexpected error: %v", err) + } + if len(refs) != 5 { + t.Fatalf("expected 5 refs, got %d", len(refs)) + } + + // With position-based numbering (the old bug), refs[0].Number would be 1 + // even though its URL is /chapter-5. With URL-based numbering it must be 5. + wantNumbers := []int{5, 4, 3, 2, 1} + for i, ref := range refs { + if ref.Number != wantNumbers[i] { + t.Errorf("refs[%d].Number = %d, want %d (URL: %s)", i, ref.Number, wantNumbers[i], ref.URL) + } + } +} + +// TestScrapeChapterList_Pagination verifies that the scraper correctly follows +// ?page=N pagination and stops when a page returns no chapter items. +func TestScrapeChapterList_Pagination(t *testing.T) { + page1 := ` + + ` + + page2 := ` + + ` + + // page3 is omitted — pagedStubClient will return empty page to stop pagination. + s := newPagedScraper(page1, page2) + refs, err := s.ScrapeChapterList(context.Background(), "https://novelfire.net/book/test") + if err != nil { + t.Fatalf("unexpected error: %v", err) + } + if len(refs) != 6 { + t.Fatalf("expected 6 refs (3 per page × 2 pages), got %d", len(refs)) + } + + wantNumbers := []int{3, 2, 1, 6, 5, 4} + for i, ref := range refs { + if ref.Number != wantNumbers[i] { + t.Errorf("refs[%d].Number = %d, want %d (URL: %s)", i, ref.Number, wantNumbers[i], ref.URL) + } + } +} diff --git a/scraper/internal/scraper/interfaces.go b/scraper/internal/scraper/interfaces.go index cac8367..d98ec6a 100644 --- a/scraper/internal/scraper/interfaces.go +++ b/scraper/internal/scraper/interfaces.go @@ -27,6 +27,8 @@ type BookMeta struct { TotalChapters int `yaml:"total_chapters,omitempty"` // SourceURL is the canonical URL of the book's landing page. 
SourceURL string `yaml:"source_url"` + // Ranking is the rank number from ranking pages. + Ranking int `yaml:"ranking,omitempty"` } // CatalogueEntry is a lightweight reference returned by CatalogueProvider. @@ -108,6 +110,13 @@ type ChapterTextProvider interface { ScrapeChapterText(ctx context.Context, ref ChapterRef) (Chapter, error) } +// RankingProvider can enumerate novels from a ranking page. +type RankingProvider interface { + // ScrapeRanking pages through the ranking list, sending BookMeta values + // (with basic info like title, cover, genres, status, sourceURL) to the returned channel. + ScrapeRanking(ctx context.Context) (<-chan BookMeta, <-chan error) +} + // NovelScraper is the full interface that a concrete novel source must implement. // It composes all four provider interfaces. type NovelScraper interface { @@ -115,6 +124,7 @@ type NovelScraper interface { MetadataProvider ChapterListProvider ChapterTextProvider + RankingProvider // SourceName returns the human-readable name of this scraper, e.g. "novelfire.net". SourceName() string diff --git a/scraper/internal/server/server.go b/scraper/internal/server/server.go index 0ae7d26..68105ae 100644 --- a/scraper/internal/server/server.go +++ b/scraper/internal/server/server.go @@ -13,6 +13,7 @@ import ( "fmt" "log/slog" "net/http" + "strconv" "sync" "time" @@ -23,23 +24,27 @@ import ( // Server wraps an HTTP mux with the scraping endpoints. type Server struct { - addr string - oCfg orchestrator.Config - novel scraper.NovelScraper - log *slog.Logger - writer *writer.Writer - mu sync.Mutex - running bool + addr string + oCfg orchestrator.Config + novel scraper.NovelScraper + log *slog.Logger + writer *writer.Writer + mu sync.Mutex + running bool + kokoroURL string // Kokoro-FastAPI base URL, e.g. http://kokoro:8880 + kokoroVoice string // default voice, e.g. af_bella } // New creates a new Server. 
-func New(addr string, oCfg orchestrator.Config, novel scraper.NovelScraper, log *slog.Logger) *Server { +func New(addr string, oCfg orchestrator.Config, novel scraper.NovelScraper, log *slog.Logger, kokoroURL, kokoroVoice string) *Server { return &Server{ - addr: addr, - oCfg: oCfg, - novel: novel, - log: log, - writer: writer.New(oCfg.StaticRoot), + addr: addr, + oCfg: oCfg, + novel: novel, + log: log, + writer: writer.New(oCfg.StaticRoot), + kokoroURL: kokoroURL, + kokoroVoice: kokoroVoice, } } @@ -52,16 +57,21 @@ func (s *Server) ListenAndServe(ctx context.Context) error { mux.HandleFunc("POST /scrape/book", s.handleScrapeBook) // UI routes mux.HandleFunc("GET /", s.handleHome) + mux.HandleFunc("GET /ranking", s.handleRanking) + mux.HandleFunc("POST /ranking/refresh", s.handleRankingRefresh) + mux.HandleFunc("GET /ranking/view", s.handleRankingView) mux.HandleFunc("GET /books/{slug}", s.handleBook) mux.HandleFunc("GET /books/{slug}/chapters/{n}", s.handleChapter) mux.HandleFunc("POST /ui/scrape/book", s.handleUIScrapeBook) mux.HandleFunc("GET /ui/scrape/status", s.handleUIScrapeStatus) + // Plain-text chapter content for browser-side TTS + mux.HandleFunc("GET /ui/chapter-text/{slug}/{n}", s.handleChapterText) srv := &http.Server{ Addr: s.addr, Handler: mux, ReadTimeout: 15 * time.Second, - WriteTimeout: 15 * time.Second, + WriteTimeout: 60 * time.Second, IdleTimeout: 60 * time.Second, } @@ -85,6 +95,25 @@ func (s *Server) handleHealth(w http.ResponseWriter, _ *http.Request) { _ = json.NewEncoder(w).Encode(map[string]string{"status": "ok"}) } +// handleChapterText returns the plain text of a chapter (markdown stripped) +// for browser-side TTS. The browser POSTs this directly to Kokoro-FastAPI. 
+func (s *Server) handleChapterText(w http.ResponseWriter, r *http.Request) { + slug := r.PathValue("slug") + n, err := strconv.Atoi(r.PathValue("n")) + if err != nil || n < 1 { + http.NotFound(w, r) + return + } + raw, err := s.writer.ReadChapter(slug, n) + if err != nil { + http.NotFound(w, r) + return + } + w.Header().Set("Content-Type", "text/plain; charset=utf-8") + w.Header().Set("Cache-Control", "no-store") + fmt.Fprint(w, stripMarkdown(raw)) +} + func (s *Server) handleScrapeCatalogue(w http.ResponseWriter, r *http.Request) { cfg := s.oCfg cfg.SingleBookURL = "" // full catalogue diff --git a/scraper/internal/server/ui.go b/scraper/internal/server/ui.go new file mode 100644 index 0000000..b9565b0 --- /dev/null +++ b/scraper/internal/server/ui.go @@ -0,0 +1,1331 @@ +package server + +import ( + "bytes" + "context" + "fmt" + "html/template" + "net/http" + "regexp" + "strconv" + "strings" + "time" + + "github.com/libnovel/scraper/internal/orchestrator" + "github.com/libnovel/scraper/internal/writer" + "github.com/yuin/goldmark" + "github.com/yuin/goldmark/extension" + goldhtml "github.com/yuin/goldmark/renderer/html" +) + +// md is the shared goldmark instance used for all markdown→HTML conversions. 
+var md = goldmark.New( + goldmark.WithExtensions(extension.Typographer, extension.Table), + goldmark.WithRendererOptions(goldhtml.WithUnsafe()), +) + +// kokoroVoices is the full list of voices shipped with Kokoro-FastAPI, +// grouped loosely by language prefix: +// +// af_ / am_ American English female / male +// bf_ / bm_ British English female / male +// ef_ / em_ Spanish female / male +// ff_ French female +// hf_ / hm_ Hindi female / male +// if_ / im_ Italian female / male +// jf_ / jm_ Japanese female / male +// pf_ / pm_ Portuguese female / male +// zf_ / zm_ Chinese female / male +var kokoroVoices = []string{ + // American English + "af_alloy", "af_aoede", "af_bella", "af_heart", "af_jadzia", + "af_jessica", "af_kore", "af_nicole", "af_nova", "af_river", + "af_sarah", "af_sky", + "am_adam", "am_echo", "am_eric", "am_fenrir", "am_liam", + "am_michael", "am_onyx", "am_puck", + // British English + "bf_alice", "bf_emma", "bf_lily", + "bm_daniel", "bm_fable", "bm_george", "bm_lewis", + // Spanish + "ef_dora", "em_alex", + // French + "ff_siwis", + // Hindi + "hf_alpha", "hf_beta", "hm_omega", "hm_psi", + // Italian + "if_sara", "im_nicola", + // Japanese + "jf_alpha", "jf_gongitsune", "jf_nezumi", "jf_tebukuro", "jm_kumo", + // Portuguese + "pf_dora", "pm_alex", + // Chinese + "zf_xiaobei", "zf_xiaoni", "zf_xiaoxiao", "zf_xiaoyi", + "zm_yunjian", "zm_yunxi", "zm_yunxia", "zm_yunyang", +} + +// ─── shared layout ──────────────────────────────────────────────────────────── + +const layoutHead = ` + + + + + {{.Title}} — libnovel + + + + +` + +const layoutFoot = `` + +func renderPage(w http.ResponseWriter, title, body string) { + t := template.Must(template.New("layout").Parse(layoutHead + body + layoutFoot)) + w.Header().Set("Content-Type", "text/html; charset=utf-8") + _ = t.Execute(w, struct{ Title string }{Title: title}) +} + +func renderFragment(w http.ResponseWriter, body string) { + w.Header().Set("Content-Type", "text/html; charset=utf-8") + fmt.Fprint(w, 
body) +} + +func isHTMX(r *http.Request) bool { + return r.Header.Get("HX-Request") == "true" +} + +// respond writes either a full page or an HTMX fragment depending on the request. +func (s *Server) respond(w http.ResponseWriter, r *http.Request, title, fragment string) { + if isHTMX(r) { + renderFragment(w, fragment) + return + } + renderPage(w, title, + `
    `+fragment+`
    `) +} + +// ─── GET / — book catalogue ─────────────────────────────────────────────────── + +const homeTmpl = ` +
    +
    +

    libnovel

    + Browse Rankings +
    +

    {{len .Books}} book{{if ne (len .Books) 1}}s{{end}} on disk

    + + +
    +

    Scrape a new book

    +
    + + +
    +
    +
    + + + +
    ` + +func (s *Server) handleHome(w http.ResponseWriter, r *http.Request) { + if r.URL.Path != "/" { + http.NotFound(w, r) + return + } + + books, err := s.writer.ListBooks() + if err != nil { + http.Error(w, "failed to list books: "+err.Error(), http.StatusInternalServerError) + return + } + + t := template.Must(template.New("home").Parse(homeTmpl)) + var buf bytes.Buffer + _ = t.Execute(&buf, struct{ Books interface{} }{Books: books}) + + s.respond(w, r, "Home", buf.String()) +} + +// ─── GET /ranking — ranking page ─────────────────────────────────────────────── + +const rankingTmpl = ` +
    + + ← All books + + +
    +
    +

    Novel Rankings

    +

    Top novels from novelfire.net

    + {{if .CachedAt}}

    Cached {{.CachedAt}}

    {{end}} +
    +
    + + View Markdown + + +
    +
    + + +
    + {{range .Books}} + {{if .Local}} + {{/* Book is in local library — wrap entire card in a clickable link */}} + +
    + {{if .Cover}} + cover + {{end}} +
    +
    + {{if .Rank}}#{{.Rank}}{{end}} +

    {{.Title}}

    + In library +
    + {{if .Author}}

    {{.Author}}

    {{end}} +
    + {{if .Status}}{{.Status}}{{end}} +
    + {{if .Genres}} +
    + {{range .Genres}}{{.}}{{end}} +
    + {{end}} +
    +
    +
    + {{else}} + {{/* Book not yet in local library */}} +
    +
    + {{if .Cover}} + cover + {{end}} +
    +
    + {{if .Rank}}#{{.Rank}}{{end}} +

    {{.Title}}

    +
    + {{if .Author}}

    {{.Author}}

    {{end}} +
    + {{if .Status}}{{.Status}}{{end}} +
    + {{if .Genres}} +
    + {{range .Genres}}{{.}}{{end}} +
    + {{end}} + {{if .SourceURL}} +
    +
    + + +
    +
    + {{end}} +
    +
    +
    + {{end}} + {{else}} +

    No ranking data available. Click "Refresh Rankings" to fetch from novelfire.net.

    + {{end}} +
    +
    ` + +// rankingViewItem enriches a RankingItem with whether it is present in the +// local book library, so the template can highlight it differently. +type rankingViewItem struct { + writer.RankingItem + Local bool +} + +// toRankingViewItems annotates items with Local=true for slugs found in localSlugs. +func toRankingViewItems(items []writer.RankingItem, localSlugs map[string]bool) []rankingViewItem { + out := make([]rankingViewItem, len(items)) + for i, it := range items { + out[i] = rankingViewItem{ + RankingItem: it, + Local: localSlugs[it.Slug], + } + } + return out +} + +// handleRanking serves the ranking page from the cached ranking.md file. +// It does NOT trigger a live scrape; use POST /ranking/refresh for that. +func (s *Server) handleRanking(w http.ResponseWriter, r *http.Request) { + rankingItems, err := s.writer.ReadRankingItems() + if err != nil { + s.log.Error("failed to read cached ranking", "err", err) + } + + cachedAt := "" + if info, statErr := s.writer.RankingFileInfo(); statErr == nil { + cachedAt = info.ModTime().Format("Jan 2, 2006 at 15:04") + } + + t := template.Must(template.New("ranking").Parse(rankingTmpl)) + var buf bytes.Buffer + _ = t.Execute(&buf, struct { + Books interface{} + CachedAt string + }{Books: toRankingViewItems(rankingItems, s.writer.LocalSlugs()), CachedAt: cachedAt}) + s.respond(w, r, "Rankings", buf.String()) +} + +// handleRankingRefresh triggers a live scrape of novelfire.net/ranking, +// persists the result to ranking.md, then re-renders the ranking page. 
+func (s *Server) handleRankingRefresh(w http.ResponseWriter, r *http.Request) { + ctx, cancel := context.WithTimeout(r.Context(), 60*time.Second) + defer cancel() + + rankingCh, errCh := s.novel.ScrapeRanking(ctx) + + var rankingItems []writer.RankingItem + for { + select { + case meta, ok := <-rankingCh: + if !ok { + rankingCh = nil + continue + } + rankingItems = append(rankingItems, writer.RankingItem{ + Rank: meta.Ranking, + Slug: meta.Slug, + Title: meta.Title, + Author: meta.Author, + Cover: meta.Cover, + Status: meta.Status, + Genres: meta.Genres, + SourceURL: meta.SourceURL, + }) + case err, ok := <-errCh: + if !ok { + errCh = nil + continue + } + if err != nil { + s.log.Error("ranking scrape error", "err", err) + } + } + + if rankingCh == nil && errCh == nil { + break + } + } + + if len(rankingItems) > 0 { + if err := s.writer.WriteRanking(rankingItems); err != nil { + s.log.Error("failed to save ranking", "err", err) + } + } + + cachedAt := "" + if info, statErr := s.writer.RankingFileInfo(); statErr == nil { + cachedAt = info.ModTime().Format("Jan 2, 2006 at 15:04") + } + + t := template.Must(template.New("ranking").Parse(rankingTmpl)) + var buf bytes.Buffer + _ = t.Execute(&buf, struct { + Books interface{} + CachedAt string + }{Books: toRankingViewItems(rankingItems, s.writer.LocalSlugs()), CachedAt: cachedAt}) + s.respond(w, r, "Rankings", buf.String()) +} + +// ─── GET /ranking/view — view ranking markdown ───────────────────────────────── + +const rankingViewTmpl = ` +
    + + ← Back to Rankings + + +

    Ranking Data

    + +
    + {{.HTML}} +
    +
    ` + +func (s *Server) handleRankingView(w http.ResponseWriter, r *http.Request) { + markdown, err := s.writer.ReadRanking() + if err != nil { + http.Error(w, "failed to read ranking: "+err.Error(), http.StatusInternalServerError) + return + } + if markdown == "" { + http.NotFound(w, r) + return + } + + var htmlBuf bytes.Buffer + if err := md.Convert([]byte(markdown), &htmlBuf); err != nil { + http.Error(w, "markdown render error: "+err.Error(), http.StatusInternalServerError) + return + } + + t := template.Must(template.New("rankingView").Parse(rankingViewTmpl)) + var buf bytes.Buffer + _ = t.Execute(&buf, struct{ HTML template.HTML }{HTML: template.HTML(htmlBuf.String())}) + + s.respond(w, r, "Ranking Data", buf.String()) +} + +// ─── GET /books/{slug} — chapter list ──────────────────────────────────────── + +const bookTmpl = ` +
    + + ← All books + + +
    + {{if .Meta.Cover}} + cover + {{end}} +
    +
    +

    {{.Meta.Title}}

    + {{if .Meta.SourceURL}} +
    + + +
    + {{end}} +
    + {{if .Meta.Author}}

    {{.Meta.Author}}

    {{end}} +
    + {{if .Meta.Status}}{{.Meta.Status}}{{end}} + {{if .Meta.TotalChapters}}{{.Meta.TotalChapters}} ch total{{end}} + {{len .Chapters}} downloaded +
    + {{if .Meta.Summary}} +

    {{.Meta.Summary}}

    + {{end}} +
    +
    + +

    Chapters

    + +
    ` + +func (s *Server) handleBook(w http.ResponseWriter, r *http.Request) { + slug := r.PathValue("slug") + + meta, ok, err := s.writer.ReadMetadata(slug) + if err != nil { + http.Error(w, "failed to read metadata: "+err.Error(), http.StatusInternalServerError) + return + } + if !ok { + http.NotFound(w, r) + return + } + + chapters, err := s.writer.ListChapters(slug) + if err != nil { + http.Error(w, "failed to list chapters: "+err.Error(), http.StatusInternalServerError) + return + } + + t := template.Must(template.New("book").Parse(bookTmpl)) + var buf bytes.Buffer + _ = t.Execute(&buf, struct { + Slug string + Meta interface{} + Chapters interface{} + }{Slug: slug, Meta: meta, Chapters: chapters}) + + s.respond(w, r, meta.Title, buf.String()) +} + +// ─── GET /books/{slug}/chapters/{n} — chapter reader ───────────────────────── + +const chapterTmpl = ` +
    +
    + + ← Chapter list + +
    + {{if .PrevN}} + + ← Prev + + {{end}} + {{if .NextN}} + + Next → + + {{end}} +
    +
    + + +
    +
    + + + + + + + + +
    + Speed + + 1.0× +
    + +
    + + + +
    + +
    + + +
    + {{.HTML}} +
    + +
    + {{if .PrevN}} + + ← Previous chapter + + {{else}}{{end}} + {{if .NextN}} + + Next chapter → + + {{else}}{{end}} +
    +
    + + + +` + +func (s *Server) handleChapter(w http.ResponseWriter, r *http.Request) { + slug := r.PathValue("slug") + n, err := strconv.Atoi(r.PathValue("n")) + if err != nil || n < 1 { + http.NotFound(w, r) + return + } + + raw, err := s.writer.ReadChapter(slug, n) + if err != nil { + http.NotFound(w, r) + return + } + + var htmlBuf bytes.Buffer + if err := md.Convert([]byte(raw), &htmlBuf); err != nil { + http.Error(w, "markdown render error: "+err.Error(), http.StatusInternalServerError) + return + } + + chapters, _ := s.writer.ListChapters(slug) + prevN, nextN := adjacentChapters(chapters, n) + + title := firstHeading(raw, fmt.Sprintf("Chapter %d", n)) + + t := template.Must(template.New("chapter").Parse(chapterTmpl)) + var buf bytes.Buffer + _ = t.Execute(&buf, struct { + Slug string + HTML template.HTML + PrevN int + NextN int + ChapterN int + KokoroURL string + Voices []string + DefaultVoice string + }{ + Slug: slug, + HTML: template.HTML(htmlBuf.String()), + PrevN: prevN, + NextN: nextN, + ChapterN: n, + KokoroURL: s.kokoroURL, + Voices: kokoroVoices, + DefaultVoice: s.kokoroVoice, + }) + + s.respond(w, r, title, buf.String()) +} + +// ─── helpers ────────────────────────────────────────────────────────────────── + +// stripMarkdown removes Markdown syntax and returns clean plain text. 
+func stripMarkdown(src string) string { + src = regexp.MustCompile(`(?m)^#{1,6}\s+`).ReplaceAllString(src, "") + src = regexp.MustCompile(`\*{1,3}|_{1,3}`).ReplaceAllString(src, "") + src = regexp.MustCompile("(?s)```.*?```").ReplaceAllString(src, "") + src = regexp.MustCompile("`[^`]*`").ReplaceAllString(src, "") + src = regexp.MustCompile(`\[([^\]]+)\]\([^)]+\)`).ReplaceAllString(src, "$1") + src = regexp.MustCompile(`!\[[^\]]*\]\([^)]+\)`).ReplaceAllString(src, "") + src = regexp.MustCompile(`(?m)^>\s?`).ReplaceAllString(src, "") + src = regexp.MustCompile(`(?m)^[-*_]{3,}\s*$`).ReplaceAllString(src, "") + src = regexp.MustCompile(`\n{3,}`).ReplaceAllString(src, "\n\n") + return strings.TrimSpace(src) +} + +// adjacentChapters returns the chapter numbers immediately before and after n +// in the sorted chapters list. 0 means "does not exist". +func adjacentChapters(chapters []writer.ChapterInfo, n int) (prev, next int) { + for i, ch := range chapters { + if ch.Number == n { + if i > 0 { + prev = chapters[i-1].Number + } + if i < len(chapters)-1 { + next = chapters[i+1].Number + } + return + } + } + return +} + +// firstHeading returns the text of the first non-empty line, stripping a +// leading "# " markdown heading marker. Falls back to fallback. 
+func firstHeading(md, fallback string) string { + for _, line := range strings.SplitN(md, "\n", 20) { + line = strings.TrimSpace(line) + if line == "" { + continue + } + return strings.TrimPrefix(line, "# ") + } + return fallback +} + +// ─── POST /ui/scrape/book — form submission ─────────────────────────────────── + +func (s *Server) handleUIScrapeBook(w http.ResponseWriter, r *http.Request) { + bookURL := strings.TrimSpace(r.FormValue("url")) + if bookURL == "" { + renderFragment(w, scrapeStatusHTML("error", "Please enter a book URL.")) + return + } + + s.mu.Lock() + already := s.running + if !already { + s.running = true + } + s.mu.Unlock() + + if already { + renderFragment(w, scrapeStatusHTML("busy", "A scrape job is already running. Please wait.")) + return + } + + cfg := s.oCfg + cfg.SingleBookURL = bookURL + + go func() { + defer func() { + s.mu.Lock() + s.running = false + s.mu.Unlock() + }() + + ctx, cancel := context.WithTimeout(context.Background(), 24*time.Hour) + defer cancel() + + o := orchestrator.New(cfg, s.novel, s.log) + if err := o.Run(ctx); err != nil { + s.log.Error("UI scrape job failed", "url", bookURL, "err", err) + } + }() + + // Return a status badge that polls until the job finishes. + renderFragment(w, scrapeStatusHTML("running", "Scraping "+bookURL+"…")) +} + +// ─── GET /ui/scrape/status — polling endpoint ───────────────────────────────── + +func (s *Server) handleUIScrapeStatus(w http.ResponseWriter, r *http.Request) { + s.mu.Lock() + running := s.running + s.mu.Unlock() + + if running { + // Keep polling every 3 s while the job is in progress. + renderFragment(w, scrapeStatusHTML("running", "Scraping in progress…")) + return + } + // Job finished — show a done badge and stop polling. + renderFragment(w, scrapeStatusHTML("done", "Done! Refresh the page to see new books.")) +} + +// scrapeStatusHTML returns a self-contained status badge fragment. +// state is one of: "running" | "done" | "busy" | "error". 
+func scrapeStatusHTML(state, msg string) string { + var colour, dot, poll string + switch state { + case "running": + colour = "text-amber-300 bg-amber-950 border-amber-800" + dot = `` + poll = `hx-get="/ui/scrape/status" hx-trigger="every 3s" hx-target="this" hx-swap="outerHTML"` + case "done": + colour = "text-green-300 bg-green-950 border-green-800" + dot = `` + case "busy": + colour = "text-yellow-300 bg-yellow-950 border-yellow-800" + dot = `` + default: // error + colour = "text-red-300 bg-red-950 border-red-800" + dot = `` + } + return fmt.Sprintf( + `
    %s%s
    `, + colour, poll, dot, template.HTMLEscapeString(msg), + ) +} diff --git a/scraper/internal/writer/writer.go b/scraper/internal/writer/writer.go index a3092c1..167e0c2 100644 --- a/scraper/internal/writer/writer.go +++ b/scraper/internal/writer/writer.go @@ -19,6 +19,7 @@ import ( "fmt" "os" "path/filepath" + "regexp" "sort" "strconv" "strings" @@ -144,10 +145,32 @@ func (w *Writer) ListBooks() ([]scraper.BookMeta, error) { return books, nil } +// LocalSlugs returns the set of book slugs that have a metadata.yaml on disk. +// It is cheaper than ListBooks because it only checks for file existence rather +// than fully parsing every YAML file. +func (w *Writer) LocalSlugs() map[string]bool { + entries, err := os.ReadDir(w.root) + if err != nil { + return map[string]bool{} + } + slugs := make(map[string]bool, len(entries)) + for _, e := range entries { + if !e.IsDir() { + continue + } + metaPath := filepath.Join(w.root, e.Name(), "metadata.yaml") + if _, err := os.Stat(metaPath); err == nil { + slugs[e.Name()] = true + } + } + return slugs +} + // ChapterInfo is a lightweight chapter descriptor derived from on-disk files. type ChapterInfo struct { Number int - Title string // first line of the markdown file (without the leading "# ") + Title string // chapter name, cleaned of number prefix and trailing date + Date string // relative date scraped alongside the title, e.g. "1 year ago" } // ListChapters returns all chapters on disk for slug, sorted by number. 
@@ -171,8 +194,8 @@ func (w *Writer) ListChapters(slug string) ([]ChapterInfo, error) { if err != nil { continue } - title := chapterTitle(f, n) - chapters = append(chapters, ChapterInfo{Number: n, Title: title}) + title, date := chapterTitle(f, n) + chapters = append(chapters, ChapterInfo{Number: n, Title: title, Date: date}) } } } @@ -184,19 +207,55 @@ func (w *Writer) ListChapters(slug string) ([]ChapterInfo, error) { // chapterTitle reads the first non-empty line of a markdown file and strips // the leading "# " heading marker. Falls back to "Chapter N". -func chapterTitle(path string, n int) string { +func chapterTitle(path string, n int) (title, date string) { data, err := os.ReadFile(path) if err != nil { - return fmt.Sprintf("Chapter %d", n) + return fmt.Sprintf("Chapter %d", n), "" } for _, line := range strings.SplitN(string(data), "\n", 10) { line = strings.TrimSpace(line) if line == "" { continue } - return strings.TrimPrefix(line, "# ") + line = strings.TrimPrefix(line, "# ") + return splitChapterTitle(line) } - return fmt.Sprintf("Chapter %d", n) + return fmt.Sprintf("Chapter %d", n), "" +} + +// splitChapterTitle separates the human-readable chapter name from the +// trailing relative-date string that novelfire.net appends to the heading. +// Examples of raw heading text (after stripping "# "): +// +// "1 Chapter 1 - 1: The Academy's Weakest1 year ago" +// "2 Chapter 2 - Enter the Storm3 months ago" +// +// The pattern is: optional leading number+whitespace, then the real title, +// then a date that matches /\d+\s+(second|minute|hour|day|week|month|year)s?\s+ago$/ +func splitChapterTitle(raw string) (title, date string) { + // Strip a leading chapter-number index that novelfire sometimes prepends. + // It looks like "1 " or "12 " at the very start. 
+ raw = strings.TrimSpace(raw) + if idx := strings.IndexFunc(raw, func(r rune) bool { return r == ' ' || r == '\t' }); idx > 0 { + prefix := raw[:idx] + allDigit := true + for _, c := range prefix { + if c < '0' || c > '9' { + allDigit = false + break + } + } + if allDigit { + raw = strings.TrimSpace(raw[idx:]) + } + } + + // Match a trailing relative date: " [s] ago" + dateRe := regexp.MustCompile(`\s*(\d+\s+(?:second|minute|hour|day|week|month|year)s?\s+ago)\s*$`) + if m := dateRe.FindStringSubmatchIndex(raw); m != nil { + return strings.TrimSpace(raw[:m[0]]), strings.TrimSpace(raw[m[2]:m[3]]) + } + return raw, "" } // ReadChapter returns the raw markdown content for chapter number n of slug. @@ -211,6 +270,139 @@ func (w *Writer) ReadChapter(slug string, n int) (string, error) { return string(data), nil } +// ─── Ranking ───────────────────────────────────────────────────────────────── + +// RankingItem represents a single entry in the ranking. +type RankingItem struct { + Rank int `yaml:"rank"` + Slug string `yaml:"slug"` + Title string `yaml:"title"` + Author string `yaml:"author,omitempty"` + Cover string `yaml:"cover,omitempty"` + Status string `yaml:"status,omitempty"` + Genres []string `yaml:"genres,omitempty"` + SourceURL string `yaml:"source_url,omitempty"` +} + +// WriteRanking saves the ranking items as markdown to static/ranking.md. 
+func (w *Writer) WriteRanking(items []RankingItem) error { + path := filepath.Clean(w.rankingPath()) + dir := filepath.Dir(path) + if err := os.MkdirAll(dir, 0o755); err != nil { + return fmt.Errorf("writer: mkdir %s: %w", dir, err) + } + + var sb strings.Builder + sb.WriteString("# Novel Rankings\n\n") + sb.WriteString("| Rank | Title | Cover | Status | Genres | URL |\n") + sb.WriteString("|------|-------|-------|--------|--------|-----|\n") + for _, item := range items { + genres := strings.Join(item.Genres, ", ") + if genres == "" { + genres = "-" + } + sb.WriteString(fmt.Sprintf("| %d | %s | %s | %s | %s | %s |\n", + item.Rank, item.Title, item.Cover, item.Status, genres, item.SourceURL)) + } + + if err := os.WriteFile(path, []byte(sb.String()), 0o644); err != nil { + return fmt.Errorf("writer: write ranking %s: %w", path, err) + } + return nil +} + +// ReadRanking reads the ranking.md file if it exists. +func (w *Writer) ReadRanking() (string, error) { + path := w.rankingPath() + data, err := os.ReadFile(path) + if err != nil { + if os.IsNotExist(err) { + return "", nil + } + return "", fmt.Errorf("writer: read ranking: %w", err) + } + return string(data), nil +} + +// ReadRankingItems parses ranking.md back into a slice of RankingItem. +// Returns nil slice (not an error) when the file does not exist yet. +func (w *Writer) ReadRankingItems() ([]RankingItem, error) { + markdown, err := w.ReadRanking() + if err != nil || markdown == "" { + return nil, err + } + + var items []RankingItem + for _, line := range strings.Split(markdown, "\n") { + // Only process data rows: start and end with '|', not header/separator rows. + line = strings.TrimSpace(line) + if !strings.HasPrefix(line, "|") || !strings.HasSuffix(line, "|") { + continue + } + // Strip leading/trailing '|' and split on '|'. 
+ inner := strings.TrimPrefix(strings.TrimSuffix(line, "|"), "|") + cols := strings.Split(inner, "|") + if len(cols) < 6 { + continue + } + for i, c := range cols { + cols[i] = strings.TrimSpace(c) + } + // Skip header row and separator row. + if cols[0] == "Rank" || strings.HasPrefix(cols[0], "---") { + continue + } + rank, err := strconv.Atoi(cols[0]) + if err != nil { + continue + } + title := cols[1] + cover := cols[2] + status := cols[3] + genresStr := cols[4] + sourceURL := cols[5] + + var genres []string + if genresStr != "-" && genresStr != "" { + for _, g := range strings.Split(genresStr, ",") { + g = strings.TrimSpace(g) + if g != "" { + genres = append(genres, g) + } + } + } + + // Derive slug from source URL (last path segment). + slug := "" + if sourceURL != "" { + parts := strings.Split(strings.TrimRight(sourceURL, "/"), "/") + if len(parts) > 0 { + slug = parts[len(parts)-1] + } + } + + items = append(items, RankingItem{ + Rank: rank, + Slug: slug, + Title: title, + Cover: cover, + Status: status, + Genres: genres, + SourceURL: sourceURL, + }) + } + return items, nil +} + +// RankingFileInfo returns os.FileInfo for the ranking.md file, if it exists. +func (w *Writer) RankingFileInfo() (os.FileInfo, error) { + return os.Stat(w.rankingPath()) +} + +func (w *Writer) rankingPath() string { + return filepath.Join(w.root, "ranking.md") +} + // bookDir returns the root directory for a book slug. func (w *Writer) bookDir(slug string) string { return filepath.Join(w.root, slug)