diff --git a/automation/app.py b/automation/app.py
index 07e4e88..a592c64 100644
--- a/automation/app.py
+++ b/automation/app.py
@@ -1,4 +1,11 @@
-"""FastAPI application entrypoint."""
+"""FastAPI application with Temporal workflow execution.
+
+This application uses Temporal for durable workflow execution:
+- Temporal worker runs as a background task
+- Temporal Schedules handle cron-based automation triggers
+- Activities handle sandbox operations with automatic retries
+- Workflows provide crash-proof execution guarantees
+"""
 
 import asyncio
 import logging
@@ -9,16 +16,14 @@
 from fastapi.responses import JSONResponse
 from sqlalchemy import text
 
-from automation.auth import create_http_client
 from automation.config import get_settings
 from automation.db import create_engine, create_session_factory
-from automation.dispatcher import dispatcher_loop
 from automation.logger import setup_all_loggers
 from automation.preset_router import router as preset_router
 from automation.router import router
-from automation.scheduler import scheduler_loop
+from automation.temporal.client import close_temporal_client, get_temporal_client
+from automation.temporal.worker import create_worker
 from automation.uploads import router as uploads_router
-from automation.watchdog import watchdog_loop
 
 
 logger = logging.getLogger("automation.app")
@@ -26,105 +31,91 @@
 
 @asynccontextmanager
 async def lifespan(app: FastAPI):
-    """Application startup/shutdown lifecycle."""
-    # Startup
+    """Application startup/shutdown lifecycle with Temporal."""
     settings = get_settings()
 
-    # Apply the repo-wide JSON structured-logging convention
+    # Apply structured logging
     setup_all_loggers()
 
-    # Silence noisy third-party loggers
+    # Silence noisy loggers
     for noisy_logger in (
         "ddtrace",
         "httpx",
         "httpcore",
-        "sqlalchemy.engine",  # Suppress SQL statement logging
+        "sqlalchemy.engine",
     ):
         logging.getLogger(noisy_logger).setLevel(logging.WARNING)
 
     logger.info("Starting OpenHands Automations Service")
 
-    # Create shared httpx client for auth (stored in app.state for DI)
-    app.state.http_client = create_http_client()
-
-    # Create engine and session factory, store in app.state
+    # Create database engine and session factory
     engine_result = await create_engine(settings)
     app.state.engine_result = engine_result
     app.state.engine = engine_result.engine
     app.state.session_factory = create_session_factory(engine_result.engine)
 
-    # Start the background scheduler and dispatcher
+    # Initialize Temporal client
+    try:
+        temporal_client = await get_temporal_client()
+        app.state.temporal_client = temporal_client
+        logger.info("Temporal client connected")
+    except Exception as e:
+        logger.error("Failed to connect to Temporal: %s", e)
+        raise
+
+    # Start Temporal worker as background task (unless skip_worker is set)
+    # When running with separate worker pods, skip_worker should be True to avoid
+    # conflicts between ddtrace instrumentation and Temporal's workflow sandbox
     shutdown_event = asyncio.Event()
     app.state.shutdown_event = shutdown_event
+    worker_task = None
 
-    # Scheduler: polls automations and creates PENDING runs
-    scheduler_task = asyncio.create_task(
-        scheduler_loop(
-            app.state.session_factory,
-            interval_seconds=settings.scheduler_interval_seconds,
-            shutdown_event=shutdown_event,
-        )
-    )
-    app.state.scheduler_task = scheduler_task
-    logger.info("Background scheduler started")
-
-    # Dispatcher: picks up PENDING runs and dispatches them
-    if not settings.base_url:
-        logger.warning(
-            "AUTOMATION_BASE_URL not set — using localhost. "
-            "Sandboxes in the cloud won't be able to reach this URL."
-        )
-    dispatcher_task = asyncio.create_task(
-        dispatcher_loop(
-            app.state.session_factory,
-            settings=settings,
-            interval_seconds=settings.dispatcher_interval_seconds,
-            shutdown_event=shutdown_event,
-        )
-    )
-    app.state.dispatcher_task = dispatcher_task
-    logger.info("Background dispatcher started")
-
-    # Watchdog: marks stale RUNNING runs as FAILED
-    watchdog_task = asyncio.create_task(
-        watchdog_loop(
-            app.state.session_factory,
-            settings=settings,
-            shutdown_event=shutdown_event,
+    if not settings.skip_worker:
+        worker = await create_worker(temporal_client, settings)
+        worker_task = asyncio.create_task(
+            _run_worker_with_shutdown(worker, shutdown_event),
+            name="temporal-worker",
         )
-    )
-    app.state.watchdog_task = watchdog_task
-    logger.info("Background watchdog started")
+        app.state.worker_task = worker_task
+        logger.info("Temporal worker started")
+    else:
+        logger.info("Skipping in-process worker (AUTOMATION_SKIP_WORKER=true)")
 
     yield
 
     # Shutdown
-    logger.info("Shutting down background tasks...")
+    logger.info("Shutting down...")
     shutdown_event.set()
 
-    # Wait for all tasks to exit gracefully
-    for task_name, task in [
-        ("scheduler", scheduler_task),
-        ("dispatcher", dispatcher_task),
-        ("watchdog", watchdog_task),
-    ]:
+    # Wait for worker to stop (if we started one)
+    if worker_task is not None:
         try:
-            await asyncio.wait_for(task, timeout=5.0)
+            await asyncio.wait_for(worker_task, timeout=10.0)
         except TimeoutError:
-            logger.warning("%s did not exit in time, cancelling", task_name)
-            task.cancel()
+            logger.warning("Worker did not stop in time, cancelling")
+            worker_task.cancel()
             try:
-                await task
+                await worker_task
             except asyncio.CancelledError:
                 pass
 
-    await app.state.http_client.aclose()
-    await app.state.engine_result.dispose()
+    # Close Temporal client
+    await close_temporal_client()
+
+    # Close database
+    await engine_result.dispose()
     logger.info("Automations service shut down")
 
 
+async def _run_worker_with_shutdown(worker, shutdown_event: asyncio.Event):
+    """Run worker until shutdown event is set."""
+    async with worker:
+        await shutdown_event.wait()
+        logger.info("Worker received shutdown signal")
+
+
 def _build_cors_origins() -> list[str]:
-    """Build the list of allowed CORS origins from settings."""
+    """Build the list of allowed CORS origins."""
     settings = get_settings()
     origins = [o.strip() for o in settings.cors_origins.split(",") if o.strip()]
     if not origins:
@@ -135,14 +126,10 @@ def _build_cors_origins() -> list[str]:
 def _create_app() -> FastAPI:
     """Create and configure the FastAPI application."""
     settings = get_settings()
-    # root_path is derived from AUTOMATION_BASE_URL path component.
-    # e.g., https://app.all-hands.dev/api/automation -> /api/automation
     return FastAPI(
         title="OpenHands Automations Service",
-        description=(
-            "Scheduled and event-driven automation execution for OpenHands Cloud"
-        ),
-        version="0.1.0",
+        description="Scheduled and event-driven automation execution using Temporal",
+        version="0.2.0",
         lifespan=lifespan,
         root_path=settings.root_path,
     )
@@ -158,9 +145,7 @@ def _create_app() -> FastAPI:
     allow_headers=["*"],
 )
 
-# Include uploads_router and preset_router BEFORE router to avoid route conflict.
-# The main router has /v1/{automation_id} which would match /v1/uploads
-# or /v1/preset/prompt and fail UUID validation if included first.
+# Include routers (order matters - more specific routes first)
 app.include_router(uploads_router)
 app.include_router(preset_router)
 app.include_router(router)
@@ -168,22 +153,37 @@ def _create_app() -> FastAPI:
 
 @app.get("/health")
 async def health():
+    """Health check endpoint."""
     return {"status": "ok"}
 
 
 @app.get("/ready")
 async def readiness():
-    """Readiness probe — checks DB connectivity.
+    """Readiness probe — checks DB and Temporal connectivity."""
+    errors = []
 
-    Returns 503 when the DB is unreachable so Kubernetes stops routing traffic.
-    """
+    # Check database
     try:
         async with app.state.engine.connect() as conn:
             await conn.execute(text("SELECT 1"))
-        return {"status": "ready"}
     except Exception as e:
-        logger.error("Readiness check failed: %s", e, exc_info=True)
+        logger.error("Database check failed: %s", e)
+        errors.append("database unavailable")
+
+    # Check Temporal
+    try:
+        client = app.state.temporal_client
+        # Simple connectivity check - list workflows with limit 1
+        async for _ in client.list_workflows(query="", page_size=1):
+            break
+    except Exception as e:
+        logger.error("Temporal check failed: %s", e)
+        errors.append("temporal unavailable")
+
+    if errors:
         return JSONResponse(
             status_code=503,
-            content={"status": "not_ready", "error": "database unavailable"},
+            content={"status": "not_ready", "errors": errors},
         )
+
+    return {"status": "ready"}
diff --git a/automation/config.py b/automation/config.py
index 88b3e3e..3d17585 100644
--- a/automation/config.py
+++ b/automation/config.py
@@ -26,14 +26,21 @@ class Settings(BaseSettings):
     # OpenHands SaaS API
     openhands_api_base_url: str = "https://app.all-hands.dev"
 
-    # Scheduler (polls automations table for due cron jobs)
-    scheduler_interval_seconds: int = 60
-
-    # Dispatcher (polls automation_runs table for pending jobs)
-    dispatcher_interval_seconds: int = 10
-
-    # Watchdog (scans for stale RUNNING runs past their timeout)
-    watchdog_interval_seconds: int = 60
+    # Temporal configuration
+    temporal_host: str = "localhost"
+    temporal_port: int = 7233
+    temporal_namespace: str = "default"
+    temporal_task_queue: str = "automations"
+    # For Temporal Cloud: set to True and provide TLS cert/key paths
+    temporal_tls_enabled: bool = False
+    temporal_tls_cert_path: str | None = None
+    temporal_tls_key_path: str | None = None
+    # Skip starting an in-process worker (use when running separate worker pods)
+    # This avoids conflicts between ddtrace and Temporal's workflow sandbox
+    skip_worker: bool = False
+    # Fast-fail mode: disable retries for faster test feedback
+    # When True, all activity retry policies use maximum_attempts=1
+    fast_fail: bool = False
 
     # Service key for authenticating with the SaaS API to fetch per-user
     # API keys (called by the dispatcher before each automation run).
@@ -56,6 +63,11 @@ class Settings(BaseSettings):
 
     model_config = {"env_prefix": "AUTOMATION_"}
 
+    @property
+    def temporal_address(self) -> str:
+        """Full Temporal server address."""
+        return f"{self.temporal_host}:{self.temporal_port}"
+
     @property
     def resolved_base_url(self) -> str:
         """Public base URL with localhost fallback for dev."""
diff --git a/automation/dispatcher.py b/automation/dispatcher.py
deleted file mode 100644
index 6a49341..0000000
--- a/automation/dispatcher.py
+++ /dev/null
@@ -1,350 +0,0 @@
-"""Dispatcher for processing pending automation runs.
-
-Polls the automation_runs table for PENDING jobs and dispatches them
-to sandboxes via the SaaS API.  Uses FOR UPDATE SKIP LOCKED for
-multi-worker safety.
-
-Completion is handled asynchronously: the SDK running inside the sandbox
-POSTs to ``/v1/runs/{id}/complete`` when the entry-point
-exits, so the dispatcher does **not** block waiting for results.
-"""
-
-import asyncio
-import json
-import logging
-import uuid
-from datetime import timedelta
-from typing import Any
-
-from sqlalchemy import select
-from sqlalchemy.ext.asyncio import AsyncSession, async_sessionmaker
-from sqlalchemy.orm import selectinload
-
-from automation.config import Settings
-from automation.constants import MAX_RUN_DURATION, MAX_RUN_DURATION_SECONDS
-from automation.exceptions import PermanentDispatchError, TarballNotFoundError
-from automation.execution import dispatch_automation
-from automation.models import AutomationRun, AutomationRunStatus, TarballUpload
-from automation.utils.api_key import APIKeyError, get_api_key_for_automation_run
-from automation.utils.run import (
-    disable_automation,
-    mark_run_status,
-    mark_run_terminal,
-    update_sandbox_id,
-)
-from automation.utils.tarball_validation import is_http_url, parse_internal_upload_id
-
-
-logger = logging.getLogger("automation.dispatcher")
-
-
-def _run_extra(
-    run_id: str | None = None,
-    automation_id: str | None = None,
-    sandbox_id: str | None = None,
-) -> dict[str, Any]:
-    """Build extra dict for structured logging with run/automation/sandbox IDs."""
-    extra: dict[str, Any] = {}
-    if run_id:
-        extra["run_id"] = run_id
-    if automation_id:
-        extra["automation_id"] = automation_id
-    if sandbox_id:
-        extra["sandbox_id"] = sandbox_id
-    return extra
-
-
-DEFAULT_BATCH_SIZE = 10
-POLL_INTERVAL_SECONDS = 30
-
-
-async def _download_internal_tarball(
-    upload_id: uuid.UUID,
-    session: AsyncSession | None,
-) -> bytes:
-    """Download a tarball from storage using the TarballUpload record.
-
-    Raises:
-        TarballNotFoundError: If the tarball upload record doesn't exist.
-            This is a permanent error that should disable the automation.
-        ValueError: If no database session is provided.
-    """
-    if session is None:
-        raise ValueError("Database session required to resolve oh-internal:// URLs")
-
-    result = await session.execute(
-        select(TarballUpload).where(TarballUpload.id == upload_id)
-    )
-    upload = result.scalars().first()
-    if upload is None:
-        raise TarballNotFoundError(
-            f"Internal tarball upload not found: {upload_id}. "
-            "The tarball may have been deleted."
-        )
-
-    from automation.storage import get_file_store
-
-    store = get_file_store()
-    return store.read(upload.storage_path)
-
-
-async def _poll_pending_runs(
-    session: AsyncSession,
-    batch_size: int,
-) -> list[AutomationRun]:
-    """Poll pending runs using FOR UPDATE SKIP LOCKED.
-
-    Eagerly loads the ``automation`` relationship so that ``user_id``,
-    ``org_id``, and tarball config are available for dispatch.
-    """
-    select_query = (
-        select(AutomationRun)
-        .options(selectinload(AutomationRun.automation))
-        .where(AutomationRun.status == AutomationRunStatus.PENDING)
-        .order_by(AutomationRun.created_at.asc())
-        .limit(batch_size)
-        .with_for_update(skip_locked=True)
-    )
-    result = await session.execute(select_query)
-    return list(result.scalars().all())
-
-
-async def _execute_run(
-    run: AutomationRun,
-    settings: Settings,
-    session_factory: async_sessionmaker[AsyncSession],
-) -> None:
-    """Execute a single run in a background task (fire-and-forget).
-
-    1. Fetch a per-user API key from the SaaS service (on demand, never stored).
-    2. Determine tarball source:
-       - Internal (oh-internal://): Download from GCS and upload to sandbox.
-       - External (http/https): Pass URL for direct download inside sandbox.
-    3. Call ``dispatch_automation()`` to spin up a sandbox and start the entrypoint.
-    4. Store sandbox_id on the run for later verification.
-    5. If the sandbox fails to start, mark the run FAILED.
-
-    The SDK inside the sandbox fires the completion callback on exit.
-    The watchdog will verify status via sandbox if the callback is missed.
-    """
-    run_id = str(run.id)
-    automation = run.automation
-    automation_id = str(automation.id)
-    tarball_path = automation.tarball_path
-
-    # Helper for consistent structured logging
-    def log_extra(sandbox_id: str | None = None) -> dict[str, Any]:
-        return _run_extra(
-            run_id=run_id, automation_id=automation_id, sandbox_id=sandbox_id
-        )
-
-    callback_url = f"{settings.resolved_base_url.rstrip('/')}/v1/runs/{run_id}/complete"
-
-    try:
-        # 1. Fetch a per-user API key from the SaaS service
-        api_key = await get_api_key_for_automation_run(run)
-
-        # 2. Determine tarball source
-        tarball_source: bytes | str
-        if is_http_url(tarball_path):
-            # HTTP(S) URL: download directly inside sandbox (untrusted/large)
-            tarball_source = tarball_path
-            logger.info("HTTP URL tarball, will download in sandbox", extra=log_extra())
-        else:
-            # Internal (oh-internal://): download from GCS, upload to sandbox
-            upload_id = parse_internal_upload_id(tarball_path)
-            if upload_id is None:
-                raise ValueError(f"Unsupported tarball_path: {tarball_path!r}")
-
-            async with session_factory() as session:
-                tarball_source = await _download_internal_tarball(upload_id, session)
-            logger.info(
-                "Internal tarball downloaded (%d bytes)",
-                len(tarball_source),
-                extra=log_extra(),
-            )
-
-        # 3. Build env vars for the sandbox
-        env_vars = {
-            "OPENHANDS_API_KEY": api_key,
-            "OPENHANDS_CLOUD_API_URL": settings.openhands_api_base_url,
-        }
-
-        # Trigger context so the SDK script knows *why* it was invoked
-        event_payload = {
-            "trigger": automation.trigger,
-            "automation_id": str(automation.id),
-            "automation_name": automation.name,
-        }
-        env_vars["AUTOMATION_EVENT_PAYLOAD"] = json.dumps(event_payload)
-
-        # 4. Calculate effective timeout: use automation's timeout if set,
-        # capped at system maximum; otherwise use system default
-        if automation.timeout is not None:
-            effective_timeout = min(automation.timeout, MAX_RUN_DURATION_SECONDS)
-        else:
-            effective_timeout = MAX_RUN_DURATION_SECONDS
-
-        # 5. Dispatch to sandbox (fire-and-forget)
-        result = await dispatch_automation(
-            api_url=settings.openhands_api_base_url,
-            api_key=api_key,
-            entrypoint=automation.entrypoint,
-            tarball_source=tarball_source,
-            env_vars=env_vars,
-            timeout=effective_timeout,
-            callback_url=callback_url,
-            run_id=run_id,
-        )
-
-        sandbox_extra = log_extra(sandbox_id=result.sandbox_id)
-        if result.success:
-            # Store sandbox_id for later verification by the watchdog
-            if result.sandbox_id:
-                await update_sandbox_id(session_factory, run.id, result.sandbox_id)
-            logger.info(
-                "Automation dispatched successfully, waiting for callback",
-                extra=sandbox_extra,
-            )
-            # Don't mark as COMPLETED here - wait for the callback
-        else:
-            logger.warning(
-                "Sandbox dispatch failed: %s",
-                result.error,
-                extra=sandbox_extra,
-            )
-            await mark_run_terminal(
-                session_factory, run, AutomationRunStatus.FAILED, result.error
-            )
-
-    except PermanentDispatchError as exc:
-        # Permanent configuration error - disable the automation
-        logger.error(
-            "Permanent dispatch error, disabling automation: %s",
-            exc,
-            exc_info=True,
-            extra=log_extra(),
-        )
-        await mark_run_terminal(
-            session_factory, run, AutomationRunStatus.FAILED, str(exc)
-        )
-        await disable_automation(session_factory, automation.id, str(exc))
-
-    except (APIKeyError, ValueError) as exc:
-        logger.error("Dispatch error: %s", exc, exc_info=True, extra=log_extra())
-        await mark_run_terminal(
-            session_factory, run, AutomationRunStatus.FAILED, str(exc)
-        )
-    except Exception:
-        logger.exception("Background execution failed", extra=log_extra())
-        await mark_run_terminal(
-            session_factory, run, AutomationRunStatus.FAILED, "Internal error"
-        )
-
-
-async def dispatch_pending_runs(
-    session_factory: async_sessionmaker[AsyncSession],
-    settings: Settings,
-    batch_size: int = DEFAULT_BATCH_SIZE,
-) -> list[AutomationRun]:
-    """Poll for pending runs, mark RUNNING, and launch sandboxes.
-
-    Each run is dispatched as an ``asyncio.create_task`` so the
-    dispatcher loop is not blocked by long-running automations.
-    """
-    async with session_factory() as session:
-        pending_runs = await _poll_pending_runs(session, batch_size)
-
-        dispatched_runs = []
-        for run in pending_runs:
-            run_id = str(run.id)
-            automation_id = str(run.automation_id) if run.automation_id else None
-            extra = _run_extra(run_id=run_id, automation_id=automation_id)
-            try:
-                logger.info("Dispatching automation run", extra=extra)
-                # Use automation's custom timeout if set, otherwise use default
-                max_duration = (
-                    timedelta(seconds=run.automation.timeout)
-                    if run.automation and run.automation.timeout
-                    else MAX_RUN_DURATION
-                )
-                await mark_run_status(
-                    session, run, AutomationRunStatus.RUNNING, max_duration=max_duration
-                )
-                dispatched_runs.append(run)
-            except Exception:
-                logger.exception("Failed to dispatch run", extra=extra)
-
-        await session.commit()
-
-        for run in dispatched_runs:
-            asyncio.create_task(
-                _execute_run_safe(run, settings, session_factory),
-                name=f"execute-run-{run.id}",
-            )
-
-        return dispatched_runs
-
-
-async def _execute_run_safe(
-    run: AutomationRun,
-    settings: Settings,
-    session_factory: async_sessionmaker[AsyncSession],
-) -> None:
-    """Wrapper around ``_execute_run`` that never lets exceptions escape.
-
-    ``asyncio.create_task`` silently swallows exceptions from background
-    tasks, so this wrapper ensures every failure is logged and the run is
-    marked FAILED.
-    """
-    run_id = str(run.id)
-    automation_id = str(run.automation_id) if run.automation_id else None
-    extra = _run_extra(run_id=run_id, automation_id=automation_id)
-    try:
-        await _execute_run(run, settings, session_factory)
-    except Exception:
-        logger.exception("Background execution failed", extra=extra)
-        await mark_run_terminal(
-            session_factory, run, AutomationRunStatus.FAILED, "Internal error"
-        )
-
-
-async def dispatcher_loop(
-    session_factory: async_sessionmaker[AsyncSession],
-    settings: Settings,
-    interval_seconds: int = POLL_INTERVAL_SECONDS,
-    shutdown_event: asyncio.Event | None = None,
-    batch_size: int = DEFAULT_BATCH_SIZE,
-) -> None:
-    """Main dispatcher loop — polls for pending runs and dispatches them."""
-    logger.info(
-        "Dispatcher started, polling every %d seconds (batch_size=%d)",
-        interval_seconds,
-        batch_size,
-    )
-
-    while True:
-        if shutdown_event is not None and shutdown_event.is_set():
-            logger.info("Dispatcher received shutdown signal, exiting")
-            break
-
-        try:
-            dispatched = await dispatch_pending_runs(
-                session_factory, settings=settings, batch_size=batch_size
-            )
-            if dispatched:
-                logger.info("Dispatched %d run(s)", len(dispatched))
-            else:
-                logger.debug("No pending runs to dispatch")
-        except Exception:
-            logger.error("Error dispatching pending runs", exc_info=True)
-
-        if shutdown_event is not None:
-            try:
-                await asyncio.wait_for(shutdown_event.wait(), timeout=interval_seconds)
-                logger.info("Dispatcher received shutdown signal, exiting")
-                break
-            except TimeoutError:
-                pass
-        else:
-            await asyncio.sleep(interval_seconds)
diff --git a/automation/execution.py b/automation/execution.py
deleted file mode 100644
index bad398f..0000000
--- a/automation/execution.py
+++ /dev/null
@@ -1,580 +0,0 @@
-"""Sandbox execution for automation runs.
-
-One function does the whole job: spin up a sandbox, upload a tarball,
-extract it, run setup, run the entrypoint, tear down.
-"""
-
-import asyncio
-import io
-import logging
-import re
-import tarfile
-from typing import Any
-
-import httpx
-from pydantic.dataclasses import dataclass
-from tenacity import (
-    before_sleep_log,
-    retry,
-    retry_if_exception,
-    stop_after_attempt,
-    wait_exponential,
-)
-
-from automation.constants import (
-    EXTERNAL_DOWNLOAD_TIMEOUT,
-    EXTERNAL_MAX_FILESIZE,
-    MAX_RUN_DURATION_SECONDS,
-    RATE_LIMIT_MAX_RETRIES,
-    RATE_LIMIT_MAX_WAIT,
-    RATE_LIMIT_MIN_WAIT,
-    SANDBOX_POLL_INTERVAL,
-    SANDBOX_READY_TIMEOUT,
-    TARBALL_PATH,
-    WORK_DIR,
-)
-from automation.exceptions import PermanentDispatchError, TarballNotFoundError
-from automation.utils.sandbox import delete_sandbox
-
-
-logger = logging.getLogger(__name__)
-
-
-def _is_rate_limit_error(exc: BaseException) -> bool:
-    """Check if exception is a 429 rate limit error."""
-    if isinstance(exc, httpx.HTTPStatusError):
-        return exc.response.status_code == 429
-    return False
-
-
-def _log_extra(
-    run_id: str | None = None, sandbox_id: str | None = None
-) -> dict[str, Any]:
-    """Build extra dict for structured logging with run/sandbox IDs."""
-    extra: dict[str, Any] = {}
-    if run_id:
-        extra["run_id"] = run_id
-    if sandbox_id:
-        extra["sandbox_id"] = sandbox_id
-    return extra
-
-
-# Tenacity retry decorator for rate limit handling
-_retry_on_rate_limit = retry(
-    retry=retry_if_exception(_is_rate_limit_error),
-    stop=stop_after_attempt(RATE_LIMIT_MAX_RETRIES),
-    wait=wait_exponential(min=RATE_LIMIT_MIN_WAIT, max=RATE_LIMIT_MAX_WAIT),
-    before_sleep=before_sleep_log(logger, logging.WARNING),
-    reraise=True,
-)
-
-
-def build_tarball(files: dict[str, str | bytes]) -> bytes:
-    """Build a .tar.gz in memory from ``{relative_path: content}``."""
-    buf = io.BytesIO()
-    with tarfile.open(fileobj=buf, mode="w:gz") as tar:
-        for name, content in files.items():
-            data = content.encode() if isinstance(content, str) else content
-            info = tarfile.TarInfo(name=name)
-            info.size = len(data)
-            tar.addfile(info, io.BytesIO(data))
-    return buf.getvalue()
-
-
-# -- Sandbox helpers (private) ------------------------------------------------
-
-
-def _find_agent_server_url(sandbox: dict) -> tuple[str, str] | None:
-    """Return ``(agent_url, session_key)`` if an AGENT_SERVER URL exists."""
-    for url_info in sandbox.get("exposed_urls") or []:
-        if url_info.get("name") == "AGENT_SERVER":
-            return url_info["url"].rstrip("/"), sandbox.get("session_api_key", "")
-    return None
-
-
-@_retry_on_rate_limit
-async def _create_sandbox(
-    client: httpx.AsyncClient, api_url: str, headers: dict[str, str]
-) -> str:
-    """Create a sandbox and return its ID. Retries on rate limit."""
-    resp = await client.post(f"{api_url}/api/v1/sandboxes", headers=headers)
-    resp.raise_for_status()
-    return resp.json()["id"]
-
-
-@_retry_on_rate_limit
-async def _poll_sandbox(
-    client: httpx.AsyncClient, api_url: str, sandbox_id: str, headers: dict[str, str]
-) -> dict[str, Any]:
-    """Poll sandbox status. Retries on rate limit."""
-    resp = await client.get(
-        f"{api_url}/api/v1/sandboxes",
-        params={"id": sandbox_id},
-        headers=headers,
-    )
-    resp.raise_for_status()
-    items = resp.json()
-    if not items:
-        raise RuntimeError(f"Sandbox {sandbox_id} disappeared")
-    return items[0]
-
-
-async def _create_and_wait(
-    client: httpx.AsyncClient,
-    api_url: str,
-    api_key: str,
-    ready_timeout: float = SANDBOX_READY_TIMEOUT,
-) -> tuple[str, str, str]:
-    """Create a sandbox and poll until RUNNING.
-
-    Returns ``(sandbox_id, session_api_key, agent_server_url)``.
-    Handles 429 rate limits via tenacity retry.
-    """
-    headers = {"Authorization": f"Bearer {api_key}"}
-
-    sandbox_id = await _create_sandbox(client, api_url, headers)
-
-    elapsed = 0.0
-    while elapsed < ready_timeout:
-        sb = await _poll_sandbox(client, api_url, sandbox_id, headers)
-        status = sb.get("status", "UNKNOWN")
-
-        if status == "RUNNING":
-            result = _find_agent_server_url(sb)
-            if result is None:
-                raise RuntimeError(f"No AGENT_SERVER URL in sandbox {sandbox_id}")
-            agent_url, session_key = result
-            return sandbox_id, session_key, agent_url
-
-        if status in ("ERROR", "MISSING"):
-            # Extract error details from sandbox response
-            error_code = sb.get("error_code", "")
-            error_message = sb.get("error_message", "")
-            error_detail = f"status={status}"
-            if error_code:
-                error_detail += f", error_code={error_code}"
-            if error_message:
-                error_detail += f", error_message={error_message}"
-            raise RuntimeError(f"Sandbox {sandbox_id} failed: {error_detail}")
-
-        await asyncio.sleep(SANDBOX_POLL_INTERVAL)
-        elapsed += SANDBOX_POLL_INTERVAL
-
-    raise TimeoutError(f"Sandbox {sandbox_id} not ready after {ready_timeout}s")
-
-
-async def _upload(
-    client: httpx.AsyncClient,
-    agent_url: str,
-    session_key: str,
-    data: bytes,
-    dest: str,
-) -> None:
-    """Upload bytes to the sandbox via the agent-server file API.
-
-    The agent-server expects the absolute path in the URL, e.g.
-    ``POST /api/file/upload//tmp/file.tar.gz`` (double-slash is correct).
-    """
-    resp = await client.post(
-        f"{agent_url}/api/file/upload/{dest}",
-        files={"file": ("upload", data)},
-        headers={"X-Session-API-Key": session_key},
-    )
-    resp.raise_for_status()
-
-
-async def _bash(
-    client: httpx.AsyncClient,
-    agent_url: str,
-    session_key: str,
-    command: str,
-    timeout: int = MAX_RUN_DURATION_SECONDS,
-) -> tuple[int | None, str, str]:
-    """Run a bash command synchronously. Returns ``(exit_code, stdout, stderr)``."""
-    resp = await client.post(
-        f"{agent_url}/api/bash/execute_bash_command",
-        json={"command": command, "timeout": timeout},
-        headers={"X-Session-API-Key": session_key},
-        timeout=httpx.Timeout(timeout + 30),
-    )
-    resp.raise_for_status()
-    body = resp.json()
-    return body.get("exit_code"), body.get("stdout") or "", body.get("stderr") or ""
-
-
-async def _start_bash(
-    client: httpx.AsyncClient,
-    agent_url: str,
-    session_key: str,
-    command: str,
-    timeout: int = MAX_RUN_DURATION_SECONDS,
-) -> str:
-    """Start a bash command in the background. Returns the command ID."""
-    resp = await client.post(
-        f"{agent_url}/api/bash/start_bash_command",
-        json={"command": command, "timeout": timeout},
-        headers={"X-Session-API-Key": session_key},
-        timeout=30.0,
-    )
-    resp.raise_for_status()
-    body = resp.json()
-    return body.get("id")
-
-
-def _is_permanent_http_error(stderr: str) -> bool:
-    """Check if curl stderr indicates a permanent HTTP error (4xx client errors).
-
-    We only treat 4xx errors as permanent because they indicate the URL is wrong
-    or inaccessible (404 Not Found, 403 Forbidden, 401 Unauthorized, etc.).
-    5xx errors are transient server issues that may resolve on retry.
-
-    Returns True if the error is permanent and the automation should be disabled.
-    """
-    # curl error format: "The requested URL returned error: 404"
-    # We look for 4xx status codes
-    match = re.search(r"returned error:\s*(\d{3})", stderr)
-    if match:
-        status_code = int(match.group(1))
-        return 400 <= status_code < 500
-    return False
-
-
-async def _download_in_sandbox(
-    client: httpx.AsyncClient,
-    agent_url: str,
-    session_key: str,
-    tarball_url: str,
-    dest: str,
-    timeout: int = EXTERNAL_DOWNLOAD_TIMEOUT,
-    max_filesize: int = EXTERNAL_MAX_FILESIZE,
-) -> None:
-    """Download a tarball directly inside the sandbox using curl.
-
-    This is used for external URLs (https://) to avoid downloading
-    untrusted, potentially large files on the automation service.
-
-    Raises:
-        TarballNotFoundError: If the URL returns a 4xx HTTP error (permanent).
-            This indicates the URL is wrong or inaccessible.
-        RuntimeError: For other download failures (transient).
-    """
-    # Use curl with safety limits:
-    # -f: fail silently on HTTP errors (returns exit code 22)
-    # -s: silent mode (no progress)
-    # -S: show errors even in silent mode
-    # -L: follow redirects
-    # --max-filesize: limit download size
-    # --max-time: limit total time
-    cmd = (
-        f"curl -fsSL "
-        f"--max-filesize {max_filesize} "
-        f"--max-time {timeout} "
-        f"-o {dest} "
-        f"{_shell_quote(tarball_url)}"
-    )
-
-    exit_code, stdout, stderr = await _bash(
-        client, agent_url, session_key, cmd, timeout=timeout + 30
-    )
-
-    if exit_code != 0:
-        # curl exit codes: 22 = HTTP error, 63 = max filesize exceeded
-        if exit_code == 63:
-            raise RuntimeError(
-                f"Tarball exceeds size limit ({max_filesize // 1024 // 1024} MB)"
-            )
-
-        # Check if this is a permanent HTTP error (4xx)
-        if exit_code == 22 and _is_permanent_http_error(stderr):
-            raise TarballNotFoundError(
-                f"External tarball URL is not accessible: {tarball_url}. "
-                f"HTTP error: {stderr.strip()}"
-            )
-
-        raise RuntimeError(f"Failed to download tarball (exit={exit_code}): {stderr}")
-
-
-# -- Public API ---------------------------------------------------------------
-
-
-@dataclass(frozen=True)
-class DispatchResult:
-    """Result of dispatching an automation to a sandbox (fire-and-forget)."""
-
-    success: bool
-    sandbox_id: str | None = None
-    error: str | None = None
-
-
-async def dispatch_automation(
-    api_url: str,
-    api_key: str,
-    entrypoint: str,
-    tarball_source: bytes | str,
-    env_vars: dict[str, str] | None = None,
-    timeout: int = MAX_RUN_DURATION_SECONDS,
-    callback_url: str | None = None,
-    run_id: str | None = None,
-) -> DispatchResult:
-    """Dispatch an automation to a sandbox (fire-and-forget).
-
-    1. Create sandbox and wait until RUNNING.
-    2. Get tarball into sandbox (upload bytes OR download from URL).
-    3. Extract it, run ``setup.sh`` (if present), then start *entrypoint*.
-    4. Return immediately without waiting for the entrypoint to complete.
-
-    The SDK inside the sandbox will POST to callback_url when finished.
-    The caller should store sandbox_id to verify status later if needed.
-
-    *tarball_source*: Either raw bytes (uploaded to sandbox) or a URL string
-    (downloaded directly inside sandbox via curl). URLs avoid downloading
-    untrusted/large files on the automation service.
-
-    *env_vars* are exported before the entrypoint runs.  The sandbox
-    identity env vars (``SANDBOX_ID``, ``SESSION_API_KEY``) are
-    **always** injected so the SDK's ``local_agent_server_mode`` works.
-    If *callback_url* / *run_id* are set they are injected as
-    ``AUTOMATION_CALLBACK_URL`` / ``AUTOMATION_RUN_ID`` so the SDK's
-    ``OpenHandsCloudWorkspace`` can POST completion status on exit.
-    """
-    env_vars = dict(env_vars) if env_vars else {}
-    if callback_url:
-        env_vars["AUTOMATION_CALLBACK_URL"] = callback_url
-    if run_id:
-        env_vars["AUTOMATION_RUN_ID"] = run_id
-    api_url = api_url.rstrip("/")
-    sandbox_id: str | None = None
-
-    # Helper for consistent structured logging with run_id/sandbox_id
-    def log_extra() -> dict[str, Any]:
-        return _log_extra(run_id=run_id, sandbox_id=sandbox_id)
-
-    logger.info("Dispatching automation to sandbox", extra=log_extra())
-
-    async with httpx.AsyncClient(timeout=60.0) as client:
-        try:
-            sandbox_id, session_key, agent_url = await _create_and_wait(
-                client, api_url, api_key
-            )
-            logger.info(
-                "Sandbox ready: %s at %s", sandbox_id, agent_url, extra=log_extra()
-            )
-        except Exception as e:
-            # If sandbox creation started but failed to reach RUNNING,
-            # still attempt cleanup.
-            logger.exception("Sandbox creation failed", extra=log_extra())
-            if sandbox_id:
-                await delete_sandbox(client, api_url, api_key, sandbox_id)
-            return DispatchResult(success=False, sandbox_id=sandbox_id, error=str(e))
-
-        try:
-            # Always inject sandbox identity so the SDK can call
-            # get_llm() / get_secrets() inside the sandbox.
-            env_vars.setdefault("SANDBOX_ID", sandbox_id)
-            env_vars.setdefault("SESSION_API_KEY", session_key)
-
-            # Get tarball into sandbox: upload bytes or download from URL
-            if isinstance(tarball_source, bytes):
-                logger.info("Uploading tarball to sandbox", extra=log_extra())
-                await _upload(
-                    client, agent_url, session_key, tarball_source, TARBALL_PATH
-                )
-            else:
-                logger.info(
-                    "Downloading tarball in sandbox from URL", extra=log_extra()
-                )
-                await _download_in_sandbox(
-                    client, agent_url, session_key, tarball_source, TARBALL_PATH
-                )
-
-            exports = ""
-            if env_vars:
-                parts = [f"export {k}={_shell_quote(v)}" for k, v in env_vars.items()]
-                exports = " && ".join(parts) + " && "
-
-            cmd = (
-                f"mkdir -p {WORK_DIR}"
-                f" && tar xzf {TARBALL_PATH} -C {WORK_DIR}"
-                f" && cd {WORK_DIR}"
-                f" && ([ ! -f setup.sh ] || bash setup.sh)"
-                f" && {exports}{entrypoint}"
-            )
-
-            logger.info("Starting entrypoint: %s", entrypoint, extra=log_extra())
-            command_id = await _start_bash(
-                client, agent_url, session_key, cmd, timeout=timeout
-            )
-            logger.info(
-                "Entrypoint started (command_id=%s), disconnecting",
-                command_id,
-                extra=log_extra(),
-            )
-
-            return DispatchResult(success=True, sandbox_id=sandbox_id)
-
-        except PermanentDispatchError:
-            # Clean up sandbox before re-raising so dispatcher can disable automation
-            if sandbox_id:
-                try:
-                    await delete_sandbox(client, api_url, api_key, sandbox_id)
-                except Exception:
-                    logger.exception("Failed to delete sandbox during error cleanup")
-            raise
-        except Exception as e:
-            logger.exception("Automation dispatch failed", extra=log_extra())
-            # Delete sandbox on dispatch failure to avoid orphaned sandboxes
-            if sandbox_id:
-                await delete_sandbox(client, api_url, api_key, sandbox_id)
-            return DispatchResult(success=False, sandbox_id=sandbox_id, error=str(e))
-
-
-@dataclass(frozen=True)
-class AutomationResult:
-    """Result of running an automation (blocking mode)."""
-
-    success: bool
-    sandbox_id: str | None = None
-    exit_code: int | None = None
-    stdout: str = ""
-    stderr: str = ""
-    error: str | None = None
-
-
-async def run_automation(
-    api_url: str,
-    api_key: str,
-    entrypoint: str,
-    tarball_source: bytes | str,
-    env_vars: dict[str, str] | None = None,
-    timeout: int = MAX_RUN_DURATION_SECONDS,
-    callback_url: str | None = None,
-    run_id: str | None = None,
-    keep_sandbox: bool = False,
-) -> AutomationResult:
-    """Execute an automation end-to-end in a fresh sandbox (blocking).
-
-    Use this for testing or when you need to wait for the result immediately.
-    For production async execution, use dispatch_automation() instead.
-
-    1. Create sandbox and wait until RUNNING.
-    2. Get tarball into sandbox (upload bytes OR download from URL).
-    3. Extract it, run ``setup.sh`` (if present), then run *entrypoint*.
-    4. Wait for completion and return the result.
-    5. Delete the sandbox (unless *keep_sandbox* is True).
-
-    *tarball_source*: Either raw bytes (uploaded to sandbox) or a URL string
-    (downloaded directly inside sandbox via curl). URLs avoid downloading
-    untrusted/large files on the automation service.
-
-    *env_vars* are exported before the entrypoint runs.  The sandbox
-    identity env vars (``SANDBOX_ID``, ``SESSION_API_KEY``) are
-    **always** injected so the SDK's ``local_agent_server_mode`` works.
-    If *callback_url* / *run_id* are set they are injected as
-    ``AUTOMATION_CALLBACK_URL`` / ``AUTOMATION_RUN_ID`` so the SDK's
-    ``OpenHandsCloudWorkspace`` can POST completion status on exit.
-    """
-    env_vars = dict(env_vars) if env_vars else {}
-    if callback_url:
-        env_vars["AUTOMATION_CALLBACK_URL"] = callback_url
-    if run_id:
-        env_vars["AUTOMATION_RUN_ID"] = run_id
-    api_url = api_url.rstrip("/")
-    sandbox_id: str | None = None
-
-    # Helper for consistent structured logging with run_id/sandbox_id
-    def log_extra() -> dict[str, Any]:
-        return _log_extra(run_id=run_id, sandbox_id=sandbox_id)
-
-    logger.info("Starting automation execution", extra=log_extra())
-
-    async with httpx.AsyncClient(timeout=60.0) as client:
-        try:
-            sandbox_id, session_key, agent_url = await _create_and_wait(
-                client, api_url, api_key
-            )
-            logger.info(
-                "Sandbox ready: %s at %s", sandbox_id, agent_url, extra=log_extra()
-            )
-        except Exception as e:
-            # If sandbox creation started but failed to reach RUNNING,
-            # still attempt cleanup.
-            logger.exception("Sandbox creation failed", extra=log_extra())
-            if sandbox_id:
-                await delete_sandbox(client, api_url, api_key, sandbox_id)
-            return AutomationResult(success=False, sandbox_id=sandbox_id, error=str(e))
-
-        try:
-            # Always inject sandbox identity so the SDK can call
-            # get_llm() / get_secrets() inside the sandbox.
-            env_vars.setdefault("SANDBOX_ID", sandbox_id)
-            env_vars.setdefault("SESSION_API_KEY", session_key)
-
-            # Get tarball into sandbox: upload bytes or download from URL
-            if isinstance(tarball_source, bytes):
-                logger.info("Uploading tarball to sandbox", extra=log_extra())
-                await _upload(
-                    client, agent_url, session_key, tarball_source, TARBALL_PATH
-                )
-            else:
-                logger.info(
-                    "Downloading tarball in sandbox from URL", extra=log_extra()
-                )
-                await _download_in_sandbox(
-                    client, agent_url, session_key, tarball_source, TARBALL_PATH
-                )
-
-            exports = ""
-            if env_vars:
-                parts = [f"export {k}={_shell_quote(v)}" for k, v in env_vars.items()]
-                exports = " && ".join(parts) + " && "
-
-            cmd = (
-                f"mkdir -p {WORK_DIR}"
-                f" && tar xzf {TARBALL_PATH} -C {WORK_DIR}"
-                f" && cd {WORK_DIR}"
-                f" && ([ ! -f setup.sh ] || bash setup.sh)"
-                f" && {exports}{entrypoint}"
-            )
-
-            logger.info("Executing entrypoint: %s", entrypoint, extra=log_extra())
-            exit_code, stdout, stderr = await _bash(
-                client, agent_url, session_key, cmd, timeout=timeout
-            )
-
-            success = exit_code == 0
-            error_msg = None
-            if not success:
-                # Include both stderr and stdout tail - some errors go to stdout
-                error_parts = [f"exit_code={exit_code}"]
-                if stderr:
-                    error_parts.append(f"stderr: {stderr[-1000:]}")
-                if stdout:
-                    error_parts.append(f"stdout: {stdout[-500:]}")
-                error_msg = "\n".join(error_parts)
-                logger.warning(
-                    "Entrypoint failed with exit_code=%s", exit_code, extra=log_extra()
-                )
-            else:
-                logger.info("Entrypoint completed successfully", extra=log_extra())
-
-            return AutomationResult(
-                success=success,
-                sandbox_id=sandbox_id,
-                exit_code=exit_code,
-                stdout=stdout,
-                stderr=stderr,
-                error=error_msg,
-            )
-
-        except Exception as e:
-            logger.exception("Automation execution failed", extra=log_extra())
-            return AutomationResult(success=False, sandbox_id=sandbox_id, error=str(e))
-        finally:
-            if not keep_sandbox:
-                logger.info("Deleting sandbox", extra=log_extra())
-                await delete_sandbox(client, api_url, api_key, sandbox_id)
-
-
-def _shell_quote(s: str) -> str:
-    """Single-quote a string for safe shell interpolation."""
-    return "'" + s.replace("'", "'\\''") + "'"
diff --git a/automation/router.py b/automation/router.py
index 983a1b1..db523db 100644
--- a/automation/router.py
+++ b/automation/router.py
@@ -1,16 +1,22 @@
-"""FastAPI router for the automations CRUD API."""
+"""FastAPI router for the automations CRUD API.
+
+Uses Temporal for workflow execution:
+- Creating/updating automations creates/updates Temporal Schedules
+- Manual dispatch starts a Temporal Workflow
+- Run completion updates database records
+"""
 
-import asyncio
 import logging
 import uuid
 
 from fastapi import APIRouter, Depends, HTTPException, Query, status
 from sqlalchemy import func, select, update
-from sqlalchemy.engine import CursorResult
 from sqlalchemy.ext.asyncio import AsyncSession
-from sqlalchemy.orm import selectinload
+from temporalio.client import Client
 
 from automation.auth import AuthenticatedUser, authenticate_request
+from automation.config import get_settings
+from automation.constants import MAX_RUN_DURATION_SECONDS
 from automation.db import get_session
 from automation.models import Automation, AutomationRun, AutomationRunStatus
 from automation.schemas import (
@@ -22,9 +28,19 @@
     RunCompleteRequest,
     UpdateAutomationRequest,
 )
+from automation.temporal.client import get_temporal_client
+from automation.temporal.schedules import (
+    create_schedule,
+    delete_schedule,
+    update_schedule,
+)
+from automation.temporal.types import (
+    AutomationConfig,
+    TriggerContext,
+    WorkflowInput,
+)
+from automation.temporal.workflows import AutomationWorkflow
 from automation.utils import utcnow
-from automation.utils.run import create_pending_run
-from automation.utils.sandbox import cleanup_sandbox
 from automation.utils.tarball_validation import validate_tarball_path
 
 
@@ -33,6 +49,14 @@
 router = APIRouter(prefix="/v1", tags=["Automations"])
 
 
+# --- Dependencies ---
+
+
+async def get_client() -> Client:
+    """Dependency to get the Temporal client."""
+    return await get_temporal_client()
+
+
 # --- CRUD ---
 
 
@@ -41,14 +65,14 @@ async def create_automation(
     body: CreateAutomationRequest,
     user: AuthenticatedUser = Depends(authenticate_request),
     session: AsyncSession = Depends(get_session),
+    client: Client = Depends(get_client),
 ) -> AutomationResponse:
-    """Create a new automation.
+    """Create a new automation with Temporal scheduling.
 
-    The tarball_path can be either:
-    - Internal upload: oh-internal://uploads/{uuid} (from /v1/uploads)
-    - External public URL: https://, s3://, or gs:// URLs
+    Creates the automation in the database and a corresponding Temporal
+    Schedule if the trigger is cron-based.
     """
-    # Validate tarball_path (checks ownership for internal uploads)
+    # Validate tarball_path
     await validate_tarball_path(
         tarball_path=body.tarball_path,
         user_id=user.user_id,
@@ -69,6 +93,20 @@ async def create_automation(
     session.add(auto)
     await session.flush()
     await session.refresh(auto)
+
+    # Create Temporal Schedule for cron triggers
+    if body.trigger.type == "cron":
+        try:
+            await create_schedule(client, auto)
+        except Exception as e:
+            logger.error("Failed to create Temporal schedule: %s", e)
+            # Rollback the automation creation
+            await session.rollback()
+            raise HTTPException(
+                status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+                detail=f"Failed to create schedule: {e}",
+            )
+
     return AutomationResponse.model_validate(auto)
 
 
@@ -79,7 +117,7 @@ async def list_automations(
     user: AuthenticatedUser = Depends(authenticate_request),
     session: AsyncSession = Depends(get_session),
 ) -> AutomationListResponse:
-    """List automations for the authenticated user (excludes soft-deleted)."""
+    """List automations for the authenticated user."""
     base_query = select(Automation).where(
         Automation.user_id == user.user_id,
         Automation.org_id == user.org_id,
@@ -114,41 +152,57 @@ async def get_automation(
 
 
 @router.patch("/{automation_id}")
-async def update_automation(
+async def update_automation_endpoint(
     automation_id: uuid.UUID,
     body: UpdateAutomationRequest,
     user: AuthenticatedUser = Depends(authenticate_request),
     session: AsyncSession = Depends(get_session),
+    client: Client = Depends(get_client),
 ) -> AutomationResponse:
-    """Partially update an automation."""
+    """Update an automation and its Temporal Schedule."""
     auto = await _get_user_automation(session, automation_id, user.user_id, user.org_id)
 
     update_data = body.model_dump(exclude_unset=True)
-    # Handle trigger field mapping (only if trigger has a real value)
     if body.trigger is not None:
         update_data["trigger"] = body.trigger.model_dump()
 
     for field, value in update_data.items():
         setattr(auto, field, value)
 
-    # Note: updated_at is handled automatically by the model's onupdate=utcnow
     await session.flush()
     await session.refresh(auto)
+
+    # Update Temporal Schedule
+    if auto.trigger.get("type") == "cron":
+        try:
+            await update_schedule(client, auto)
+        except Exception as e:
+            logger.warning("Failed to update Temporal schedule: %s", e)
+            # Try to create it if it doesn't exist
+            try:
+                await create_schedule(client, auto)
+            except Exception:
+                pass
+
     return AutomationResponse.model_validate(auto)
 
 
 @router.delete("/{automation_id}", status_code=status.HTTP_204_NO_CONTENT)
-async def delete_automation(
+async def delete_automation_endpoint(
     automation_id: uuid.UUID,
     user: AuthenticatedUser = Depends(authenticate_request),
     session: AsyncSession = Depends(get_session),
+    client: Client = Depends(get_client),
 ) -> None:
-    """Soft delete an automation."""
+    """Soft delete an automation and its Temporal Schedule."""
     auto = await _get_user_automation(session, automation_id, user.user_id, user.org_id)
     auto.enabled = False
     auto.deleted_at = utcnow()
     await session.flush()
 
+    # Delete Temporal Schedule
+    await delete_schedule(client, automation_id)
+
 
 # --- Runs ---
 
@@ -158,16 +212,77 @@ async def dispatch_automation(
     automation_id: uuid.UUID,
     user: AuthenticatedUser = Depends(authenticate_request),
     session: AsyncSession = Depends(get_session),
+    client: Client = Depends(get_client),
 ) -> AutomationRunResponse:
-    """Manually dispatch an automation run.
+    """Manually dispatch an automation run using Temporal.
 
-    Creates a PENDING run for the specified automation, which will be
-    picked up by the dispatcher and executed.
+    Starts a Temporal Workflow for immediate execution instead of
+    creating a PENDING database record.
     """
     auto = await _get_user_automation(session, automation_id, user.user_id, user.org_id)
-    run = await create_pending_run(session, auto)
+    settings = get_settings()
+
+    # Create a database record for tracking
+    run = AutomationRun(
+        automation_id=automation_id,
+        status=AutomationRunStatus.RUNNING,
+        started_at=utcnow(),
+    )
+    session.add(run)
     await session.flush()
     await session.refresh(run)
+
+    # Build workflow input
+    automation_config = AutomationConfig(
+        automation_id=str(auto.id),
+        user_id=str(auto.user_id),
+        org_id=str(auto.org_id),
+        name=auto.name,
+        tarball_path=auto.tarball_path,
+        entrypoint=auto.entrypoint,
+        timeout_seconds=auto.timeout or MAX_RUN_DURATION_SECONDS,
+        trigger=auto.trigger,
+        setup_script_path=auto.setup_script_path,
+    )
+
+    trigger_context = TriggerContext(
+        trigger_type="manual",
+        triggered_by=str(user.user_id),
+    )
+
+    workflow_input = WorkflowInput(
+        automation=automation_config,
+        trigger_context=trigger_context,
+        run_id=str(run.id),
+        callback_url=f"{settings.resolved_base_url}/v1/runs/{run.id}/complete",
+    )
+
+    # Start the workflow
+    workflow_id = f"automation-run-{run.id}"
+    try:
+        await client.start_workflow(
+            AutomationWorkflow.run,
+            workflow_input,
+            id=workflow_id,
+            task_queue=settings.temporal_task_queue,
+        )
+        logger.info(
+            "Started workflow: workflow_id=%s run_id=%s automation_id=%s",
+            workflow_id,
+            run.id,
+            automation_id,
+        )
+    except Exception as e:
+        # Mark run as failed if workflow couldn't start
+        run.status = AutomationRunStatus.FAILED
+        run.error_detail = f"Failed to start workflow: {e}"
+        run.completed_at = utcnow()
+        await session.flush()
+        raise HTTPException(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            detail=f"Failed to start workflow: {e}",
+        )
+
     return AutomationRunResponse.model_validate(run)
 
 
@@ -179,20 +294,14 @@ async def list_automation_runs(
     user: AuthenticatedUser = Depends(authenticate_request),
     session: AsyncSession = Depends(get_session),
 ) -> AutomationRunListResponse:
-    """List runs for a specific automation.
-
-    Returns runs ordered by creation time (latest first), with pagination.
-    """
-    # Verify the automation exists and belongs to the user
+    """List runs for a specific automation."""
     await _get_user_automation(session, automation_id, user.user_id, user.org_id)
 
-    # Count total runs for this automation
     count_result = await session.execute(
         select(func.count()).where(AutomationRun.automation_id == automation_id)
     )
     total = count_result.scalar() or 0
 
-    # Fetch paginated runs ordered by latest first
     result = await session.execute(
         select(AutomationRun)
         .where(AutomationRun.automation_id == automation_id)
@@ -218,19 +327,17 @@ async def complete_run(
     user: AuthenticatedUser = Depends(authenticate_request),
     session: AsyncSession = Depends(get_session),
 ) -> AutomationRunResponse:
-    """Receive completion callback from the SDK running inside a sandbox.
-
-    Called by ``OpenHandsCloudWorkspace.__exit__`` when the automation
-    entry-point finishes (success or failure).  Transitions the run from
-    RUNNING → COMPLETED or RUNNING → FAILED.
+    """Receive completion callback from the SDK.
 
-    Authenticated via the same ``OPENHANDS_API_KEY`` that was passed into
-    the sandbox.  The key is validated against ``/api/keys/current`` (by
-    ``authenticate_request``) and the resulting user must own the run's
-    parent automation.
+    This endpoint is called by the SDK running inside a sandbox when
+    the automation entrypoint finishes. It updates the database record.
 
-    If keep_alive is False, deletes the sandbox after updating the run status.
+    Note: With Temporal, workflow completion is also tracked in Temporal's
+    event history, but this callback updates our database for API queries.
     """
+    from sqlalchemy.engine import CursorResult
+    from sqlalchemy.orm import selectinload
+
     result = await session.execute(
         select(AutomationRun)
         .where(AutomationRun.id == run_id)
@@ -240,19 +347,17 @@ async def complete_run(
     if run is None:
         raise HTTPException(status.HTTP_404_NOT_FOUND, detail="Run not found")
 
-    # Verify the caller owns this automation
     automation = run.automation
     if automation.user_id != user.user_id or automation.org_id != user.org_id:
         raise HTTPException(status.HTTP_403_FORBIDDEN, detail="Not your automation")
 
-    # Optimistic locking: only update if the run is still RUNNING.
-    # This prevents races between the watchdog and the callback.
     now = utcnow()
     new_status = (
         AutomationRunStatus.COMPLETED
         if body.status == "COMPLETED"
         else AutomationRunStatus.FAILED
     )
+
     values: dict = {
         "status": new_status,
         "completed_at": now,
@@ -262,6 +367,7 @@ async def complete_run(
     if body.status == "FAILED" and body.error:
         values["error_detail"] = body.error
 
+    # Optimistic update
     stmt = (
         update(AutomationRun)
         .where(
@@ -279,22 +385,7 @@ async def complete_run(
         )
 
     await session.refresh(run)
-    logger.info("Run %s → %s", run_id, new_status.value)
-
-    # Clean up sandbox if not keeping alive
-    if not run.keep_alive and run.sandbox_id:
-        # Fire-and-forget sandbox deletion in background
-        from automation.config import get_settings
-
-        settings = get_settings()
-        asyncio.create_task(
-            cleanup_sandbox(
-                api_url=settings.openhands_api_base_url,
-                api_key=user.api_key,
-                sandbox_id=run.sandbox_id,
-                run_id=str(run_id),
-            )
-        )
+    logger.info("Run completed: run_id=%s status=%s", run_id, new_status.value)
 
     return AutomationRunResponse.model_validate(run)
 
@@ -308,7 +399,7 @@ async def _get_user_automation(
     user_id: uuid.UUID,
     org_id: uuid.UUID,
 ) -> Automation:
-    """Fetch a non-deleted automation, ensuring it belongs to the given user and org."""
+    """Fetch a non-deleted automation belonging to the user."""
     result = await session.execute(
         select(Automation).where(
             Automation.id == automation_id,
diff --git a/automation/scheduler.py b/automation/scheduler.py
deleted file mode 100644
index 8d5dc26..0000000
--- a/automation/scheduler.py
+++ /dev/null
@@ -1,192 +0,0 @@
-"""Background scheduler for polling due cron automations.
-
-Runs as an in-process background task within the FastAPI app. Polls the database
-every N seconds (configurable via AUTOMATION_SCHEDULER_INTERVAL_SECONDS) for
-enabled cron automations whose next fire time is due.
-
-Uses FOR UPDATE SKIP LOCKED for multi-worker safety in PostgreSQL.
-"""
-
-import asyncio
-import logging
-from datetime import datetime, timedelta
-
-from sqlalchemy import select, update
-from sqlalchemy.ext.asyncio import AsyncSession, async_sessionmaker
-
-from automation.models import Automation, AutomationRun
-from automation.utils import is_automation_due, utcnow
-from automation.utils.run import create_pending_run
-
-
-logger = logging.getLogger("automation.scheduler")
-
-# Default batch size for polling
-DEFAULT_BATCH_SIZE = 50
-
-# Minimum interval between polling the same automation (seconds)
-POLL_INTERVAL_SECONDS = 60
-
-
-async def _fetch_enabled_automations(
-    session: AsyncSession,
-    batch_size: int,
-    poll_threshold: datetime,
-) -> list[Automation]:
-    """Fetch enabled automations using FOR UPDATE SKIP LOCKED.
-
-    This allows multiple workers to poll concurrently without picking
-    the same rows. Each worker claims a batch atomically.
-
-    The poll_threshold filters out automations that were recently polled,
-    ensuring fair rotation through all automations when using batching.
-
-    Args:
-        session: Database session
-        batch_size: Maximum number of automations to fetch
-        poll_threshold: Only poll automations not polled since this time
-
-    Returns:
-        List of claimed automations
-    """
-    select_query = (
-        select(Automation)
-        .where(
-            Automation.enabled.is_(True),
-            Automation.deleted_at.is_(None),
-            (Automation.last_polled_at.is_(None))
-            | (Automation.last_polled_at < poll_threshold),
-        )
-        .order_by(Automation.last_polled_at.asc().nulls_first())
-        .limit(batch_size)
-        .with_for_update(skip_locked=True)
-    )
-
-    result = await session.execute(select_query)
-    return list(result.scalars().all())
-
-
-async def poll_and_schedule(
-    session_factory: async_sessionmaker[AsyncSession],
-    batch_size: int = DEFAULT_BATCH_SIZE,
-) -> list[AutomationRun]:
-    """Poll for due automations and create pending runs atomically.
-
-    Fetches enabled automations using FOR UPDATE SKIP LOCKED for multi-worker
-    safety, updates last_polled_at for ALL fetched automations (to ensure fair
-    batch rotation), filters to those that are due, and creates PENDING runs.
-    All within a single transaction so row locks are held throughout and no
-    schedules can be lost or duplicated.
-
-    Args:
-        session_factory: SQLAlchemy async session factory
-        batch_size: Maximum number of automations to poll per batch
-
-    Returns:
-        List of AutomationRun objects created
-    """
-    now = utcnow()
-    poll_threshold = now - timedelta(seconds=POLL_INTERVAL_SECONDS)
-    created_runs: list[AutomationRun] = []
-
-    async with session_factory() as session:
-        automations = await _fetch_enabled_automations(
-            session, batch_size, poll_threshold
-        )
-
-        # Update last_polled_at for ALL fetched automations to ensure fair
-        # batch rotation. Without this, non-due automations would be re-polled
-        # every cycle, starving other automations in subsequent batches.
-        if automations:
-            automation_ids = [a.id for a in automations]
-            await session.execute(
-                update(Automation)
-                .where(Automation.id.in_(automation_ids))
-                .values(last_polled_at=now)
-            )
-            for automation in automations:
-                automation.last_polled_at = now
-
-        due_automations = [a for a in automations if is_automation_due(a, now)]
-
-        for automation in due_automations:
-            try:
-                run = await create_pending_run(session, automation)
-                created_runs.append(run)
-                logger.info(
-                    "Created pending run: run_id=%s automation_id=%s "
-                    "name=%s schedule=%s",
-                    run.id,
-                    automation.id,
-                    automation.name,
-                    automation.trigger.get("schedule"),
-                )
-            except Exception:
-                logger.exception(
-                    "Failed to create run for automation %s",
-                    automation.id,
-                )
-
-        # Always commit to release row locks from FOR UPDATE SKIP LOCKED,
-        # even if no runs were created
-        await session.commit()
-
-    return created_runs
-
-
-async def scheduler_loop(
-    session_factory: async_sessionmaker[AsyncSession],
-    interval_seconds: int = 60,
-    shutdown_event: asyncio.Event | None = None,
-    batch_size: int = DEFAULT_BATCH_SIZE,
-) -> None:
-    """Main scheduler loop that polls for due automations.
-
-    For each due automation, creates a PENDING run in the automation_runs table.
-    The dispatcher (separate process) picks up PENDING runs and executes them.
-
-    Args:
-        session_factory: SQLAlchemy async session factory
-        interval_seconds: Polling interval in seconds
-        shutdown_event: Event to signal shutdown (for graceful stop)
-        batch_size: Maximum number of automations to poll per batch
-    """
-    logger.info(
-        "Scheduler started, polling every %d seconds (batch_size=%d)",
-        interval_seconds,
-        batch_size,
-    )
-
-    while True:
-        if shutdown_event is not None and shutdown_event.is_set():
-            logger.info("Scheduler received shutdown signal, exiting")
-            break
-
-        try:
-            created_runs = await poll_and_schedule(
-                session_factory, batch_size=batch_size
-            )
-
-            if created_runs:
-                logger.info(
-                    "Found %d due automation(s) to schedule",
-                    len(created_runs),
-                )
-            else:
-                logger.debug("No automations due at this time")
-
-        except Exception:
-            logger.exception("Error in scheduler poll cycle")
-
-        if shutdown_event is not None:
-            try:
-                await asyncio.wait_for(
-                    shutdown_event.wait(),
-                    timeout=interval_seconds,
-                )
-                logger.info("Scheduler received shutdown signal, exiting")
-                break
-            except TimeoutError:
-                pass
-        else:
-            await asyncio.sleep(interval_seconds)
diff --git a/automation/temporal/__init__.py b/automation/temporal/__init__.py
new file mode 100644
index 0000000..4d17f94
--- /dev/null
+++ b/automation/temporal/__init__.py
@@ -0,0 +1,64 @@
+"""Temporal workflow execution for automations.
+
+This package provides durable workflow execution using Temporal:
+
+- activities: Activity definitions for sandbox operations (API key, sandbox
+  creation, tarball handling, entrypoint execution, cleanup)
+- workflows: AutomationWorkflow orchestrates the full automation lifecycle
+- worker: Temporal worker setup for processing tasks
+- client: Temporal client factory for connecting to the service
+- schedules: Temporal Schedule management for cron automations
+- types: Data classes for workflow inputs/outputs
+
+The main application (automation.app) uses this package to:
+1. Run a Temporal worker as a background task
+2. Create Temporal Schedules when automations are created
+3. Start workflows when automations are manually triggered
+
+To run a standalone worker:
+    python -m automation.temporal.worker
+
+Note: This __init__.py intentionally does NOT import activities, workflows,
+or worker modules at package level. Those modules import httpx and other
+libraries that conflict with Temporal's workflow sandbox import system.
+Import them directly when needed:
+    from automation.temporal.activities import ALL_ACTIVITIES
+    from automation.temporal.workflows import ALL_WORKFLOWS
+"""
+
+# Only import modules that don't have heavy dependencies (no httpx, sqlalchemy, etc.)
+# These are safe to import at package level
+from automation.temporal.client import (
+    close_temporal_client,
+    create_temporal_client,
+    get_temporal_client,
+)
+from automation.temporal.types import (
+    AutomationConfig,
+    ExecutionResult,
+    SandboxInfo,
+    TriggerContext,
+    WorkflowInput,
+    WorkflowResult,
+)
+
+# DO NOT import these at package level - they contain httpx, sqlalchemy, or
+# other imports that conflict with Temporal's workflow sandbox:
+# - activities (imports httpx)
+# - workflows (imports activities transitively via the sandbox)
+# - worker (imports both)
+# - schedules (imports automation.models which uses sqlalchemy)
+
+__all__ = [
+    # Data classes (safe - no heavy deps)
+    "AutomationConfig",
+    "TriggerContext",
+    "WorkflowInput",
+    "WorkflowResult",
+    "SandboxInfo",
+    "ExecutionResult",
+    # Client (safe - only temporalio)
+    "get_temporal_client",
+    "create_temporal_client",
+    "close_temporal_client",
+]
diff --git a/automation/temporal/activities.py b/automation/temporal/activities.py
new file mode 100644
index 0000000..841bab9
--- /dev/null
+++ b/automation/temporal/activities.py
@@ -0,0 +1,472 @@
+"""Temporal Activity definitions for automation execution.
+
+Activities are the building blocks of workflows. Each activity represents
+a single unit of work that may fail and be retried. Activities can have
+side effects (HTTP calls, database writes, etc.) unlike workflows which
+must be deterministic.
+
+Key activities:
+- get_api_key: Fetch per-user API key from OpenHands SaaS
+- create_sandbox: Create sandbox and wait until RUNNING
+- download_tarball: Download internal tarball from storage
+- upload_tarball: Upload tarball to sandbox or trigger download
+- execute_entrypoint: Start entrypoint command and wait for completion
+- cleanup_sandbox: Delete sandbox (runs even on failure)
+"""
+
+import asyncio
+import logging
+import uuid
+
+import httpx
+from temporalio import activity
+
+from automation.config import get_settings
+from automation.constants import (
+    EXTERNAL_DOWNLOAD_TIMEOUT,
+    EXTERNAL_MAX_FILESIZE,
+    SANDBOX_POLL_INTERVAL,
+    SANDBOX_READY_TIMEOUT,
+    TARBALL_PATH,
+    WORK_DIR,
+)
+from automation.temporal.types import (
+    CleanupSandboxInput,
+    CreateSandboxInput,
+    DownloadTarballInput,
+    ExecuteEntrypointInput,
+    ExecutionResult,
+    GetApiKeyInput,
+    SandboxInfo,
+    UploadTarballInput,
+)
+
+
+logger = logging.getLogger(__name__)
+
+
+# --- API Key Activity ---
+
+
+@activity.defn
+async def get_api_key(input: GetApiKeyInput) -> str:
+    """Fetch a per-user API key from the OpenHands SaaS service.
+
+    This creates a temporary API key for the user/org that can be used
+    to authenticate sandbox operations.
+
+    Raises:
+        Exception: If the API key cannot be retrieved.
+    """
+    settings = get_settings()
+
+    url = (
+        f"{settings.openhands_api_base_url}/api/service/users/{input.user_id}"
+        f"/orgs/{input.org_id}/api-keys"
+    )
+
+    headers = {
+        "X-Service-API-Key": settings.service_key,
+        "Content-Type": "application/json",
+    }
+
+    payload = {"name": "automation"}
+
+    logger.info(
+        "Fetching API key for user=%s org=%s run=%s",
+        input.user_id,
+        input.org_id,
+        input.run_id,
+    )
+
+    async with httpx.AsyncClient(timeout=30.0) as client:
+        response = await client.post(url, headers=headers, json=payload)
+        response.raise_for_status()
+
+        data = response.json()
+        api_key = data.get("key")
+
+        if not api_key:
+            raise ValueError(f"API key not found in response: {list(data.keys())}")
+
+        logger.info("API key created for run=%s", input.run_id)
+        return api_key
+
+
+# --- Sandbox Creation Activity ---
+
+
+def _find_agent_server_url(sandbox: dict) -> tuple[str, str] | None:
+    """Extract agent server URL and session key from sandbox response."""
+    for url_info in sandbox.get("exposed_urls") or []:
+        if url_info.get("name") == "AGENT_SERVER":
+            return url_info["url"].rstrip("/"), sandbox.get("session_api_key", "")
+    return None
+
+
+@activity.defn
+async def create_sandbox(input: CreateSandboxInput) -> SandboxInfo:
+    """Create a sandbox and wait until it's RUNNING.
+
+    This activity polls the sandbox status until it becomes RUNNING,
+    then returns the sandbox info including agent URL and session key.
+
+    Heartbeats during polling to let Temporal know we're still alive.
+
+    Raises:
+        TimeoutError: If sandbox doesn't become ready in time.
+        RuntimeError: If sandbox enters ERROR or MISSING state.
+    """
+    api_url = input.api_url.rstrip("/")
+    headers = {"Authorization": f"Bearer {input.api_key}"}
+
+    logger.info("Creating sandbox for run=%s", input.run_id)
+
+    async with httpx.AsyncClient(timeout=60.0) as client:
+        # Create sandbox
+        resp = await client.post(f"{api_url}/api/v1/sandboxes", headers=headers)
+        resp.raise_for_status()
+        sandbox_id = resp.json()["id"]
+
+        logger.info("Sandbox created: sandbox_id=%s run=%s", sandbox_id, input.run_id)
+
+        # Poll until RUNNING
+        elapsed = 0.0
+        while elapsed < SANDBOX_READY_TIMEOUT:
+            # Heartbeat to Temporal so it knows we're still working
+            activity.heartbeat(f"Waiting for sandbox {sandbox_id}: {elapsed:.0f}s")
+
+            resp = await client.get(
+                f"{api_url}/api/v1/sandboxes",
+                params={"id": sandbox_id},
+                headers=headers,
+            )
+            resp.raise_for_status()
+            items = resp.json()
+
+            if not items:
+                raise RuntimeError(f"Sandbox {sandbox_id} disappeared")
+
+            sandbox = items[0]
+            status = sandbox.get("status", "UNKNOWN")
+
+            if status == "RUNNING":
+                result = _find_agent_server_url(sandbox)
+                if result is None:
+                    raise RuntimeError(f"No AGENT_SERVER URL in sandbox {sandbox_id}")
+
+                agent_url, session_key = result
+                logger.info(
+                    "Sandbox ready: sandbox_id=%s agent_url=%s run=%s",
+                    sandbox_id,
+                    agent_url,
+                    input.run_id,
+                )
+                return SandboxInfo(
+                    sandbox_id=sandbox_id,
+                    agent_url=agent_url,
+                    session_key=session_key,
+                    api_key=input.api_key,
+                )
+
+            if status in ("ERROR", "MISSING"):
+                error_code = sandbox.get("error_code", "")
+                error_message = sandbox.get("error_message", "")
+                error_detail = f"status={status}"
+                if error_code:
+                    error_detail += f", error_code={error_code}"
+                if error_message:
+                    error_detail += f", error_message={error_message}"
+                raise RuntimeError(f"Sandbox {sandbox_id} failed: {error_detail}")
+
+            await asyncio.sleep(SANDBOX_POLL_INTERVAL)
+            elapsed += SANDBOX_POLL_INTERVAL
+
+        raise TimeoutError(
+            f"Sandbox {sandbox_id} not ready after {SANDBOX_READY_TIMEOUT}s"
+        )
+
+
+# --- Tarball Activities ---
+
+
+@activity.defn
+async def download_tarball(input: DownloadTarballInput) -> bytes:
+    """Download an internal tarball from storage.
+
+    Internal tarballs are stored in GCS/S3 and referenced by upload ID.
+    This activity downloads the tarball content as bytes.
+
+    Raises:
+        ValueError: If the tarball upload record doesn't exist.
+    """
+    from sqlalchemy import select
+
+    from automation.db import create_engine, create_session_factory
+    from automation.models import TarballUpload
+    from automation.storage import get_file_store
+
+    logger.info("Downloading internal tarball: upload_id=%s", input.upload_id)
+
+    settings = get_settings()
+    engine_result = await create_engine(settings)
+    session_factory = create_session_factory(engine_result.engine)
+
+    try:
+        async with session_factory() as session:
+            result = await session.execute(
+                select(TarballUpload).where(
+                    TarballUpload.id == uuid.UUID(input.upload_id)
+                )
+            )
+            upload = result.scalars().first()
+
+            if upload is None:
+                raise ValueError(
+                    f"Internal tarball upload not found: {input.upload_id}"
+                )
+
+            store = get_file_store()
+            data = store.read(upload.storage_path)
+            logger.info("Downloaded tarball: %d bytes, run=%s", len(data), input.run_id)
+            return data
+    finally:
+        await engine_result.dispose()
+
+
+@activity.defn
+async def upload_tarball(input: UploadTarballInput) -> None:
+    """Upload tarball to sandbox or trigger download inside sandbox.
+
+    For internal tarballs (tarball_data set): uploads bytes to sandbox.
+    For external tarballs (tarball_url set): runs curl inside sandbox.
+
+    Raises:
+        RuntimeError: If upload/download fails.
+    """
+    sandbox = input.sandbox_info
+    logger.info(
+        "Uploading tarball to sandbox: sandbox_id=%s run=%s",
+        sandbox.sandbox_id,
+        input.run_id,
+    )
+
+    async with httpx.AsyncClient(timeout=120.0) as client:
+        if input.tarball_data is not None:
+            # Upload bytes to sandbox
+            resp = await client.post(
+                f"{sandbox.agent_url}/api/file/upload/{TARBALL_PATH}",
+                files={"file": ("upload", input.tarball_data)},
+                headers={"X-Session-API-Key": sandbox.session_key},
+            )
+            resp.raise_for_status()
+            logger.info(
+                "Tarball uploaded: %d bytes to %s",
+                len(input.tarball_data),
+                TARBALL_PATH,
+            )
+
+        elif input.tarball_url is not None:
+            # Download inside sandbox using curl
+            curl_cmd = (
+                f"curl -fsSL --max-filesize {EXTERNAL_MAX_FILESIZE} "
+                f"-o {TARBALL_PATH} '{input.tarball_url}'"
+            )
+            resp = await client.post(
+                f"{sandbox.agent_url}/api/bash/execute_bash_command",
+                json={"command": curl_cmd, "timeout": EXTERNAL_DOWNLOAD_TIMEOUT},
+                headers={"X-Session-API-Key": sandbox.session_key},
+                timeout=httpx.Timeout(EXTERNAL_DOWNLOAD_TIMEOUT + 30),
+            )
+            resp.raise_for_status()
+            result = resp.json()
+
+            if result.get("exit_code") != 0:
+                stderr = result.get("stderr", "")
+                raise RuntimeError(f"Failed to download tarball: {stderr}")
+
+            logger.info("Tarball downloaded in sandbox from URL")
+
+        else:
+            raise ValueError("Either tarball_data or tarball_url must be provided")
+
+
+# --- Entrypoint Execution Activity ---
+
+
+def _shell_quote(s: str) -> str:
+    """Single-quote a string for safe shell interpolation."""
+    return "'" + s.replace("'", "'\\''") + "'"
+
+
+@activity.defn
+async def execute_entrypoint(input: ExecuteEntrypointInput) -> ExecutionResult:
+    """Execute the automation entrypoint in the sandbox.
+
+    Extracts the tarball, runs setup.sh if present, exports env vars,
+    and runs the entrypoint command. Waits for completion and returns
+    the result.
+
+    Heartbeats periodically while waiting for completion.
+
+    Returns:
+        ExecutionResult with success status, exit code, and output.
+    """
+    sandbox = input.sandbox_info
+
+    logger.info(
+        "Executing entrypoint: %s in sandbox=%s run=%s",
+        input.entrypoint,
+        sandbox.sandbox_id,
+        input.run_id,
+    )
+
+    # Build env var exports
+    exports = ""
+    if input.env_vars:
+        parts = [f"export {k}={_shell_quote(v)}" for k, v in input.env_vars.items()]
+        exports = " && ".join(parts) + " && "
+
+    # Build full command
+    cmd = (
+        f"mkdir -p {WORK_DIR}"
+        f" && tar xzf {TARBALL_PATH} -C {WORK_DIR}"
+        f" && cd {WORK_DIR}"
+        f" && ([ ! -f setup.sh ] || bash setup.sh)"
+        f" && {exports}{input.entrypoint}"
+    )
+
+    async with httpx.AsyncClient(timeout=input.timeout_seconds + 60) as client:
+        # Start the command
+        resp = await client.post(
+            f"{sandbox.agent_url}/api/bash/start_bash_command",
+            json={"command": cmd, "timeout": input.timeout_seconds},
+            headers={"X-Session-API-Key": sandbox.session_key},
+            timeout=30.0,
+        )
+        resp.raise_for_status()
+        command_id = resp.json().get("id")
+
+        logger.info(
+            "Command started: command_id=%s sandbox=%s",
+            command_id,
+            sandbox.sandbox_id,
+        )
+
+        # Poll for completion
+        elapsed = 0
+        poll_interval = 5
+        while elapsed < input.timeout_seconds + 30:
+            # Heartbeat to Temporal
+            activity.heartbeat(
+                f"Waiting for command {command_id}: {elapsed}s/{input.timeout_seconds}s"
+            )
+
+            await asyncio.sleep(poll_interval)
+            elapsed += poll_interval
+
+            # Check command status
+            try:
+                resp = await client.get(
+                    f"{sandbox.agent_url}/api/bash/bash_events/search",
+                    params={
+                        "kind__eq": "BashOutput",
+                        "sort_order": "TIMESTAMP_DESC",
+                        "limit": 1,
+                    },
+                    headers={"X-Session-API-Key": sandbox.session_key},
+                    timeout=30.0,
+                )
+                resp.raise_for_status()
+                page = resp.json()
+
+                items = page.get("items", [])
+                if items:
+                    output = items[0]
+                    exit_code = output.get("exit_code")
+
+                    # exit_code is None while command is still running
+                    if exit_code is not None:
+                        success = exit_code == 0
+                        logger.info(
+                            "Command completed: exit_code=%s sandbox=%s run=%s",
+                            exit_code,
+                            sandbox.sandbox_id,
+                            input.run_id,
+                        )
+                        return ExecutionResult(
+                            success=success,
+                            exit_code=exit_code,
+                            stdout=output.get("stdout") or "",
+                            stderr=output.get("stderr") or "",
+                            error=None if success else f"exit_code={exit_code}",
+                        )
+
+            except Exception as e:
+                logger.warning("Error polling command status: %s", e)
+
+        # Timeout waiting for command
+        logger.warning(
+            "Command timed out: sandbox=%s run=%s", sandbox.sandbox_id, input.run_id
+        )
+        return ExecutionResult(
+            success=False,
+            exit_code=-1,
+            error=f"Command timed out after {input.timeout_seconds}s",
+        )
+
+
+# --- Cleanup Activity ---
+
+
+@activity.defn
+async def cleanup_sandbox(input: CleanupSandboxInput) -> bool:
+    """Delete a sandbox.
+
+    This activity is idempotent - it succeeds even if the sandbox
+    is already deleted or doesn't exist.
+
+    Returns:
+        True if sandbox was deleted, False if it didn't exist.
+    """
+    api_url = input.api_url.rstrip("/")
+
+    logger.info(
+        "Cleaning up sandbox: sandbox_id=%s run=%s", input.sandbox_id, input.run_id
+    )
+
+    try:
+        async with httpx.AsyncClient(timeout=30.0) as client:
+            resp = await client.delete(
+                f"{api_url}/api/v1/sandboxes/{input.sandbox_id}",
+                params={"sandbox_id": input.sandbox_id},
+                headers={"Authorization": f"Bearer {input.api_key}"},
+            )
+
+            if resp.status_code == 404:
+                logger.info("Sandbox already deleted: %s", input.sandbox_id)
+                return False
+
+            if resp.status_code >= 300:
+                logger.warning(
+                    "Failed to delete sandbox %s: %s", input.sandbox_id, resp.text
+                )
+                return False
+
+            logger.info("Sandbox deleted: %s", input.sandbox_id)
+            return True
+
+    except Exception as e:
+        logger.warning("Error deleting sandbox %s: %s", input.sandbox_id, e)
+        return False
+
+
+# List of all activities for worker registration
+ALL_ACTIVITIES = [
+    get_api_key,
+    create_sandbox,
+    download_tarball,
+    upload_tarball,
+    execute_entrypoint,
+    cleanup_sandbox,
+]
diff --git a/automation/temporal/client.py b/automation/temporal/client.py
new file mode 100644
index 0000000..b81c616
--- /dev/null
+++ b/automation/temporal/client.py
@@ -0,0 +1,96 @@
+"""Temporal client factory.
+
+Provides functions to create and manage Temporal clients for connecting
+to the Temporal service. Supports both self-hosted and Temporal Cloud.
+"""
+
+import logging
+
+from temporalio.client import Client
+from temporalio.service import TLSConfig
+
+from automation.config import Settings, get_settings
+
+
+logger = logging.getLogger(__name__)
+
+
+async def create_temporal_client(settings: Settings | None = None) -> Client:
+    """Create a new Temporal client.
+
+    Args:
+        settings: Application settings. If None, uses get_settings().
+
+    Returns:
+        Connected Temporal client.
+
+    Raises:
+        Exception: If connection fails.
+    """
+    if settings is None:
+        settings = get_settings()
+
+    logger.info(
+        "Connecting to Temporal at %s (namespace=%s)",
+        settings.temporal_address,
+        settings.temporal_namespace,
+    )
+
+    # Build TLS config if enabled (for Temporal Cloud)
+    tls_config: TLSConfig | bool = False
+    if settings.temporal_tls_enabled:
+        if settings.temporal_tls_cert_path and settings.temporal_tls_key_path:
+            # Load cert and key from files
+            with open(settings.temporal_tls_cert_path, "rb") as f:
+                client_cert = f.read()
+            with open(settings.temporal_tls_key_path, "rb") as f:
+                client_key = f.read()
+
+            tls_config = TLSConfig(
+                client_cert=client_cert,
+                client_private_key=client_key,
+            )
+            logger.info("Using mTLS for Temporal connection")
+        else:
+            # Use system TLS (for Temporal Cloud with API keys)
+            tls_config = True
+            logger.info("Using TLS for Temporal connection")
+
+    client = await Client.connect(
+        settings.temporal_address,
+        namespace=settings.temporal_namespace,
+        tls=tls_config,
+    )
+
+    logger.info("Connected to Temporal")
+    return client
+
+
+# Global client instance (created lazily)
+_client: Client | None = None
+
+
+async def get_temporal_client() -> Client:
+    """Get or create the global Temporal client.
+
+    This function maintains a single client instance for the application.
+    The client is created on first call and reused thereafter.
+
+    Returns:
+        Connected Temporal client.
+    """
+    global _client
+    if _client is None:
+        _client = await create_temporal_client()
+    return _client
+
+
+async def close_temporal_client() -> None:
+    """Close the global Temporal client if it exists."""
+    global _client
+    if _client is not None:
+        # The Client doesn't have a close method directly, but we should
+        # clear the reference. The underlying connection is managed by
+        # the service client which handles cleanup.
+        _client = None
+        logger.info("Temporal client reference cleared")
diff --git a/automation/temporal/schedules.py b/automation/temporal/schedules.py
new file mode 100644
index 0000000..f3c6055
--- /dev/null
+++ b/automation/temporal/schedules.py
@@ -0,0 +1,321 @@
+"""Temporal Schedule management for cron automations.
+
+Temporal Schedules are first-class citizens that replace the need for
+custom cron polling loops. This module provides functions to create,
+update, and delete schedules for automations.
+
+Each automation with a cron trigger gets a corresponding Temporal Schedule
+that starts AutomationWorkflow executions at the specified times.
+"""
+
+import logging
+import uuid
+from datetime import timedelta
+
+from temporalio.client import (
+    Client,
+    Schedule,
+    ScheduleActionStartWorkflow,
+    ScheduleOverlapPolicy,
+    SchedulePolicy,
+    ScheduleSpec,
+    ScheduleState,
+    ScheduleUpdate,
+    ScheduleUpdateInput,
+)
+
+from automation.config import get_settings
+from automation.models import Automation
+from automation.temporal.types import (
+    AutomationConfig,
+    TriggerContext,
+    WorkflowInput,
+)
+from automation.temporal.workflows import AutomationWorkflow
+
+
+logger = logging.getLogger(__name__)
+
+
+def _make_schedule_id(automation_id: uuid.UUID) -> str:
+    """Generate a Temporal schedule ID for an automation."""
+    return f"automation-{automation_id}"
+
+
+def _make_workflow_id(automation_id: uuid.UUID) -> str:
+    """Generate a workflow ID prefix for an automation's runs."""
+    return f"automation-run-{automation_id}"
+
+
+def _automation_to_config(automation: Automation) -> AutomationConfig:
+    """Convert an Automation model to AutomationConfig dataclass."""
+    from automation.constants import MAX_RUN_DURATION_SECONDS
+
+    return AutomationConfig(
+        automation_id=str(automation.id),
+        user_id=str(automation.user_id),
+        org_id=str(automation.org_id),
+        name=automation.name,
+        tarball_path=automation.tarball_path,
+        entrypoint=automation.entrypoint,
+        timeout_seconds=automation.timeout or MAX_RUN_DURATION_SECONDS,
+        trigger=automation.trigger,
+        setup_script_path=automation.setup_script_path,
+    )
+
+
+async def create_schedule(
+    client: Client,
+    automation: Automation,
+) -> str:
+    """Create a Temporal Schedule for an automation.
+
+    Args:
+        client: Temporal client.
+        automation: The automation to schedule.
+
+    Returns:
+        The schedule ID.
+
+    Raises:
+        ValueError: If the automation doesn't have a cron trigger.
+    """
+    trigger = automation.trigger
+    if trigger.get("type") != "cron":
+        raise ValueError(f"Unsupported trigger type: {trigger.get('type')}")
+
+    cron_expression = trigger.get("schedule")
+    if not cron_expression:
+        raise ValueError("Cron trigger missing 'schedule' field")
+
+    timezone = trigger.get("timezone", "UTC")
+    schedule_id = _make_schedule_id(automation.id)
+    settings = get_settings()
+
+    # Build workflow input
+    automation_config = _automation_to_config(automation)
+    trigger_context = TriggerContext(
+        trigger_type="cron",
+        # scheduled_time will be filled by Temporal at runtime
+    )
+
+    # Note: run_id will be generated per execution using workflow ID
+    # The actual WorkflowInput is built at schedule execution time
+    # For now, we use a placeholder that will be replaced
+
+    logger.info(
+        "Creating schedule for automation: schedule_id=%s cron=%s timezone=%s",
+        schedule_id,
+        cron_expression,
+        timezone,
+    )
+
+    # Create the schedule
+    await client.create_schedule(
+        schedule_id,
+        Schedule(
+            action=ScheduleActionStartWorkflow(
+                AutomationWorkflow.run,
+                args=[
+                    WorkflowInput(
+                        automation=automation_config,
+                        trigger_context=trigger_context,
+                        run_id="",  # Will be set by workflow ID
+                        callback_url=f"{settings.resolved_base_url}/v1/runs/{{workflow_id}}/complete",
+                    )
+                ],
+                id=_make_workflow_id(automation.id),
+                task_queue=settings.temporal_task_queue,
+            ),
+            spec=ScheduleSpec(
+                cron_expressions=[cron_expression],
+                time_zone_name=timezone,
+            ),
+            policy=SchedulePolicy(
+                overlap=ScheduleOverlapPolicy.SKIP,  # Skip if previous run still active
+                catchup_window=timedelta(
+                    minutes=5
+                ),  # Catch up missed runs within 5 min
+            ),
+            state=ScheduleState(
+                paused=not automation.enabled,
+            ),
+        ),
+    )
+
+    logger.info("Schedule created: %s", schedule_id)
+    return schedule_id
+
+
+async def update_schedule(
+    client: Client,
+    automation: Automation,
+) -> None:
+    """Update an existing Temporal Schedule.
+
+    Updates the schedule's cron expression, timezone, and enabled state.
+
+    Args:
+        client: Temporal client.
+        automation: The automation with updated configuration.
+    """
+    schedule_id = _make_schedule_id(automation.id)
+    trigger = automation.trigger
+
+    if trigger.get("type") != "cron":
+        # If trigger type changed, delete the schedule
+        await delete_schedule(client, automation.id)
+        return
+
+    cron_expression = trigger.get("schedule")
+    timezone = trigger.get("timezone", "UTC")
+    settings = get_settings()
+
+    logger.info(
+        "Updating schedule: schedule_id=%s cron=%s timezone=%s enabled=%s",
+        schedule_id,
+        cron_expression,
+        timezone,
+        automation.enabled,
+    )
+
+    handle = client.get_schedule_handle(schedule_id)
+
+    # Update the schedule
+    automation_config = _automation_to_config(automation)
+    trigger_context = TriggerContext(trigger_type="cron")
+
+    async def update_fn(input: ScheduleUpdateInput) -> ScheduleUpdate:
+        schedule = input.description.schedule
+        schedule.action = ScheduleActionStartWorkflow(
+            AutomationWorkflow.run,
+            args=[
+                WorkflowInput(
+                    automation=automation_config,
+                    trigger_context=trigger_context,
+                    run_id="",
+                    callback_url=f"{settings.resolved_base_url}/v1/runs/{{workflow_id}}/complete",
+                )
+            ],
+            id=_make_workflow_id(automation.id),
+            task_queue=settings.temporal_task_queue,
+        )
+        schedule.spec = ScheduleSpec(
+            cron_expressions=[cron_expression] if cron_expression else [],
+            time_zone_name=timezone,
+        )
+        schedule.state.paused = not automation.enabled
+        return ScheduleUpdate(schedule=schedule)
+
+    await handle.update(update_fn)
+    logger.info("Schedule updated: %s", schedule_id)
+
+
+async def delete_schedule(
+    client: Client,
+    automation_id: uuid.UUID,
+) -> bool:
+    """Delete a Temporal Schedule.
+
+    Args:
+        client: Temporal client.
+        automation_id: The automation ID.
+
+    Returns:
+        True if the schedule was deleted, False if it didn't exist.
+    """
+    schedule_id = _make_schedule_id(automation_id)
+
+    logger.info("Deleting schedule: %s", schedule_id)
+
+    try:
+        handle = client.get_schedule_handle(schedule_id)
+        await handle.delete()
+        logger.info("Schedule deleted: %s", schedule_id)
+        return True
+    except Exception as e:
+        # Schedule might not exist
+        logger.warning("Failed to delete schedule %s: %s", schedule_id, e)
+        return False
+
+
+async def pause_schedule(
+    client: Client,
+    automation_id: uuid.UUID,
+) -> None:
+    """Pause a Temporal Schedule.
+
+    Args:
+        client: Temporal client.
+        automation_id: The automation ID.
+    """
+    schedule_id = _make_schedule_id(automation_id)
+    handle = client.get_schedule_handle(schedule_id)
+    await handle.pause(note="Automation disabled")
+    logger.info("Schedule paused: %s", schedule_id)
+
+
+async def unpause_schedule(
+    client: Client,
+    automation_id: uuid.UUID,
+) -> None:
+    """Unpause a Temporal Schedule.
+
+    Args:
+        client: Temporal client.
+        automation_id: The automation ID.
+    """
+    schedule_id = _make_schedule_id(automation_id)
+    handle = client.get_schedule_handle(schedule_id)
+    await handle.unpause(note="Automation enabled")
+    logger.info("Schedule unpaused: %s", schedule_id)
+
+
+async def trigger_schedule(
+    client: Client,
+    automation_id: uuid.UUID,
+) -> None:
+    """Manually trigger a schedule (run immediately).
+
+    Args:
+        client: Temporal client.
+        automation_id: The automation ID.
+    """
+    schedule_id = _make_schedule_id(automation_id)
+    handle = client.get_schedule_handle(schedule_id)
+    await handle.trigger()
+    logger.info("Schedule triggered manually: %s", schedule_id)
+
+
+async def get_schedule_info(
+    client: Client,
+    automation_id: uuid.UUID,
+) -> dict | None:
+    """Get information about a schedule.
+
+    Args:
+        client: Temporal client.
+        automation_id: The automation ID.
+
+    Returns:
+        Schedule info dict, or None if schedule doesn't exist.
+    """
+    schedule_id = _make_schedule_id(automation_id)
+
+    try:
+        handle = client.get_schedule_handle(schedule_id)
+        desc = await handle.describe()
+        return {
+            "schedule_id": schedule_id,
+            "paused": desc.schedule.state.paused,
+            "num_actions": desc.info.num_actions,
+            "last_action_time": desc.info.recent_actions[-1].scheduled_at
+            if desc.info.recent_actions
+            else None,
+            "next_action_times": [
+                t.isoformat() for t in (desc.info.next_action_times or [])[:3]
+            ],
+        }
+    except Exception as e:
+        logger.warning("Failed to get schedule info for %s: %s", schedule_id, e)
+        return None
diff --git a/automation/temporal/types.py b/automation/temporal/types.py
new file mode 100644
index 0000000..9993ee7
--- /dev/null
+++ b/automation/temporal/types.py
@@ -0,0 +1,137 @@
+"""Data classes for Temporal workflow inputs and outputs.
+
+These are serializable data classes used to pass data between workflows
+and activities. They must be JSON-serializable for Temporal's data converter.
+"""
+
+from dataclasses import dataclass, field
+
+
+@dataclass(frozen=True)
+class AutomationConfig:
+    """Configuration for an automation run, passed as workflow input."""
+
+    automation_id: str
+    user_id: str
+    org_id: str
+    name: str
+    tarball_path: str
+    entrypoint: str
+    timeout_seconds: int
+    trigger: dict = field(default_factory=dict)
+    setup_script_path: str | None = None
+
+
+@dataclass(frozen=True)
+class TriggerContext:
+    """Context about what triggered this automation run."""
+
+    trigger_type: str  # "cron", "manual", "webhook"
+    scheduled_time: str | None = None  # ISO format for cron triggers
+    triggered_by: str | None = None  # user_id for manual triggers
+
+
+@dataclass(frozen=True)
+class WorkflowInput:
+    """Input to the AutomationWorkflow."""
+
+    automation: AutomationConfig
+    trigger_context: TriggerContext
+    run_id: str  # Database run ID for status tracking
+    callback_url: str | None = None  # URL for SDK to POST completion status
+
+
+@dataclass(frozen=True)
+class SandboxInfo:
+    """Information about a created sandbox."""
+
+    sandbox_id: str
+    agent_url: str
+    session_key: str
+    api_key: str  # The per-user API key used to create the sandbox
+
+
+@dataclass(frozen=True)
+class ExecutionResult:
+    """Result of executing the entrypoint in the sandbox."""
+
+    success: bool
+    exit_code: int | None = None
+    stdout: str = ""
+    stderr: str = ""
+    error: str | None = None
+    conversation_id: str | None = None
+
+
+@dataclass(frozen=True)
+class WorkflowResult:
+    """Final result of the AutomationWorkflow."""
+
+    success: bool
+    run_id: str
+    sandbox_id: str | None = None
+    exit_code: int | None = None
+    error: str | None = None
+    conversation_id: str | None = None
+    started_at: str | None = None  # ISO format
+    completed_at: str | None = None  # ISO format
+
+
+# Activity input/output types
+
+
+@dataclass(frozen=True)
+class GetApiKeyInput:
+    """Input for get_api_key activity."""
+
+    user_id: str
+    org_id: str
+    run_id: str
+
+
+@dataclass(frozen=True)
+class CreateSandboxInput:
+    """Input for create_sandbox activity."""
+
+    api_url: str
+    api_key: str
+    run_id: str
+
+
+@dataclass(frozen=True)
+class DownloadTarballInput:
+    """Input for download_tarball activity (internal tarballs)."""
+
+    upload_id: str
+    run_id: str
+
+
+@dataclass(frozen=True)
+class UploadTarballInput:
+    """Input for upload_tarball activity."""
+
+    sandbox_info: SandboxInfo
+    tarball_data: bytes | None = None  # For internal tarballs (uploaded to sandbox)
+    tarball_url: str | None = None  # For external tarballs (downloaded in sandbox)
+    run_id: str = ""
+
+
+@dataclass(frozen=True)
+class ExecuteEntrypointInput:
+    """Input for execute_entrypoint activity."""
+
+    sandbox_info: SandboxInfo
+    entrypoint: str
+    env_vars: dict = field(default_factory=dict)
+    timeout_seconds: int = 600
+    run_id: str = ""
+
+
+@dataclass(frozen=True)
+class CleanupSandboxInput:
+    """Input for cleanup_sandbox activity."""
+
+    api_url: str
+    api_key: str
+    sandbox_id: str
+    run_id: str = ""
diff --git a/automation/temporal/worker.py b/automation/temporal/worker.py
new file mode 100644
index 0000000..a2679c2
--- /dev/null
+++ b/automation/temporal/worker.py
@@ -0,0 +1,121 @@
+"""Temporal worker setup.
+
+Workers are long-running processes that poll Temporal for tasks and execute
+workflows and activities. This module provides functions to create and run
+workers.
+
+Workers can be run:
+1. In-process with the FastAPI app (for development)
+2. As separate processes/pods (for production scaling)
+"""
+
+import asyncio
+import logging
+
+from temporalio.client import Client
+from temporalio.worker import Worker
+
+from automation.config import Settings, get_settings
+from automation.temporal.activities import ALL_ACTIVITIES
+from automation.temporal.client import create_temporal_client
+from automation.temporal.workflows import ALL_WORKFLOWS
+
+
+logger = logging.getLogger(__name__)
+
+
+async def create_worker(
+    client: Client | None = None,
+    settings: Settings | None = None,
+) -> Worker:
+    """Create a Temporal worker.
+
+    Args:
+        client: Temporal client. If None, creates a new one.
+        settings: Application settings. If None, uses get_settings().
+
+    Returns:
+        Configured Temporal worker (not yet running).
+    """
+    if settings is None:
+        settings = get_settings()
+
+    if client is None:
+        client = await create_temporal_client(settings)
+
+    worker = Worker(
+        client,
+        task_queue=settings.temporal_task_queue,
+        workflows=ALL_WORKFLOWS,
+        activities=ALL_ACTIVITIES,
+    )
+
+    logger.info(
+        "Worker created for task queue '%s' with %d workflows and %d activities",
+        settings.temporal_task_queue,
+        len(ALL_WORKFLOWS),
+        len(ALL_ACTIVITIES),
+    )
+
+    return worker
+
+
+async def run_worker(
+    client: Client | None = None,
+    settings: Settings | None = None,
+    shutdown_event: asyncio.Event | None = None,
+) -> None:
+    """Run a Temporal worker until shutdown.
+
+    This is the main entry point for running a worker. It creates a worker
+    and runs it until the shutdown_event is set or the process is interrupted.
+
+    Args:
+        client: Temporal client. If None, creates a new one.
+        settings: Application settings. If None, uses get_settings().
+        shutdown_event: Event to signal graceful shutdown.
+    """
+    worker = await create_worker(client, settings)
+
+    logger.info("Starting Temporal worker")
+
+    if shutdown_event is None:
+        # Run forever
+        await worker.run()
+    else:
+        # Run until shutdown event
+        async with worker:
+            await shutdown_event.wait()
+            logger.info("Worker received shutdown signal")
+
+
+async def run_worker_standalone() -> None:
+    """Run a standalone worker (for separate worker processes).
+
+    This function is meant to be called from a __main__ block or CLI.
+    It sets up signal handlers for graceful shutdown.
+    """
+    import signal
+
+    shutdown_event = asyncio.Event()
+
+    def signal_handler():
+        logger.info("Received shutdown signal")
+        shutdown_event.set()
+
+    loop = asyncio.get_event_loop()
+    for sig in (signal.SIGINT, signal.SIGTERM):
+        loop.add_signal_handler(sig, signal_handler)
+
+    try:
+        await run_worker(shutdown_event=shutdown_event)
+    finally:
+        logger.info("Worker stopped")
+
+
+# Entry point for standalone worker
+if __name__ == "__main__":
+    from automation.logger import setup_all_loggers
+
+    setup_all_loggers()
+    asyncio.run(run_worker_standalone())
diff --git a/automation/temporal/workflows.py b/automation/temporal/workflows.py
new file mode 100644
index 0000000..986c268
--- /dev/null
+++ b/automation/temporal/workflows.py
@@ -0,0 +1,329 @@
+"""Temporal Workflow definitions for automation execution.
+
+Workflows are the core orchestration units. They coordinate activities,
+handle failures, and maintain durable state. Workflows must be deterministic
+- they cannot make HTTP calls, access databases, or use random/time directly.
+All side effects must go through activities.
+
+The AutomationWorkflow is the main workflow that:
+1. Gets a per-user API key
+2. Creates a sandbox
+3. Downloads/uploads the tarball
+4. Executes the entrypoint
+5. Cleans up the sandbox (even on failure)
+"""
+
+import json
+import logging
+from datetime import timedelta
+
+from temporalio import workflow
+from temporalio.common import RetryPolicy
+from temporalio.exceptions import ActivityError
+
+
+# Import activity stubs - these are used for type hints and to call activities
+with workflow.unsafe.imports_passed_through():
+    from automation.config import get_settings
+    from automation.temporal.types import (
+        CleanupSandboxInput,
+        CreateSandboxInput,
+        DownloadTarballInput,
+        ExecuteEntrypointInput,
+        ExecutionResult,
+        GetApiKeyInput,
+        SandboxInfo,
+        UploadTarballInput,
+        WorkflowInput,
+        WorkflowResult,
+    )
+    # Use the lightweight tarball_url module (no fastapi/sqlalchemy/httpx deps)
+    # instead of tarball_validation which has heavy dependencies
+    from automation.utils.tarball_url import (
+        is_http_url,
+        parse_internal_upload_id,
+    )
+
+
+logger = logging.getLogger(__name__)
+
+
+def _get_retry_policies() -> (
+    tuple[RetryPolicy, RetryPolicy, RetryPolicy, RetryPolicy, RetryPolicy]
+):
+    """Get retry policies based on configuration.
+
+    When AUTOMATION_FAST_FAIL=true, all policies use maximum_attempts=1
+    for faster test feedback. In production, full retry policies are used
+    for resilience against transient failures.
+    """
+    settings = get_settings()
+
+    if settings.fast_fail:
+        # Fast-fail mode: no retries for faster test feedback
+        no_retry = RetryPolicy(maximum_attempts=1)
+        return no_retry, no_retry, no_retry, no_retry, no_retry
+
+    # Production retry policies
+    api_key_policy = RetryPolicy(
+        initial_interval=timedelta(seconds=5),
+        backoff_coefficient=2.0,
+        maximum_interval=timedelta(seconds=60),
+        maximum_attempts=5,
+        non_retryable_error_types=["ValueError"],  # Invalid user/org is permanent
+    )
+
+    sandbox_policy = RetryPolicy(
+        initial_interval=timedelta(seconds=10),
+        backoff_coefficient=2.0,
+        maximum_interval=timedelta(minutes=2),
+        maximum_attempts=3,
+    )
+
+    tarball_policy = RetryPolicy(
+        initial_interval=timedelta(seconds=5),
+        backoff_coefficient=2.0,
+        maximum_interval=timedelta(seconds=60),
+        maximum_attempts=3,
+        non_retryable_error_types=["ValueError"],  # Missing tarball is permanent
+    )
+
+    # No retries for execution - if it fails, it fails
+    execution_policy = RetryPolicy(maximum_attempts=1)
+
+    cleanup_policy = RetryPolicy(
+        initial_interval=timedelta(seconds=5),
+        backoff_coefficient=2.0,
+        maximum_interval=timedelta(seconds=30),
+        maximum_attempts=3,
+    )
+
+    return api_key_policy, sandbox_policy, tarball_policy, execution_policy, cleanup_policy
+
+
+# Initialize retry policies (evaluated at module load time)
+(
+    API_KEY_RETRY_POLICY,
+    SANDBOX_RETRY_POLICY,
+    TARBALL_RETRY_POLICY,
+    EXECUTION_RETRY_POLICY,
+    CLEANUP_RETRY_POLICY,
+) = _get_retry_policies()
+
+
+@workflow.defn
+class AutomationWorkflow:
+    """Main workflow for executing an automation.
+
+    This workflow orchestrates the full lifecycle of an automation run:
+    1. Fetch per-user API key from OpenHands SaaS
+    2. Create sandbox and wait until RUNNING
+    3. Get tarball into sandbox (download internal or fetch external)
+    4. Execute entrypoint command
+    5. Clean up sandbox (always, even on failure)
+
+    The workflow is durable - if the worker crashes at any point, Temporal
+    will resume execution from the last completed activity.
+    """
+
+    @workflow.run
+    async def run(self, input: WorkflowInput) -> WorkflowResult:
+        """Execute the automation workflow."""
+        workflow.logger.info(
+            "Starting automation workflow",
+            extra={
+                "run_id": input.run_id,
+                "automation_id": input.automation.automation_id,
+                "name": input.automation.name,
+            },
+        )
+
+        settings = get_settings()
+        sandbox_info: SandboxInfo | None = None
+        api_key: str | None = None
+
+        try:
+            # 1. Get per-user API key
+            api_key = await workflow.execute_activity(
+                "get_api_key",
+                GetApiKeyInput(
+                    user_id=input.automation.user_id,
+                    org_id=input.automation.org_id,
+                    run_id=input.run_id,
+                ),
+                start_to_close_timeout=timedelta(seconds=60),
+                retry_policy=API_KEY_RETRY_POLICY,
+            )
+            # Cast to satisfy type checker - activity returns str
+            assert api_key is not None
+
+            # 2. Create sandbox
+            sandbox_info = await workflow.execute_activity(
+                "create_sandbox",
+                CreateSandboxInput(
+                    api_url=settings.openhands_api_base_url,
+                    api_key=api_key,
+                    run_id=input.run_id,
+                ),
+                start_to_close_timeout=timedelta(minutes=10),
+                heartbeat_timeout=timedelta(minutes=2),
+                retry_policy=SANDBOX_RETRY_POLICY,
+            )
+            # Cast to satisfy type checker - activity returns SandboxInfo
+            assert sandbox_info is not None
+
+            # 3. Get tarball into sandbox
+            tarball_path = input.automation.tarball_path
+
+            if is_http_url(tarball_path):
+                # External URL - download directly in sandbox
+                await workflow.execute_activity(
+                    "upload_tarball",
+                    UploadTarballInput(
+                        sandbox_info=sandbox_info,
+                        tarball_url=tarball_path,
+                        run_id=input.run_id,
+                    ),
+                    start_to_close_timeout=timedelta(minutes=5),
+                    retry_policy=TARBALL_RETRY_POLICY,
+                )
+            else:
+                # Internal tarball - download from storage, upload to sandbox
+                upload_id = parse_internal_upload_id(tarball_path)
+                if upload_id is None:
+                    raise ValueError(f"Invalid tarball_path: {tarball_path}")
+
+                tarball_data = await workflow.execute_activity(
+                    "download_tarball",
+                    DownloadTarballInput(
+                        upload_id=str(upload_id),
+                        run_id=input.run_id,
+                    ),
+                    start_to_close_timeout=timedelta(minutes=5),
+                    retry_policy=TARBALL_RETRY_POLICY,
+                )
+
+                await workflow.execute_activity(
+                    "upload_tarball",
+                    UploadTarballInput(
+                        sandbox_info=sandbox_info,
+                        tarball_data=tarball_data,
+                        run_id=input.run_id,
+                    ),
+                    start_to_close_timeout=timedelta(minutes=5),
+                    retry_policy=TARBALL_RETRY_POLICY,
+                )
+
+            # 4. Build env vars for execution
+            env_vars = {
+                "OPENHANDS_API_KEY": api_key,
+                "OPENHANDS_CLOUD_API_URL": settings.openhands_api_base_url,
+                "SANDBOX_ID": sandbox_info.sandbox_id,
+                "SESSION_API_KEY": sandbox_info.session_key,
+                "AUTOMATION_RUN_ID": input.run_id,
+            }
+
+            # Add callback URL if provided
+            if input.callback_url:
+                env_vars["AUTOMATION_CALLBACK_URL"] = input.callback_url
+
+            # Add trigger context
+            event_payload = {
+                "trigger": input.automation.trigger,
+                "automation_id": input.automation.automation_id,
+                "automation_name": input.automation.name,
+            }
+            env_vars["AUTOMATION_EVENT_PAYLOAD"] = json.dumps(event_payload)
+
+            # 5. Execute entrypoint
+            execution_result: ExecutionResult = await workflow.execute_activity(
+                "execute_entrypoint",
+                ExecuteEntrypointInput(
+                    sandbox_info=sandbox_info,
+                    entrypoint=input.automation.entrypoint,
+                    env_vars=env_vars,
+                    timeout_seconds=input.automation.timeout_seconds,
+                    run_id=input.run_id,
+                ),
+                start_to_close_timeout=timedelta(
+                    seconds=input.automation.timeout_seconds + 120
+                ),
+                heartbeat_timeout=timedelta(minutes=2),
+                retry_policy=EXECUTION_RETRY_POLICY,
+            )
+
+            workflow.logger.info(
+                "Automation completed",
+                extra={
+                    "run_id": input.run_id,
+                    "success": execution_result.success,
+                    "exit_code": execution_result.exit_code,
+                },
+            )
+
+            return WorkflowResult(
+                success=execution_result.success,
+                run_id=input.run_id,
+                sandbox_id=sandbox_info.sandbox_id,
+                exit_code=execution_result.exit_code,
+                error=execution_result.error,
+                conversation_id=execution_result.conversation_id,
+            )
+
+        except ActivityError as e:
+            workflow.logger.error(
+                "Activity failed",
+                extra={
+                    "run_id": input.run_id,
+                    "error": str(e),
+                },
+            )
+            return WorkflowResult(
+                success=False,
+                run_id=input.run_id,
+                sandbox_id=sandbox_info.sandbox_id if sandbox_info else None,
+                error=str(e),
+            )
+
+        except Exception as e:
+            workflow.logger.exception(
+                "Workflow failed",
+                extra={"run_id": input.run_id},
+            )
+            return WorkflowResult(
+                success=False,
+                run_id=input.run_id,
+                sandbox_id=sandbox_info.sandbox_id if sandbox_info else None,
+                error=str(e),
+            )
+
+        finally:
+            # 6. Always clean up sandbox
+            if sandbox_info and api_key:
+                try:
+                    await workflow.execute_activity(
+                        "cleanup_sandbox",
+                        CleanupSandboxInput(
+                            api_url=settings.openhands_api_base_url,
+                            api_key=api_key,
+                            sandbox_id=sandbox_info.sandbox_id,
+                            run_id=input.run_id,
+                        ),
+                        start_to_close_timeout=timedelta(minutes=2),
+                        retry_policy=CLEANUP_RETRY_POLICY,
+                    )
+                except Exception as cleanup_error:
+                    workflow.logger.warning(
+                        "Failed to cleanup sandbox",
+                        extra={
+                            "run_id": input.run_id,
+                            "sandbox_id": sandbox_info.sandbox_id,
+                            "error": str(cleanup_error),
+                        },
+                    )
+
+
+# List of all workflows for worker registration
+ALL_WORKFLOWS = [
+    AutomationWorkflow,
+]
diff --git a/automation/utils/__init__.py b/automation/utils/__init__.py
index c0037a0..176c2a6 100644
--- a/automation/utils/__init__.py
+++ b/automation/utils/__init__.py
@@ -1,19 +1,8 @@
 """Utility modules for the automation service."""
 
-from automation.utils.api_key import APIKeyError, get_api_key_for_automation_run
-from automation.utils.cron import (
-    get_next_fire_time,
-    get_prev_fire_time,
-    is_automation_due,
-)
 from automation.utils.time import utcnow
 
 
 __all__ = [
-    "APIKeyError",
-    "get_api_key_for_automation_run",
-    "get_next_fire_time",
-    "get_prev_fire_time",
-    "is_automation_due",
     "utcnow",
 ]
diff --git a/automation/utils/api_key.py b/automation/utils/api_key.py
deleted file mode 100644
index e7910c0..0000000
--- a/automation/utils/api_key.py
+++ /dev/null
@@ -1,98 +0,0 @@
-"""API key utilities for automation runs."""
-
-import logging
-from typing import TYPE_CHECKING
-
-import httpx
-
-from automation.config import get_settings
-
-
-if TYPE_CHECKING:
-    from automation.models import AutomationRun
-
-logger = logging.getLogger(__name__)
-
-
-class APIKeyError(Exception):
-    """Exception raised when API key retrieval fails."""
-
-    pass
-
-
-async def get_api_key_for_automation_run(run: "AutomationRun") -> str:
-    """Get an API key for executing an automation run.
-
-    Creates a temporary API key for the user/org associated with the
-    automation run by calling the OpenHands SaaS service API.
-
-    Args:
-        run: The automation run to get an API key for. Must have its
-            `automation` relationship loaded with user_id and org_id.
-
-    Returns:
-        The API key string for authenticating with OpenHands.
-
-    Raises:
-        APIKeyError: If the API key cannot be retrieved.
-        ValueError: If the run's automation relationship is not loaded.
-    """
-    if run.automation is None:
-        raise ValueError(
-            "AutomationRun.automation relationship must be loaded "
-            "to retrieve user_id and org_id"
-        )
-
-    settings = get_settings()
-    user_id = run.automation.user_id
-    org_id = run.automation.org_id
-
-    url = (
-        f"{settings.openhands_api_base_url}/api/service/users/{user_id}"
-        f"/orgs/{org_id}/api-keys"
-    )
-
-    headers = {
-        "X-Service-API-Key": settings.service_key,
-        "Content-Type": "application/json",
-    }
-
-    payload = {"name": "automation"}
-
-    try:
-        async with httpx.AsyncClient(timeout=30.0) as client:
-            response = await client.post(url, headers=headers, json=payload)
-            response.raise_for_status()
-
-            data = response.json()
-            api_key = data.get("key")
-
-            if not api_key:
-                raise APIKeyError(f"API key not found in response: {list(data.keys())}")
-
-            logger.info(
-                "Created API key for automation run %s (user=%s, org=%s)",
-                run.id,
-                user_id,
-                org_id,
-            )
-            return api_key
-
-    except httpx.HTTPStatusError as e:
-        logger.error(
-            "Failed to create API key for run %s: HTTP %s - %s",
-            run.id,
-            e.response.status_code,
-            e.response.text,
-            exc_info=True,
-        )
-        raise APIKeyError(f"HTTP {e.response.status_code}: {e.response.text}") from e
-
-    except httpx.RequestError as e:
-        logger.error(
-            "Failed to create API key for run %s: %s",
-            run.id,
-            str(e),
-            exc_info=True,
-        )
-        raise APIKeyError(f"Request failed: {str(e)}") from e
diff --git a/automation/utils/cron.py b/automation/utils/cron.py
deleted file mode 100644
index 15b846b..0000000
--- a/automation/utils/cron.py
+++ /dev/null
@@ -1,143 +0,0 @@
-"""Cron schedule utilities.
-
-Pure functions for computing cron fire times and determining if automations
-are due to execute. These functions handle timezone conversion and croniter
-interactions.
-"""
-
-from __future__ import annotations
-
-from datetime import datetime
-from typing import TYPE_CHECKING
-from zoneinfo import ZoneInfo
-
-from croniter import croniter
-
-from automation.utils.time import utcnow
-
-
-if TYPE_CHECKING:
-    from automation.models import Automation
-
-
-def get_next_fire_time(
-    cron_schedule: str,
-    timezone: str = "UTC",
-    base_time: datetime | None = None,
-) -> datetime:
-    """Calculate the next fire time for a cron schedule.
-
-    Args:
-        cron_schedule: Cron expression (e.g., '0 9 * * 5')
-        timezone: IANA timezone name (e.g., 'America/New_York')
-        base_time: Base time for calculation (defaults to now, UTC-aware)
-
-    Returns:
-        Next fire time as a UTC-aware datetime
-    """
-    if base_time is None:
-        base_time = utcnow()
-
-    tz = ZoneInfo(timezone)
-
-    # Ensure base_time is aware (treat naive as UTC for safety)
-    if base_time.tzinfo is None:
-        base_time = base_time.replace(tzinfo=ZoneInfo("UTC"))
-
-    # Convert to the target timezone, then strip tzinfo for croniter
-    base_in_tz_naive = base_time.astimezone(tz).replace(tzinfo=None)
-
-    # croniter computes the next fire time in the target timezone
-    cron = croniter(cron_schedule, base_in_tz_naive)
-    next_fire_in_tz = cron.get_next(datetime)
-
-    # Convert back to UTC-aware
-    return next_fire_in_tz.replace(tzinfo=tz).astimezone(ZoneInfo("UTC"))
-
-
-def get_prev_fire_time(
-    cron_schedule: str,
-    timezone: str = "UTC",
-    base_time: datetime | None = None,
-) -> datetime:
-    """Calculate the previous (most recent) fire time for a cron schedule.
-
-    Args:
-        cron_schedule: Cron expression (e.g., '0 9 * * 5')
-        timezone: IANA timezone name (e.g., 'America/New_York')
-        base_time: Base time for calculation (defaults to now, UTC-aware)
-
-    Returns:
-        Previous fire time as a UTC-aware datetime
-    """
-    if base_time is None:
-        base_time = utcnow()
-
-    tz = ZoneInfo(timezone)
-
-    # Ensure base_time is aware (treat naive as UTC for safety)
-    if base_time.tzinfo is None:
-        base_time = base_time.replace(tzinfo=ZoneInfo("UTC"))
-
-    # Convert to the target timezone, then strip tzinfo for croniter
-    base_in_tz_naive = base_time.astimezone(tz).replace(tzinfo=None)
-
-    # croniter computes the previous fire time in the target timezone
-    cron = croniter(cron_schedule, base_in_tz_naive)
-    prev_fire_in_tz = cron.get_prev(datetime)
-
-    # Convert back to UTC-aware
-    return prev_fire_in_tz.replace(tzinfo=tz).astimezone(ZoneInfo("UTC"))
-
-
-def is_automation_due(
-    automation: Automation,
-    now: datetime | None = None,
-) -> bool:
-    """Check if an automation is due to fire.
-
-    An automation is due if:
-    1. It's enabled and not deleted
-    2. Its next fire time (based on cron schedule) is <= now
-    3. It hasn't been triggered since its last due time
-
-    Args:
-        automation: The automation to check
-        now: Current time (defaults to now, naive UTC)
-
-    Returns:
-        True if the automation should fire
-    """
-    if now is None:
-        now = utcnow()
-
-    if not automation.enabled or automation.deleted_at is not None:
-        return False
-
-    trigger = automation.trigger
-    if trigger.get("type") != "cron":
-        return False
-
-    schedule = trigger.get("schedule")
-    if not schedule:
-        return False
-
-    timezone = trigger.get("timezone", "UTC")
-
-    # Calculate the previous fire time (most recent time the cron should have fired)
-    # in the user's configured timezone, converted back to UTC
-    prev_fire_time = get_prev_fire_time(schedule, timezone, now)
-
-    # Determine the reference time (last trigger, or creation time if never triggered)
-    if automation.last_triggered_at is None:
-        # Never triggered - use created_at as reference (no catch-up on old schedules)
-        reference_time = automation.created_at
-    else:
-        reference_time = automation.last_triggered_at
-
-    # Ensure reference_time is aware (treat naive as UTC for safety)
-    if reference_time.tzinfo is None:
-        reference_time = reference_time.replace(tzinfo=ZoneInfo("UTC"))
-
-    # Due if a scheduled fire time has passed since the reference time
-    return prev_fire_time > reference_time
diff --git a/automation/utils/run.py b/automation/utils/run.py
deleted file mode 100644
index 875143f..0000000
--- a/automation/utils/run.py
+++ /dev/null
@@ -1,235 +0,0 @@
-"""Automation run utilities."""
-
-import logging
-import uuid
-from datetime import timedelta
-
-from sqlalchemy import CursorResult, select, update
-from sqlalchemy.ext.asyncio import AsyncSession, async_sessionmaker
-
-from automation.constants import MAX_RUN_DURATION
-from automation.models import Automation, AutomationRun, AutomationRunStatus
-from automation.utils.time import utcnow
-
-
-logger = logging.getLogger(__name__)
-
-
-async def disable_automation(
-    session_factory: async_sessionmaker[AsyncSession],
-    automation_id: uuid.UUID,
-    reason: str,
-) -> bool:
-    """Disable an automation due to a permanent configuration error.
-
-    This function sets enabled=False on the automation when we detect
-    an unrecoverable error condition (e.g., tarball URL doesn't exist).
-    The automation can be re-enabled manually after fixing the configuration.
-
-    Uses optimistic locking (UPDATE WHERE enabled=True) to handle race
-    conditions when multiple runs fail simultaneously.
-
-    Args:
-        session_factory: Async session factory
-        automation_id: The automation ID to disable
-        reason: Human-readable reason for disabling (logged)
-
-    Returns:
-        True if the automation was disabled, False if not found or already disabled
-    """
-    extra = {"automation_id": str(automation_id)}
-
-    try:
-        async with session_factory() as session:
-            # Use optimistic locking: only update if currently enabled
-            result: CursorResult = await session.execute(  # type: ignore[assignment]
-                update(Automation)
-                .where(
-                    Automation.id == automation_id,
-                    Automation.enabled == True,  # noqa: E712
-                )
-                .values(enabled=False)
-            )
-
-            if result.rowcount == 0:
-                # Either not found or already disabled - check which
-                check = await session.execute(
-                    select(Automation).where(Automation.id == automation_id)
-                )
-                if check.scalars().first() is None:
-                    logger.warning("Cannot disable automation: not found", extra=extra)
-                else:
-                    logger.info("Automation already disabled", extra=extra)
-                return False
-
-            await session.commit()
-
-            logger.warning(
-                "Automation disabled due to permanent error: %s",
-                reason,
-                extra=extra,
-            )
-            return True
-
-    except Exception:
-        logger.exception("Failed to disable automation", extra=extra)
-        return False
-
-
-async def create_pending_run(
-    session: AsyncSession,
-    automation: Automation,
-) -> AutomationRun:
-    """Create a PENDING automation run for dispatch.
-
-    Also updates the automation's last_triggered_at and last_polled_at
-    timestamps. Caller is responsible for committing the transaction.
-
-    Args:
-        session: Database session
-        automation: The automation to create a run for
-
-    Returns:
-        The created AutomationRun
-    """
-    now = utcnow()
-
-    run = AutomationRun(
-        id=uuid.uuid4(),
-        automation_id=automation.id,
-        status=AutomationRunStatus.PENDING,
-    )
-    session.add(run)
-
-    await session.execute(
-        update(Automation)
-        .where(Automation.id == automation.id)
-        .values(last_triggered_at=now, last_polled_at=now)
-    )
-
-    # Update the in-memory object for consistency with the database
-    automation.last_triggered_at = now
-    automation.last_polled_at = now
-
-    return run
-
-
-async def mark_run_status(
-    session: AsyncSession,
-    run: AutomationRun,
-    status: AutomationRunStatus,
-    error_detail: str | None = None,
-    max_duration: timedelta = MAX_RUN_DURATION,
-) -> None:
-    """Update a run's status and set the appropriate timestamp.
-
-    Sets started_at + timeout_at when transitioning to RUNNING, or
-    completed_at when transitioning to COMPLETED or FAILED. Caller is
-    responsible for committing the transaction.
-
-    Args:
-        session: Database session
-        run: The run to update
-        status: The new status to set
-        error_detail: Optional error message (only used for FAILED status)
-        max_duration: Maximum run duration for computing timeout_at
-    """
-    now = utcnow()
-
-    values: dict = {"status": status}
-    if status == AutomationRunStatus.RUNNING:
-        values["started_at"] = now
-        values["timeout_at"] = now + max_duration
-        run.started_at = now
-        run.timeout_at = now + max_duration
-    elif status in (AutomationRunStatus.COMPLETED, AutomationRunStatus.FAILED):
-        values["completed_at"] = now
-        run.completed_at = now
-
-    if error_detail and status == AutomationRunStatus.FAILED:
-        values["error_detail"] = error_detail
-        run.error_detail = error_detail
-
-    await session.execute(
-        update(AutomationRun).where(AutomationRun.id == run.id).values(**values)
-    )
-
-    run.status = status
-
-
-async def update_sandbox_id(
-    session_factory: async_sessionmaker[AsyncSession],
-    run_id: uuid.UUID,
-    sandbox_id: str,
-) -> None:
-    """Store the sandbox ID on the automation run for later verification.
-
-    Args:
-        session_factory: Async session factory
-        run_id: The run ID to update
-        sandbox_id: The sandbox ID to store
-    """
-    try:
-        async with session_factory() as session:
-            await session.execute(
-                update(AutomationRun)
-                .where(AutomationRun.id == run_id)
-                .values(sandbox_id=sandbox_id)
-            )
-            await session.commit()
-    except Exception:
-        logger.exception("Failed to update sandbox_id for run %s", run_id)
-
-
-async def mark_run_terminal(
-    session_factory: async_sessionmaker[AsyncSession],
-    run: AutomationRun,
-    status: AutomationRunStatus,
-    error: str | None = None,
-) -> None:
-    """Mark a run with a terminal status (COMPLETED or FAILED) if still RUNNING.
-
-    This is a safe wrapper around mark_run_status that:
-    1. Opens a new session
-    2. Re-fetches the run to check current status
-    3. Only updates if the run is still RUNNING (avoids race conditions)
-    4. Commits and handles errors gracefully
-
-    Args:
-        session_factory: Async session factory
-        run: The run to update (used to get the ID)
-        status: The terminal status to set (COMPLETED or FAILED)
-        error: Optional error message (only used for FAILED status)
-    """
-    from sqlalchemy import select
-
-    run_id = str(run.id)
-    automation_id = str(run.automation_id) if run.automation_id else None
-    extra = {"run_id": run_id}
-    if automation_id:
-        extra["automation_id"] = automation_id
-
-    try:
-        async with session_factory() as session:
-            db_result = await session.execute(
-                select(AutomationRun).where(AutomationRun.id == run.id)
-            )
-            db_run = db_result.scalars().first()
-            if db_run and db_run.status == AutomationRunStatus.RUNNING:
-                await mark_run_status(
-                    session,
-                    db_run,
-                    status,
-                    error_detail=error,
-                )
-                await session.commit()
-                logger.info("Run marked as %s", status.value, extra=extra)
-            else:
-                logger.info(
-                    "Run not marked %s (current status: %s)",
-                    status.value,
-                    db_run.status.value if db_run else "not found",
-                    extra=extra,
-                )
-    except Exception:
-        logger.exception("Failed to mark run as %s", status.value, extra=extra)
diff --git a/automation/utils/tarball_url.py b/automation/utils/tarball_url.py
new file mode 100644
index 0000000..32fd94f
--- /dev/null
+++ b/automation/utils/tarball_url.py
@@ -0,0 +1,69 @@
+"""Lightweight URL parsing utilities for tarball paths.
+
+This module contains only pure functions with minimal dependencies,
+making it safe to import in Temporal workflows (which run in a sandbox
+that restricts certain imports like httpx, urllib.request, etc.).
+
+For validation functions that require database access, see tarball_validation.py.
+"""
+
+import re
+from uuid import UUID
+
+
+# Valid external URL schemes (must be publicly accessible)
+EXTERNAL_URL_SCHEMES = ("https://", "s3://", "gs://")
+
+# HTTP(S) URL schemes that can be downloaded with curl inside a sandbox
+HTTP_URL_SCHEMES = ("http://", "https://")
+
+# Internal URL scheme for uploaded tarballs (must match config.INTERNAL_URL_SCHEME)
+_INTERNAL_URL_SCHEME = "oh-internal"
+
+# Internal URL prefix for uploaded tarballs
+INTERNAL_URL_PREFIX = f"{_INTERNAL_URL_SCHEME}://uploads/"
+
+# Compiled regex pattern for internal URLs: oh-internal://uploads/{uuid}
+_INTERNAL_URL_PATTERN = re.compile(
+    rf"^{re.escape(_INTERNAL_URL_SCHEME)}://uploads/"
+    r"([0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12})$",
+    re.IGNORECASE,
+)
+
+
+def get_internal_url_prefix() -> str:
+    """Get the internal URL prefix (e.g., 'oh-internal://uploads/')."""
+    return INTERNAL_URL_PREFIX
+
+
+def build_internal_url(upload_id: UUID) -> str:
+    """Build an internal URL for an upload."""
+    return f"{INTERNAL_URL_PREFIX}{upload_id}"
+
+
+def parse_internal_upload_id(tarball_path: str) -> UUID | None:
+    """
+    Extract upload_id from internal URL.
+
+    Returns the UUID if the path matches the internal format,
+    or None if it's not an internal URL.
+    """
+    match = _INTERNAL_URL_PATTERN.match(tarball_path)
+    if match:
+        return UUID(match.group(1))
+    return None
+
+
+def is_internal_url(tarball_path: str) -> bool:
+    """Check if the tarball_path is an internal upload URL."""
+    return tarball_path.startswith(f"{_INTERNAL_URL_SCHEME}://")
+
+
+def is_valid_external_url(tarball_path: str) -> bool:
+    """Check if the tarball_path has a valid external URL scheme."""
+    return tarball_path.startswith(EXTERNAL_URL_SCHEMES)
+
+
+def is_http_url(tarball_path: str) -> bool:
+    """Check if the tarball_path is an HTTP(S) URL downloadable with curl."""
+    return tarball_path.startswith(HTTP_URL_SCHEMES)
diff --git a/automation/utils/tarball_validation.py b/automation/utils/tarball_validation.py
index 8a5e163..cc6813c 100644
--- a/automation/utils/tarball_validation.py
+++ b/automation/utils/tarball_validation.py
@@ -3,9 +3,11 @@
 Supports two types of tarball sources:
 1. Internal uploads: oh-internal://uploads/{uuid}
 2. External public URLs: https://, s3://, gs://
+
+This module re-exports the pure URL parsing functions from tarball_url.py
+and adds validation functions that require database access.
 """
 
-import re
 from uuid import UUID
 
 from fastapi import HTTPException, status
@@ -15,62 +17,22 @@
 from automation.config import INTERNAL_URL_SCHEME
 from automation.models import TarballUpload, UploadStatus
 
-
-# Valid external URL schemes (must be publicly accessible)
-EXTERNAL_URL_SCHEMES = ("https://", "s3://", "gs://")
-
-# HTTP(S) URL schemes that can be downloaded with curl inside a sandbox
-HTTP_URL_SCHEMES = ("http://", "https://")
-
-# Internal URL prefix for uploaded tarballs
-INTERNAL_URL_PREFIX = f"{INTERNAL_URL_SCHEME}://uploads/"
-
-# Compiled regex pattern for internal URLs: oh-internal://uploads/{uuid}
-_INTERNAL_URL_PATTERN = re.compile(
-    rf"^{re.escape(INTERNAL_URL_SCHEME)}://uploads/"
-    r"([0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12})$",
-    re.IGNORECASE,
+# Re-export pure URL parsing functions from the lightweight module.
+# These are duplicated there to allow workflow code to import them
+# without pulling in fastapi/sqlalchemy/httpx dependencies.
+from automation.utils.tarball_url import (
+    EXTERNAL_URL_SCHEMES,
+    HTTP_URL_SCHEMES,
+    INTERNAL_URL_PREFIX,
+    build_internal_url,
+    get_internal_url_prefix,
+    is_http_url,
+    is_internal_url,
+    is_valid_external_url,
+    parse_internal_upload_id,
 )
 
 
-def get_internal_url_prefix() -> str:
-    """Get the internal URL prefix (e.g., 'oh-internal://uploads/')."""
-    return INTERNAL_URL_PREFIX
-
-
-def build_internal_url(upload_id: UUID) -> str:
-    """Build an internal URL for an upload."""
-    return f"{INTERNAL_URL_PREFIX}{upload_id}"
-
-
-def parse_internal_upload_id(tarball_path: str) -> UUID | None:
-    """
-    Extract upload_id from internal URL.
-
-    Returns the UUID if the path matches the internal format,
-    or None if it's not an internal URL.
-    """
-    match = _INTERNAL_URL_PATTERN.match(tarball_path)
-    if match:
-        return UUID(match.group(1))
-    return None
-
-
-def is_internal_url(tarball_path: str) -> bool:
-    """Check if the tarball_path is an internal upload URL."""
-    return tarball_path.startswith(f"{INTERNAL_URL_SCHEME}://")
-
-
-def is_valid_external_url(tarball_path: str) -> bool:
-    """Check if the tarball_path has a valid external URL scheme."""
-    return tarball_path.startswith(EXTERNAL_URL_SCHEMES)
-
-
-def is_http_url(tarball_path: str) -> bool:
-    """Check if the tarball_path is an HTTP(S) URL downloadable with curl."""
-    return tarball_path.startswith(HTTP_URL_SCHEMES)
-
-
 async def validate_tarball_path(
     tarball_path: str,
     user_id: UUID,
diff --git a/automation/watchdog.py b/automation/watchdog.py
deleted file mode 100644
index a45596e..0000000
--- a/automation/watchdog.py
+++ /dev/null
@@ -1,321 +0,0 @@
-"""Staleness watchdog for stuck RUNNING automation runs.
-
-Periodically scans for runs stuck in RUNNING state past their pre-computed
-``timeout_at`` deadline. Before marking as FAILED, attempts to verify the
-actual run status by querying the sandbox's bash command history.
-
-The ``timeout_at`` column is set to ``started_at + max_duration`` when the
-dispatcher transitions a run to RUNNING (see ``mark_run_status``).
-"""
-
-import asyncio
-import logging
-from typing import Any
-
-from sqlalchemy import select, update
-from sqlalchemy.engine import CursorResult
-from sqlalchemy.ext.asyncio import AsyncSession, async_sessionmaker
-from sqlalchemy.orm import selectinload
-
-from automation.config import Settings
-from automation.models import AutomationRun, AutomationRunStatus
-from automation.utils.api_key import get_api_key_for_automation_run
-from automation.utils.sandbox import cleanup_sandbox, verify_run_status
-from automation.utils.time import utcnow
-
-
-logger = logging.getLogger("automation.watchdog")
-
-
-def _run_extra(
-    run_id: str | None = None,
-    sandbox_id: str | None = None,
-) -> dict[str, Any]:
-    """Build extra dict for structured logging."""
-    extra: dict[str, Any] = {}
-    if run_id:
-        extra["run_id"] = run_id
-    if sandbox_id:
-        extra["sandbox_id"] = sandbox_id
-    return extra
-
-
-async def _verify_and_mark_run(
-    session: AsyncSession,
-    run: AutomationRun,
-    settings: Settings,
-) -> bool:
-    """Verify run status via sandbox and mark accordingly.
-
-    Attempts to connect to the sandbox and check the last bash command's exit code.
-    If verification succeeds, marks the run based on the actual result.
-    If verification fails (sandbox unavailable), marks as FAILED with timeout error.
-
-    Returns True if the run was marked with a terminal status.
-    """
-    run_id = str(run.id)
-    sandbox_id = run.sandbox_id
-    extra = _run_extra(run_id=run_id, sandbox_id=sandbox_id)
-    now = utcnow()
-
-    # If no sandbox_id, we can't verify - mark as failed
-    if not sandbox_id:
-        logger.warning("No sandbox_id for stale run, marking FAILED", extra=extra)
-        stmt = (
-            update(AutomationRun)
-            .where(
-                AutomationRun.id == run.id,
-                AutomationRun.status == AutomationRunStatus.RUNNING,
-            )
-            .values(
-                status=AutomationRunStatus.FAILED,
-                completed_at=now,
-                error_detail="Timed out: no sandbox_id available for verification",
-            )
-        )
-        result: CursorResult = await session.execute(stmt)  # type: ignore[assignment]
-        return result.rowcount > 0
-
-    # Get API key for sandbox access
-    try:
-        api_key = await get_api_key_for_automation_run(run)
-    except Exception as e:
-        logger.warning("Failed to get API key for verification: %s", e, extra=extra)
-        stmt = (
-            update(AutomationRun)
-            .where(
-                AutomationRun.id == run.id,
-                AutomationRun.status == AutomationRunStatus.RUNNING,
-            )
-            .values(
-                status=AutomationRunStatus.FAILED,
-                completed_at=now,
-                error_detail=f"Timed out: could not get API key for verification: {e}",
-            )
-        )
-        result = await session.execute(stmt)  # type: ignore[assignment]
-        return result.rowcount > 0
-
-    # Try to verify via sandbox
-    verification = await verify_run_status(
-        api_url=settings.openhands_api_base_url,
-        api_key=api_key,
-        sandbox_id=sandbox_id,
-        keep_alive=run.keep_alive,
-        run_id=run_id,
-    )
-
-    if verification.verified:
-        exit_code = verification.exit_code
-
-        # exit_code == 0: Command completed successfully, we just missed the callback
-        if exit_code == 0:
-            logger.info(
-                "Verified run completed successfully (exit_code=%s), "
-                "callback was missed",
-                exit_code,
-                extra=extra,
-            )
-            stmt = (
-                update(AutomationRun)
-                .where(
-                    AutomationRun.id == run.id,
-                    AutomationRun.status == AutomationRunStatus.RUNNING,
-                )
-                .values(
-                    status=AutomationRunStatus.COMPLETED,
-                    completed_at=now,
-                )
-            )
-
-        # exit_code == -1 or None: Command was killed/timed out by bash service
-        elif exit_code is None or exit_code == -1:
-            error_msg = "command timed out or was killed"
-            if verification.stderr:
-                error_msg += f"\nstderr: {verification.stderr[-1000:]}"
-
-            logger.warning(
-                "Run timed out (exit_code=%s)",
-                exit_code,
-                extra=extra,
-            )
-            stmt = (
-                update(AutomationRun)
-                .where(
-                    AutomationRun.id == run.id,
-                    AutomationRun.status == AutomationRunStatus.RUNNING,
-                )
-                .values(
-                    status=AutomationRunStatus.FAILED,
-                    completed_at=now,
-                    error_detail=f"Timed out: {error_msg}",
-                )
-            )
-
-        # Any other exit code: Command failed with an actual error
-        else:
-            error_parts = [f"exit_code={exit_code}"]
-            if verification.stderr:
-                error_parts.append(f"stderr: {verification.stderr[-1000:]}")
-            if verification.stdout:
-                error_parts.append(f"stdout: {verification.stdout[-500:]}")
-            error_detail = "\n".join(error_parts)
-
-            logger.warning(
-                "Verified run failed (exit_code=%s)",
-                exit_code,
-                extra=extra,
-            )
-            stmt = (
-                update(AutomationRun)
-                .where(
-                    AutomationRun.id == run.id,
-                    AutomationRun.status == AutomationRunStatus.RUNNING,
-                )
-                .values(
-                    status=AutomationRunStatus.FAILED,
-                    completed_at=now,
-                    error_detail=error_detail,
-                )
-            )
-
-        result = await session.execute(stmt)  # type: ignore[assignment]
-        return result.rowcount > 0
-
-    # Verification failed - sandbox not available or command still running
-    # This likely means the sandbox crashed or was cleaned up
-    logger.warning(
-        "Could not verify run status: %s, marking as timed out",
-        verification.error,
-        extra=extra,
-    )
-
-    # Clean up sandbox if not keep_alive (best effort, may already be gone)
-    if not run.keep_alive and sandbox_id:
-        await cleanup_sandbox(
-            api_url=settings.openhands_api_base_url,
-            api_key=api_key,
-            sandbox_id=sandbox_id,
-            run_id=run_id,
-        )
-
-    error_msg = verification.error or "no completion callback received"
-
-    logger.warning(
-        "Marking run as timed out: run_id=%s, sandbox_id=%s, timeout_at=%s, reason=%s",
-        run_id,
-        sandbox_id,
-        run.timeout_at,
-        error_msg,
-        extra=extra,
-    )
-
-    stmt = (
-        update(AutomationRun)
-        .where(
-            AutomationRun.id == run.id,
-            AutomationRun.status == AutomationRunStatus.RUNNING,
-        )
-        .values(
-            status=AutomationRunStatus.FAILED,
-            completed_at=now,
-            error_detail=f"Timed out: {error_msg}",
-        )
-    )
-    result = await session.execute(stmt)  # type: ignore[assignment]
-    return result.rowcount > 0
-
-
-async def mark_stale_runs(
-    session_factory: async_sessionmaker[AsyncSession],
-    settings: Settings,
-) -> int:
-    """Find and process stale RUNNING runs.
-
-    A run is stale if ``timeout_at < now()`` (pre-computed at dispatch time).
-    Before marking as FAILED, attempts to verify the actual status by querying
-    the sandbox. Uses optimistic locking so concurrent callbacks win.
-
-    Returns the number of runs marked with terminal status.
-    """
-    now = utcnow()
-    marked = 0
-
-    async with session_factory() as session:
-        # Fetch stale runs with their automation relationship for API key access
-        result = await session.execute(
-            select(AutomationRun)
-            .options(selectinload(AutomationRun.automation))
-            .where(
-                AutomationRun.status == AutomationRunStatus.RUNNING,
-                AutomationRun.timeout_at.isnot(None),
-                AutomationRun.timeout_at < now,
-            )
-        )
-        stale_runs = result.scalars().all()
-
-        for run in stale_runs:
-            run_id = str(run.id)
-            extra = _run_extra(run_id=run_id, sandbox_id=run.sandbox_id)
-
-            logger.info(
-                "Processing stale run (timeout_at=%s, now=%s)",
-                run.timeout_at,
-                now,
-                extra=extra,
-            )
-
-            try:
-                if await _verify_and_mark_run(session, run, settings):
-                    marked += 1
-                else:
-                    logger.info("Run already completed, skipping", extra=extra)
-            except Exception:
-                logger.exception("Error processing stale run", extra=extra)
-
-        if marked:
-            await session.commit()
-
-    return marked
-
-
-async def watchdog_loop(
-    session_factory: async_sessionmaker[AsyncSession],
-    settings: Settings,
-    shutdown_event: asyncio.Event | None = None,
-) -> None:
-    """Main watchdog loop — scans for stale runs periodically.
-
-    Args:
-        session_factory: Async session maker for database access.
-        settings: Application settings.
-        shutdown_event: Event to signal graceful shutdown.
-    """
-    interval = settings.watchdog_interval_seconds
-
-    logger.info(
-        "Watchdog started, scanning every %ds",
-        interval,
-    )
-
-    while True:
-        if shutdown_event is not None and shutdown_event.is_set():
-            logger.info("Watchdog received shutdown signal, exiting")
-            break
-
-        try:
-            marked = await mark_stale_runs(session_factory, settings)
-            if marked:
-                logger.info("Processed %d stale run(s)", marked)
-        except Exception:
-            logger.exception("Error in watchdog scan")
-
-        if shutdown_event is not None:
-            try:
-                await asyncio.wait_for(shutdown_event.wait(), timeout=interval)
-                logger.info("Watchdog received shutdown signal, exiting")
-                break
-            except TimeoutError:
-                pass
-        else:
-            await asyncio.sleep(interval)
diff --git a/pyproject.toml b/pyproject.toml
index fa9eefe..1543074 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -25,6 +25,7 @@ dependencies = [
   "pydantic-settings>=2",
   "python-json-logger>=3",
   "sqlalchemy[asyncio]>=2",
+  "temporalio>=1.9.0",
   "tenacity>=9.1.4",
   "uvicorn[standard]>=0.30",
 ]
@@ -109,7 +110,7 @@ include = [
     "tests",
 ]
 exclude = [
-    "scripts/test_tarball",
+    "scripts",
     "automation/presets",
 ]
 venvPath = "."
diff --git a/scripts/test_sandbox.py b/scripts/test_sandbox.py
new file mode 100644
index 0000000..febe946
--- /dev/null
+++ b/scripts/test_sandbox.py
@@ -0,0 +1,61 @@
+#!/usr/bin/env python3
+"""Test that workflows pass Temporal sandbox validation.
+
+Run this locally to verify workflows before deploying:
+    uv run python scripts/test_sandbox.py
+
+This validates that:
+1. Workflow code doesn't import restricted modules (httpx, urllib.request, etc.)
+2. All activity/workflow definitions are properly structured
+3. The worker can be created without sandbox errors
+"""
+import asyncio
+import sys
+
+
+async def test_worker_sandbox():
+    """Test that workflows can be validated by the Temporal sandbox."""
+    from temporalio.worker import Worker
+    from temporalio.testing import WorkflowEnvironment
+
+    print("Starting test environment...")
+
+    # Use the local environment - this creates an in-memory Temporal server
+    env = await WorkflowEnvironment.start_local()
+
+    try:
+        # Import AFTER environment is ready
+        from automation.temporal.workflows import ALL_WORKFLOWS
+        from automation.temporal.activities import ALL_ACTIVITIES
+
+        print(f"Testing {len(ALL_WORKFLOWS)} workflows and {len(ALL_ACTIVITIES)} activities...")
+
+        # This is where sandbox validation happens
+        # If it fails, we get RuntimeError: Failed validating workflow <name>
+        worker = Worker(
+            env.client,
+            task_queue="test-queue",
+            workflows=ALL_WORKFLOWS,
+            activities=ALL_ACTIVITIES,
+        )
+
+        print("✅ Worker created successfully - workflows pass sandbox validation!")
+        print(f"   Workflows: {[w.__name__ for w in ALL_WORKFLOWS]}")
+        print(f"   Activities: {[a.__name__ for a in ALL_ACTIVITIES]}")
+        return True
+
+    except RuntimeError as e:
+        if "Failed validating workflow" in str(e):
+            print(f"❌ Sandbox validation FAILED: {e}")
+            # Print the full traceback for debugging
+            import traceback
+            traceback.print_exc()
+            return False
+        raise
+    finally:
+        await env.shutdown()
+
+
+if __name__ == "__main__":
+    success = asyncio.run(test_worker_sandbox())
+    sys.exit(0 if success else 1)
diff --git a/tests/conftest.py b/tests/conftest.py
index 71654e9..adc7a96 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -3,6 +3,7 @@
 import logging
 import os
 from collections.abc import AsyncGenerator
+from unittest.mock import AsyncMock, MagicMock
 
 import pytest
 from fastapi.testclient import TestClient
@@ -24,6 +25,7 @@
 from automation.config import Settings  # noqa: E402
 from automation.db import get_session  # noqa: E402
 from automation.models import Base  # noqa: E402
+from automation.router import get_client  # noqa: E402
 
 
 @pytest.fixture(autouse=True)
@@ -100,11 +102,44 @@ def mock_authenticated_user():
     )
 
 
+@pytest.fixture
+def mock_temporal_client():
+    """Create a mock Temporal client for testing."""
+    mock_client = MagicMock()
+    # Mock schedule operations
+    mock_client.create_schedule = AsyncMock(return_value=None)
+    mock_client.get_schedule_handle = MagicMock()
+    mock_schedule_handle = MagicMock()
+    mock_schedule_handle.delete = AsyncMock(return_value=None)
+    mock_schedule_handle.update = AsyncMock(return_value=None)
+    mock_schedule_handle.pause = AsyncMock(return_value=None)
+    mock_schedule_handle.unpause = AsyncMock(return_value=None)
+    mock_schedule_handle.trigger = AsyncMock(return_value=None)
+    mock_client.get_schedule_handle.return_value = mock_schedule_handle
+    # Mock workflow operations
+    mock_client.start_workflow = AsyncMock(
+        return_value=MagicMock(id="mock-workflow-id")
+    )
+
+    # Mock list_workflows for readiness check (returns async iterator)
+    async def mock_list_workflows(*args, **kwargs):
+        # Return empty async iterator
+        return
+        yield  # Make this a generator  # noqa: B901
+
+    mock_client.list_workflows = mock_list_workflows
+    return mock_client
+
+
 @pytest.fixture
 async def async_client(
-    async_engine, async_session_factory, async_session, mock_authenticated_user
+    async_engine,
+    async_session_factory,
+    async_session,
+    mock_authenticated_user,
+    mock_temporal_client,
 ) -> AsyncGenerator[AsyncClient, None]:
-    """Create an async test client with mocked auth and DB session."""
+    """Create an async test client with mocked auth, DB session, and Temporal client."""
 
     async def override_get_session():
         yield async_session
@@ -112,12 +147,17 @@ async def override_get_session():
     async def override_authenticate():
         return mock_authenticated_user
 
+    async def override_get_client():
+        return mock_temporal_client
+
     app.dependency_overrides[get_session] = override_get_session
     app.dependency_overrides[authenticate_request] = override_authenticate
+    app.dependency_overrides[get_client] = override_get_client
 
     # Set app.state for endpoints that access it directly (e.g., /ready)
     app.state.engine = async_engine
     app.state.session_factory = async_session_factory
+    app.state.temporal_client = mock_temporal_client
     # Create a mock http_client for tests (auth is overridden, but state must exist)
     app.state.http_client = create_http_client()
 
@@ -132,12 +172,13 @@ async def override_authenticate():
 
 
 @pytest.fixture
-def sync_client(async_engine, async_session_factory):
+def sync_client(async_engine, async_session_factory, mock_temporal_client):
     """Create a sync test client for simple endpoint tests."""
     import asyncio
 
     app.state.engine = async_engine
     app.state.session_factory = async_session_factory
+    app.state.temporal_client = mock_temporal_client
     http_client = create_http_client()
     app.state.http_client = http_client
     yield TestClient(app)
diff --git a/tests/temporal/__init__.py b/tests/temporal/__init__.py
new file mode 100644
index 0000000..dc92c4c
--- /dev/null
+++ b/tests/temporal/__init__.py
@@ -0,0 +1 @@
+"""Tests for Temporal integration."""
diff --git a/tests/temporal/test_activities.py b/tests/temporal/test_activities.py
new file mode 100644
index 0000000..f6fcda9
--- /dev/null
+++ b/tests/temporal/test_activities.py
@@ -0,0 +1,474 @@
+"""Tests for Temporal activities.
+
+Uses ActivityEnvironment to test activities in isolation without a Worker.
+"""
+
+import uuid
+from unittest.mock import AsyncMock, MagicMock, patch
+
+import httpx
+import pytest
+from temporalio.testing import ActivityEnvironment
+
+from automation.temporal.activities import (
+    cleanup_sandbox,
+    create_sandbox,
+    download_tarball,
+    execute_entrypoint,
+    get_api_key,
+    upload_tarball,
+)
+from automation.temporal.types import (
+    CleanupSandboxInput,
+    CreateSandboxInput,
+    DownloadTarballInput,
+    ExecuteEntrypointInput,
+    ExecutionResult,
+    GetApiKeyInput,
+    SandboxInfo,
+    UploadTarballInput,
+)
+
+
+class TestGetApiKeyActivity:
+    """Tests for get_api_key activity."""
+
+    @pytest.fixture
+    def activity_env(self) -> ActivityEnvironment:
+        return ActivityEnvironment()
+
+    @pytest.fixture
+    def input(self) -> GetApiKeyInput:
+        return GetApiKeyInput(
+            user_id=str(uuid.uuid4()),
+            org_id=str(uuid.uuid4()),
+            run_id="run-123",
+        )
+
+    @pytest.mark.asyncio
+    async def test_get_api_key_success(
+        self, activity_env: ActivityEnvironment, input: GetApiKeyInput
+    ):
+        """Test successful API key retrieval."""
+        mock_response = MagicMock()
+        mock_response.status_code = 200
+        mock_response.json.return_value = {"key": "sk-test-key-12345"}
+        mock_response.raise_for_status = MagicMock()
+
+        with patch("automation.temporal.activities.httpx.AsyncClient") as mock_client:
+            mock_client.return_value.__aenter__.return_value.post = AsyncMock(
+                return_value=mock_response
+            )
+
+            result = await activity_env.run(get_api_key, input)
+
+            assert result == "sk-test-key-12345"
+
+    @pytest.mark.asyncio
+    async def test_get_api_key_failure(
+        self, activity_env: ActivityEnvironment, input: GetApiKeyInput
+    ):
+        """Test API key retrieval failure."""
+        mock_response = MagicMock()
+        mock_response.status_code = 401
+        mock_response.text = "Unauthorized"
+        mock_response.raise_for_status.side_effect = httpx.HTTPStatusError(
+            "Unauthorized", request=MagicMock(), response=mock_response
+        )
+
+        with patch("automation.temporal.activities.httpx.AsyncClient") as mock_client:
+            mock_client.return_value.__aenter__.return_value.post = AsyncMock(
+                return_value=mock_response
+            )
+
+            with pytest.raises(httpx.HTTPStatusError):
+                await activity_env.run(get_api_key, input)
+
+
+class TestCreateSandboxActivity:
+    """Tests for create_sandbox activity."""
+
+    @pytest.fixture
+    def activity_env(self) -> ActivityEnvironment:
+        return ActivityEnvironment()
+
+    @pytest.fixture
+    def input(self) -> CreateSandboxInput:
+        return CreateSandboxInput(
+            api_url="https://api.example.com",
+            api_key="sk-test-key",
+            run_id="run-123",
+        )
+
+    @pytest.mark.asyncio
+    async def test_create_sandbox_success(
+        self, activity_env: ActivityEnvironment, input: CreateSandboxInput
+    ):
+        """Test successful sandbox creation."""
+        sandbox_id = "sandbox-abc123"
+
+        # Mock sandbox creation response
+        create_response = MagicMock()
+        create_response.status_code = 200
+        create_response.json.return_value = {"id": sandbox_id}
+
+        # Mock sandbox status poll response (immediately running)
+        poll_response = MagicMock()
+        poll_response.status_code = 200
+        poll_response.json.return_value = [
+            {
+                "sandbox_id": sandbox_id,
+                "status": "RUNNING",
+                "session_api_key": "session-key-xyz",
+                "exposed_urls": [
+                    {"name": "AGENT_SERVER", "url": "https://agent.example.com"}
+                ],
+            }
+        ]
+
+        with patch("automation.temporal.activities.httpx.AsyncClient") as mock_client:
+            mock_instance = mock_client.return_value.__aenter__.return_value
+            mock_instance.post = AsyncMock(return_value=create_response)
+            mock_instance.get = AsyncMock(return_value=poll_response)
+
+            result = await activity_env.run(create_sandbox, input)
+
+            assert isinstance(result, SandboxInfo)
+            assert result.sandbox_id == sandbox_id
+            assert result.agent_url == "https://agent.example.com"
+            assert result.session_key == "session-key-xyz"
+
+    @pytest.mark.asyncio
+    async def test_create_sandbox_creation_fails(
+        self, activity_env: ActivityEnvironment, input: CreateSandboxInput
+    ):
+        """Test sandbox creation failure."""
+        create_response = MagicMock()
+        create_response.status_code = 500
+        create_response.text = "Internal server error"
+        create_response.raise_for_status.side_effect = httpx.HTTPStatusError(
+            "Server error", request=MagicMock(), response=create_response
+        )
+
+        with patch("automation.temporal.activities.httpx.AsyncClient") as mock_client:
+            mock_instance = mock_client.return_value.__aenter__.return_value
+            mock_instance.post = AsyncMock(return_value=create_response)
+
+            with pytest.raises(httpx.HTTPStatusError):
+                await activity_env.run(create_sandbox, input)
+
+
+class TestDownloadTarballActivity:
+    """Tests for download_tarball activity."""
+
+    @pytest.fixture
+    def activity_env(self) -> ActivityEnvironment:
+        return ActivityEnvironment()
+
+    @pytest.fixture
+    def input(self) -> DownloadTarballInput:
+        return DownloadTarballInput(
+            upload_id="12345678-1234-1234-1234-123456789012",
+            run_id="run-123",
+        )
+
+    @pytest.mark.asyncio
+    async def test_download_tarball_success(
+        self, activity_env: ActivityEnvironment, input: DownloadTarballInput
+    ):
+        """Test successful internal tarball download."""
+        tarball_content = b"mock tarball content"
+
+        # Mock database and file store
+        mock_upload = MagicMock()
+        mock_upload.storage_path = "path/to/tarball.tar.gz"
+
+        mock_session = AsyncMock()
+        mock_result = MagicMock()
+        mock_result.scalars.return_value.first.return_value = mock_upload
+        mock_session.execute.return_value = mock_result
+        mock_session.__aenter__.return_value = mock_session
+        mock_session.__aexit__.return_value = None
+
+        mock_session_factory = MagicMock(return_value=mock_session)
+
+        mock_engine_result = MagicMock()
+        mock_engine_result.engine = MagicMock()
+        mock_engine_result.dispose = AsyncMock()
+
+        with (
+            patch(
+                "automation.db.create_engine",
+                return_value=mock_engine_result,
+            ),
+            patch(
+                "automation.db.create_session_factory",
+                return_value=mock_session_factory,
+            ),
+            patch("automation.storage.get_file_store") as mock_get_store,
+        ):
+            mock_store = MagicMock()
+            mock_store.read.return_value = tarball_content
+            mock_get_store.return_value = mock_store
+
+            result = await activity_env.run(download_tarball, input)
+
+            assert result == tarball_content
+            mock_store.read.assert_called_once_with("path/to/tarball.tar.gz")
+
+    @pytest.mark.asyncio
+    async def test_download_tarball_not_found(
+        self, activity_env: ActivityEnvironment, input: DownloadTarballInput
+    ):
+        """Test tarball download when upload record not found."""
+        # Mock database returning no result
+        mock_session = AsyncMock()
+        mock_result = MagicMock()
+        mock_result.scalars.return_value.first.return_value = None
+        mock_session.execute.return_value = mock_result
+        mock_session.__aenter__.return_value = mock_session
+        mock_session.__aexit__.return_value = None
+
+        mock_session_factory = MagicMock(return_value=mock_session)
+
+        mock_engine_result = MagicMock()
+        mock_engine_result.engine = MagicMock()
+        mock_engine_result.dispose = AsyncMock()
+
+        with (
+            patch(
+                "automation.db.create_engine",
+                return_value=mock_engine_result,
+            ),
+            patch(
+                "automation.db.create_session_factory",
+                return_value=mock_session_factory,
+            ),
+        ):
+            with pytest.raises(ValueError, match="Internal tarball upload not found"):
+                await activity_env.run(download_tarball, input)
+
+
+class TestUploadTarballActivity:
+    """Tests for upload_tarball activity."""
+
+    @pytest.fixture
+    def activity_env(self) -> ActivityEnvironment:
+        return ActivityEnvironment()
+
+    @pytest.fixture
+    def sandbox_info(self) -> SandboxInfo:
+        return SandboxInfo(
+            sandbox_id="sandbox-123",
+            agent_url="https://agent.example.com",
+            session_key="session-key",
+            api_key="sk-test-key",
+        )
+
+    @pytest.fixture
+    def input(self, sandbox_info: SandboxInfo) -> UploadTarballInput:
+        return UploadTarballInput(
+            sandbox_info=sandbox_info,
+            tarball_data=b"mock tarball content",
+            run_id="run-123",
+        )
+
+    @pytest.mark.asyncio
+    async def test_upload_tarball_with_content(
+        self, activity_env: ActivityEnvironment, input: UploadTarballInput
+    ):
+        """Test uploading tarball content to sandbox."""
+        mock_response = MagicMock()
+        mock_response.status_code = 200
+        mock_response.raise_for_status = MagicMock()
+
+        with patch("automation.temporal.activities.httpx.AsyncClient") as mock_client:
+            mock_instance = mock_client.return_value.__aenter__.return_value
+            mock_instance.post = AsyncMock(return_value=mock_response)
+
+            await activity_env.run(upload_tarball, input)
+
+            # Verify upload was called
+            mock_instance.post.assert_called()
+
+    @pytest.mark.asyncio
+    async def test_upload_tarball_external_url(
+        self, activity_env: ActivityEnvironment, sandbox_info: SandboxInfo
+    ):
+        """Test triggering external tarball download in sandbox."""
+        input = UploadTarballInput(
+            sandbox_info=sandbox_info,
+            tarball_data=None,  # External URL - no content
+            tarball_url="https://example.com/tarball.tar.gz",
+            run_id="run-123",
+        )
+
+        # Mock bash command execution for curl
+        mock_response = MagicMock()
+        mock_response.status_code = 200
+        mock_response.json.return_value = {"exit_code": 0, "stdout": "", "stderr": ""}
+        mock_response.raise_for_status = MagicMock()
+
+        with patch("automation.temporal.activities.httpx.AsyncClient") as mock_client:
+            mock_instance = mock_client.return_value.__aenter__.return_value
+            mock_instance.post = AsyncMock(return_value=mock_response)
+
+            await activity_env.run(upload_tarball, input)
+
+
+class TestExecuteEntrypointActivity:
+    """Tests for execute_entrypoint activity."""
+
+    @pytest.fixture
+    def activity_env(self) -> ActivityEnvironment:
+        return ActivityEnvironment()
+
+    @pytest.fixture
+    def sandbox_info(self) -> SandboxInfo:
+        return SandboxInfo(
+            sandbox_id="sandbox-123",
+            agent_url="https://agent.example.com",
+            session_key="session-key",
+            api_key="sk-test-key",
+        )
+
+    @pytest.fixture
+    def input(self, sandbox_info: SandboxInfo) -> ExecuteEntrypointInput:
+        return ExecuteEntrypointInput(
+            sandbox_info=sandbox_info,
+            entrypoint="python main.py",
+            env_vars={"API_KEY": "test-key"},
+            timeout_seconds=300,
+            run_id="run-123",
+        )
+
+    @pytest.mark.asyncio
+    async def test_execute_entrypoint_success(
+        self, activity_env: ActivityEnvironment, input: ExecuteEntrypointInput
+    ):
+        """Test successful entrypoint execution."""
+        # Mock bash start response
+        start_response = MagicMock()
+        start_response.status_code = 200
+        start_response.json.return_value = {"id": "cmd-123"}
+        start_response.raise_for_status = MagicMock()
+
+        # Mock bash events search - returns items array with exit_code
+        result_response = MagicMock()
+        result_response.status_code = 200
+        result_response.json.return_value = {
+            "items": [
+                {
+                    "exit_code": 0,
+                    "stdout": "Success output",
+                    "stderr": "",
+                }
+            ]
+        }
+        result_response.raise_for_status = MagicMock()
+
+        with (
+            patch("automation.temporal.activities.httpx.AsyncClient") as mock_client,
+            patch("automation.temporal.activities.asyncio.sleep", new=AsyncMock()),
+        ):
+            mock_instance = mock_client.return_value.__aenter__.return_value
+            mock_instance.post = AsyncMock(return_value=start_response)
+            mock_instance.get = AsyncMock(return_value=result_response)
+
+            result = await activity_env.run(execute_entrypoint, input)
+
+            assert isinstance(result, ExecutionResult)
+            assert result.success is True
+            assert result.exit_code == 0
+
+    @pytest.mark.asyncio
+    async def test_execute_entrypoint_failure(
+        self, activity_env: ActivityEnvironment, input: ExecuteEntrypointInput
+    ):
+        """Test failed entrypoint execution."""
+        # Mock bash start response
+        start_response = MagicMock()
+        start_response.status_code = 200
+        start_response.json.return_value = {"id": "cmd-123"}
+        start_response.raise_for_status = MagicMock()
+
+        # Mock bash events search - returns items array with exit_code
+        result_response = MagicMock()
+        result_response.status_code = 200
+        result_response.json.return_value = {
+            "items": [
+                {
+                    "exit_code": 1,
+                    "stdout": "",
+                    "stderr": "Error: something went wrong",
+                }
+            ]
+        }
+        result_response.raise_for_status = MagicMock()
+
+        with (
+            patch("automation.temporal.activities.httpx.AsyncClient") as mock_client,
+            patch("automation.temporal.activities.asyncio.sleep", new=AsyncMock()),
+        ):
+            mock_instance = mock_client.return_value.__aenter__.return_value
+            mock_instance.post = AsyncMock(return_value=start_response)
+            mock_instance.get = AsyncMock(return_value=result_response)
+
+            result = await activity_env.run(execute_entrypoint, input)
+
+            assert isinstance(result, ExecutionResult)
+            assert result.success is False
+            assert result.exit_code == 1
+
+
+class TestCleanupSandboxActivity:
+    """Tests for cleanup_sandbox activity."""
+
+    @pytest.fixture
+    def activity_env(self) -> ActivityEnvironment:
+        return ActivityEnvironment()
+
+    @pytest.fixture
+    def input(self) -> CleanupSandboxInput:
+        return CleanupSandboxInput(
+            api_url="https://api.example.com",
+            api_key="sk-test-key",
+            sandbox_id="sandbox-123",
+            run_id="run-123",
+        )
+
+    @pytest.mark.asyncio
+    async def test_cleanup_sandbox_success(
+        self, activity_env: ActivityEnvironment, input: CleanupSandboxInput
+    ):
+        """Test successful sandbox cleanup."""
+        mock_response = MagicMock()
+        mock_response.status_code = 200
+        mock_response.raise_for_status = MagicMock()
+
+        with patch("automation.temporal.activities.httpx.AsyncClient") as mock_client:
+            mock_instance = mock_client.return_value.__aenter__.return_value
+            mock_instance.delete = AsyncMock(return_value=mock_response)
+
+            await activity_env.run(cleanup_sandbox, input)
+
+            mock_instance.delete.assert_called_once()
+
+    @pytest.mark.asyncio
+    async def test_cleanup_sandbox_failure_ignored(
+        self, activity_env: ActivityEnvironment, input: CleanupSandboxInput
+    ):
+        """Test cleanup failure is handled gracefully."""
+        mock_response = MagicMock()
+        mock_response.status_code = 404
+        mock_response.text = "Not found"
+        mock_response.raise_for_status.side_effect = httpx.HTTPStatusError(
+            "Not found", request=MagicMock(), response=mock_response
+        )
+
+        with patch("automation.temporal.activities.httpx.AsyncClient") as mock_client:
+            mock_instance = mock_client.return_value.__aenter__.return_value
+            mock_instance.delete = AsyncMock(return_value=mock_response)
+
+            # Should not raise - cleanup failures are logged but not propagated
+            await activity_env.run(cleanup_sandbox, input)
diff --git a/tests/temporal/test_schedules.py b/tests/temporal/test_schedules.py
new file mode 100644
index 0000000..9468103
--- /dev/null
+++ b/tests/temporal/test_schedules.py
@@ -0,0 +1,223 @@
+"""Tests for Temporal schedule management.
+
+Tests the schedule creation, update, and deletion functions.
+"""
+
+import uuid
+from unittest.mock import AsyncMock, MagicMock
+
+import pytest
+
+from automation.models import Automation
+from automation.temporal.schedules import (
+    _make_schedule_id,
+    create_schedule,
+    delete_schedule,
+    pause_schedule,
+    trigger_schedule,
+    unpause_schedule,
+    update_schedule,
+)
+
+
+def make_test_automation(
+    cron_schedule: str = "0 9 * * 1-5",
+    timezone: str = "UTC",
+    trigger_type: str = "cron",
+) -> Automation:
+    """Create a test automation with sensible defaults."""
+    automation = Automation(
+        id=uuid.uuid4(),
+        user_id=uuid.uuid4(),
+        org_id=uuid.uuid4(),
+        name="Test Automation",
+        trigger={
+            "type": trigger_type,
+            "schedule": cron_schedule,
+            "timezone": timezone,
+        },
+        tarball_path="https://example.com/code.tar.gz",
+        entrypoint="python main.py",
+        timeout=300,
+        enabled=True,
+    )
+    return automation
+
+
+class TestMakeScheduleId:
+    """Tests for schedule ID generation."""
+
+    def test_schedule_id_format(self):
+        """Test schedule ID has expected format."""
+        automation_id = uuid.uuid4()
+        schedule_id = _make_schedule_id(automation_id)
+
+        assert schedule_id.startswith("automation-")
+        assert str(automation_id) in schedule_id
+
+    def test_schedule_id_deterministic(self):
+        """Test same automation ID produces same schedule ID."""
+        automation_id = uuid.uuid4()
+        id1 = _make_schedule_id(automation_id)
+        id2 = _make_schedule_id(automation_id)
+
+        assert id1 == id2
+
+
+class TestCreateSchedule:
+    """Tests for schedule creation."""
+
+    @pytest.fixture
+    def automation(self) -> Automation:
+        return make_test_automation()
+
+    @pytest.mark.asyncio
+    async def test_create_schedule_success(self, automation: Automation):
+        """Test successful schedule creation."""
+        mock_handle = MagicMock()
+
+        mock_client = AsyncMock()
+        mock_client.create_schedule = AsyncMock(return_value=mock_handle)
+
+        schedule_id = await create_schedule(mock_client, automation)
+
+        assert schedule_id is not None
+        assert str(automation.id) in schedule_id
+        mock_client.create_schedule.assert_called_once()
+
+    @pytest.mark.asyncio
+    async def test_create_schedule_with_cron(self, automation: Automation):
+        """Test schedule is created with correct cron expression."""
+        mock_handle = MagicMock()
+        mock_client = AsyncMock()
+        mock_client.create_schedule = AsyncMock(return_value=mock_handle)
+
+        await create_schedule(mock_client, automation)
+
+        # Verify the schedule was created with correct parameters
+        call_args = mock_client.create_schedule.call_args
+        assert call_args is not None
+
+    @pytest.mark.asyncio
+    async def test_create_schedule_without_cron_raises(self):
+        """Test that creating a schedule without cron raises error."""
+        automation = make_test_automation(trigger_type="manual")
+        automation.trigger = {"type": "manual"}
+
+        mock_client = AsyncMock()
+
+        with pytest.raises(ValueError, match="trigger type"):
+            await create_schedule(mock_client, automation)
+
+
+class TestUpdateSchedule:
+    """Tests for schedule updates."""
+
+    @pytest.fixture
+    def automation(self) -> Automation:
+        return make_test_automation(cron_schedule="0 10 * * 1-5")
+
+    @pytest.mark.asyncio
+    async def test_update_schedule_success(self, automation: Automation):
+        """Test successful schedule update."""
+        mock_handle = AsyncMock()
+        mock_handle.update = AsyncMock()
+
+        mock_client = AsyncMock()
+        mock_client.get_schedule_handle = MagicMock(return_value=mock_handle)
+
+        await update_schedule(mock_client, automation)
+
+        mock_client.get_schedule_handle.assert_called_once()
+        mock_handle.update.assert_called_once()
+
+
+class TestDeleteSchedule:
+    """Tests for schedule deletion."""
+
+    @pytest.mark.asyncio
+    async def test_delete_schedule_success(self):
+        """Test successful schedule deletion."""
+        automation_id = uuid.uuid4()
+
+        mock_handle = AsyncMock()
+        mock_handle.delete = AsyncMock()
+
+        mock_client = AsyncMock()
+        mock_client.get_schedule_handle = MagicMock(return_value=mock_handle)
+
+        await delete_schedule(mock_client, automation_id)
+
+        mock_client.get_schedule_handle.assert_called_once()
+        mock_handle.delete.assert_called_once()
+
+    @pytest.mark.asyncio
+    async def test_delete_schedule_not_found_ignored(self):
+        """Test delete handles not found gracefully."""
+        from temporalio.service import RPCError, RPCStatusCode
+
+        automation_id = uuid.uuid4()
+
+        mock_handle = AsyncMock()
+        mock_handle.delete = AsyncMock(
+            side_effect=RPCError("Not found", RPCStatusCode.NOT_FOUND, b"")
+        )
+
+        mock_client = AsyncMock()
+        mock_client.get_schedule_handle = MagicMock(return_value=mock_handle)
+
+        # Should not raise
+        await delete_schedule(mock_client, automation_id)
+
+
+class TestPauseUnpauseSchedule:
+    """Tests for pausing and unpausing schedules."""
+
+    @pytest.mark.asyncio
+    async def test_pause_schedule_success(self):
+        """Test successful schedule pause."""
+        automation_id = uuid.uuid4()
+
+        mock_handle = AsyncMock()
+        mock_handle.pause = AsyncMock()
+
+        mock_client = AsyncMock()
+        mock_client.get_schedule_handle = MagicMock(return_value=mock_handle)
+
+        await pause_schedule(mock_client, automation_id)
+
+        mock_handle.pause.assert_called_once()
+
+    @pytest.mark.asyncio
+    async def test_unpause_schedule_success(self):
+        """Test successful schedule unpause."""
+        automation_id = uuid.uuid4()
+
+        mock_handle = AsyncMock()
+        mock_handle.unpause = AsyncMock()
+
+        mock_client = AsyncMock()
+        mock_client.get_schedule_handle = MagicMock(return_value=mock_handle)
+
+        await unpause_schedule(mock_client, automation_id)
+
+        mock_handle.unpause.assert_called_once()
+
+
+class TestTriggerSchedule:
+    """Tests for manual schedule triggering."""
+
+    @pytest.mark.asyncio
+    async def test_trigger_schedule_success(self):
+        """Test successful manual trigger."""
+        automation_id = uuid.uuid4()
+
+        mock_handle = AsyncMock()
+        mock_handle.trigger = AsyncMock()
+
+        mock_client = AsyncMock()
+        mock_client.get_schedule_handle = MagicMock(return_value=mock_handle)
+
+        await trigger_schedule(mock_client, automation_id)
+
+        mock_handle.trigger.assert_called_once()
diff --git a/tests/temporal/test_types.py b/tests/temporal/test_types.py
new file mode 100644
index 0000000..8d7a081
--- /dev/null
+++ b/tests/temporal/test_types.py
@@ -0,0 +1,229 @@
+"""Tests for Temporal dataclasses."""
+
+import pytest
+
+from automation.temporal.types import (
+    AutomationConfig,
+    CleanupSandboxInput,
+    CreateSandboxInput,
+    ExecutionResult,
+    GetApiKeyInput,
+    SandboxInfo,
+    TriggerContext,
+    WorkflowInput,
+    WorkflowResult,
+)
+
+
+class TestAutomationConfig:
+    """Tests for AutomationConfig dataclass."""
+
+    def test_create_basic(self):
+        """Test creating a basic AutomationConfig."""
+        config = AutomationConfig(
+            automation_id="test-id",
+            user_id="user-123",
+            org_id="org-456",
+            name="Test Automation",
+            tarball_path="oh-internal://uploads/abc123",
+            entrypoint="python main.py",
+            timeout_seconds=600,
+        )
+
+        assert config.automation_id == "test-id"
+        assert config.user_id == "user-123"
+        assert config.org_id == "org-456"
+        assert config.name == "Test Automation"
+        assert config.tarball_path == "oh-internal://uploads/abc123"
+        assert config.entrypoint == "python main.py"
+        assert config.timeout_seconds == 600
+        assert config.trigger == {}
+        assert config.setup_script_path is None
+
+    def test_create_with_trigger(self):
+        """Test creating AutomationConfig with trigger."""
+        trigger = {"type": "cron", "schedule": "0 9 * * 1", "timezone": "UTC"}
+        config = AutomationConfig(
+            automation_id="test-id",
+            user_id="user-123",
+            org_id="org-456",
+            name="Test",
+            tarball_path="https://example.com/code.tar.gz",
+            entrypoint="./run.sh",
+            timeout_seconds=300,
+            trigger=trigger,
+            setup_script_path="setup.sh",
+        )
+
+        assert config.trigger == trigger
+        assert config.setup_script_path == "setup.sh"
+
+    def test_is_frozen(self):
+        """Test that AutomationConfig is immutable."""
+        config = AutomationConfig(
+            automation_id="test-id",
+            user_id="user-123",
+            org_id="org-456",
+            name="Test",
+            tarball_path="https://example.com/code.tar.gz",
+            entrypoint="./run.sh",
+            timeout_seconds=300,
+        )
+
+        with pytest.raises(AttributeError):
+            config.name = "New Name"  # type: ignore
+
+
+class TestWorkflowInput:
+    """Tests for WorkflowInput dataclass."""
+
+    def test_create(self):
+        """Test creating WorkflowInput."""
+        config = AutomationConfig(
+            automation_id="auto-1",
+            user_id="user-1",
+            org_id="org-1",
+            name="Test",
+            tarball_path="https://example.com/code.tar.gz",
+            entrypoint="python main.py",
+            timeout_seconds=600,
+        )
+        trigger_context = TriggerContext(
+            trigger_type="manual",
+            triggered_by="user-1",
+        )
+
+        input = WorkflowInput(
+            automation=config,
+            trigger_context=trigger_context,
+            run_id="run-123",
+            callback_url="https://example.com/callback",
+        )
+
+        assert input.automation == config
+        assert input.trigger_context == trigger_context
+        assert input.run_id == "run-123"
+        assert input.callback_url == "https://example.com/callback"
+
+
+class TestSandboxInfo:
+    """Tests for SandboxInfo dataclass."""
+
+    def test_create(self):
+        """Test creating SandboxInfo."""
+        info = SandboxInfo(
+            sandbox_id="sb-123",
+            agent_url="https://agent.example.com",
+            session_key="session-key-abc",
+            api_key="api-key-xyz",
+        )
+
+        assert info.sandbox_id == "sb-123"
+        assert info.agent_url == "https://agent.example.com"
+        assert info.session_key == "session-key-abc"
+        assert info.api_key == "api-key-xyz"
+
+
+class TestExecutionResult:
+    """Tests for ExecutionResult dataclass."""
+
+    def test_successful_result(self):
+        """Test creating a successful execution result."""
+        result = ExecutionResult(
+            success=True,
+            exit_code=0,
+            stdout="Hello World",
+            stderr="",
+        )
+
+        assert result.success is True
+        assert result.exit_code == 0
+        assert result.stdout == "Hello World"
+        assert result.stderr == ""
+        assert result.error is None
+
+    def test_failed_result(self):
+        """Test creating a failed execution result."""
+        result = ExecutionResult(
+            success=False,
+            exit_code=1,
+            stdout="",
+            stderr="Error: file not found",
+            error="exit_code=1",
+        )
+
+        assert result.success is False
+        assert result.exit_code == 1
+        assert result.error == "exit_code=1"
+
+
+class TestWorkflowResult:
+    """Tests for WorkflowResult dataclass."""
+
+    def test_successful_result(self):
+        """Test creating a successful workflow result."""
+        result = WorkflowResult(
+            success=True,
+            run_id="run-123",
+            sandbox_id="sb-456",
+            exit_code=0,
+            conversation_id="conv-789",
+        )
+
+        assert result.success is True
+        assert result.run_id == "run-123"
+        assert result.sandbox_id == "sb-456"
+        assert result.exit_code == 0
+        assert result.error is None
+
+    def test_failed_result(self):
+        """Test creating a failed workflow result."""
+        result = WorkflowResult(
+            success=False,
+            run_id="run-123",
+            sandbox_id="sb-456",
+            error="Sandbox creation failed",
+        )
+
+        assert result.success is False
+        assert result.error == "Sandbox creation failed"
+
+
+class TestActivityInputs:
+    """Tests for activity input dataclasses."""
+
+    def test_get_api_key_input(self):
+        """Test GetApiKeyInput."""
+        input = GetApiKeyInput(
+            user_id="user-123",
+            org_id="org-456",
+            run_id="run-789",
+        )
+
+        assert input.user_id == "user-123"
+        assert input.org_id == "org-456"
+        assert input.run_id == "run-789"
+
+    def test_create_sandbox_input(self):
+        """Test CreateSandboxInput."""
+        input = CreateSandboxInput(
+            api_url="https://api.example.com",
+            api_key="test-key",
+            run_id="run-123",
+        )
+
+        assert input.api_url == "https://api.example.com"
+        assert input.api_key == "test-key"
+        assert input.run_id == "run-123"
+
+    def test_cleanup_sandbox_input(self):
+        """Test CleanupSandboxInput."""
+        input = CleanupSandboxInput(
+            api_url="https://api.example.com",
+            api_key="test-key",
+            sandbox_id="sb-123",
+            run_id="run-456",
+        )
+
+        assert input.api_url == "https://api.example.com"
+        assert input.sandbox_id == "sb-123"
diff --git a/tests/temporal/test_workflows.py b/tests/temporal/test_workflows.py
new file mode 100644
index 0000000..bc1d8a5
--- /dev/null
+++ b/tests/temporal/test_workflows.py
@@ -0,0 +1,285 @@
+"""Tests for Temporal workflows.
+
+Uses WorkflowEnvironment with time-skipping to test workflows with mocked activities.
+
+Note: These tests require the Temporal test server which is bundled with temporalio.
+The time-skipping environment allows testing workflows with timers/delays quickly.
+"""
+
+import uuid
+
+import pytest
+from temporalio import activity
+from temporalio.testing import WorkflowEnvironment
+from temporalio.worker import Worker
+
+from automation.temporal.types import (
+    AutomationConfig,
+    CleanupSandboxInput,
+    CreateSandboxInput,
+    DownloadTarballInput,
+    ExecuteEntrypointInput,
+    ExecutionResult,
+    GetApiKeyInput,
+    SandboxInfo,
+    TriggerContext,
+    UploadTarballInput,
+    WorkflowInput,
+    WorkflowResult,
+)
+from automation.temporal.workflows import AutomationWorkflow
+
+
+# --- Mock Activities ---
+# These mocked activities simulate successful execution paths
+
+
+@activity.defn(name="get_api_key")
+async def mock_get_api_key(input: GetApiKeyInput) -> str:
+    """Mock activity that returns a test API key."""
+    return f"sk-test-{input.user_id[:8]}"
+
+
+@activity.defn(name="create_sandbox")
+async def mock_create_sandbox(input: CreateSandboxInput) -> SandboxInfo:
+    """Mock activity that creates a fake sandbox."""
+    return SandboxInfo(
+        sandbox_id=f"sandbox-{input.run_id}",
+        agent_url="https://mock-agent.example.com",
+        session_key="mock-session-key",
+        api_key=input.api_key,
+    )
+
+
+@activity.defn(name="download_tarball")
+async def mock_download_tarball(input: DownloadTarballInput) -> bytes:
+    """Mock activity that returns fake tarball content."""
+    return b"mock tarball content"
+
+
+@activity.defn(name="upload_tarball")
+async def mock_upload_tarball(input: UploadTarballInput) -> None:
+    """Mock activity that simulates tarball upload."""
+    pass
+
+
+@activity.defn(name="execute_entrypoint")
+async def mock_execute_entrypoint_success(
+    input: ExecuteEntrypointInput,
+) -> ExecutionResult:
+    """Mock activity that simulates successful execution."""
+    return ExecutionResult(
+        success=True,
+        exit_code=0,
+        stdout="Execution completed successfully",
+        stderr="",
+    )
+
+
+@activity.defn(name="cleanup_sandbox")
+async def mock_cleanup_sandbox(input: CleanupSandboxInput) -> None:
+    """Mock activity that simulates sandbox cleanup."""
+    pass
+
+
+# Mock activities for failure scenarios
+
+
+def create_failing_execute_activity():
+    """Create a mock execute activity that fails."""
+
+    @activity.defn(name="execute_entrypoint")
+    async def mock_execute_entrypoint_failure(
+        input: ExecuteEntrypointInput,
+    ) -> ExecutionResult:
+        return ExecutionResult(
+            success=False,
+            exit_code=1,
+            stdout="",
+            stderr="Error: Script failed",
+            error="Script exited with code 1",
+        )
+
+    return mock_execute_entrypoint_failure
+
+
+def create_tracking_cleanup_activity(cleanup_calls: list):
+    """Create a cleanup activity that tracks calls."""
+
+    @activity.defn(name="cleanup_sandbox")
+    async def mock_cleanup_tracking(input: CleanupSandboxInput) -> None:
+        cleanup_calls.append(input.sandbox_id)
+
+    return mock_cleanup_tracking
+
+
+# Standard set of mock activities for successful workflows
+MOCK_ACTIVITIES_SUCCESS = [
+    mock_get_api_key,
+    mock_create_sandbox,
+    mock_download_tarball,
+    mock_upload_tarball,
+    mock_execute_entrypoint_success,
+    mock_cleanup_sandbox,
+]
+
+
+def make_automation_config(
+    name: str = "Test Automation",
+    tarball_path: str = "https://example.com/code.tar.gz",
+    timeout_seconds: int = 300,
+) -> AutomationConfig:
+    """Helper to create test AutomationConfig."""
+    return AutomationConfig(
+        automation_id=str(uuid.uuid4()),
+        user_id=str(uuid.uuid4()),
+        org_id=str(uuid.uuid4()),
+        name=name,
+        tarball_path=tarball_path,
+        entrypoint="python main.py",
+        timeout_seconds=timeout_seconds,
+    )
+
+
+def make_workflow_input(
+    config: AutomationConfig | None = None,
+    trigger_type: str = "manual",
+) -> WorkflowInput:
+    """Helper to create test WorkflowInput."""
+    if config is None:
+        config = make_automation_config()
+    return WorkflowInput(
+        automation=config,
+        trigger_context=TriggerContext(trigger_type=trigger_type),
+        run_id=str(uuid.uuid4()),
+    )
+
+
+# Skip workflow tests if temporal test server is not available
+# These tests require downloading the test server on first run
+pytestmark = pytest.mark.skip(
+    reason="Workflow tests require Temporal test server - run manually with: "
+    "pytest tests/temporal/test_workflows.py --no-skip"
+)
+
+
+class TestAutomationWorkflow:
+    """Tests for AutomationWorkflow.
+
+    These tests use the Temporal time-skipping test server to run workflows
+    with mocked activities. On first run, the test server binary will be
+    downloaded automatically.
+    """
+
+    @pytest.fixture
+    def workflow_input(self) -> WorkflowInput:
+        return make_workflow_input()
+
+    @pytest.mark.asyncio
+    async def test_workflow_success(self, workflow_input: WorkflowInput):
+        """Test successful workflow execution end-to-end."""
+        async with await WorkflowEnvironment.start_time_skipping() as env:
+            async with Worker(
+                env.client,
+                task_queue="test-queue",
+                workflows=[AutomationWorkflow],
+                activities=MOCK_ACTIVITIES_SUCCESS,
+            ):
+                result = await env.client.execute_workflow(
+                    AutomationWorkflow.run,
+                    workflow_input,
+                    id=f"test-{workflow_input.run_id}",
+                    task_queue="test-queue",
+                )
+
+                assert isinstance(result, WorkflowResult)
+                assert result.success is True
+                assert result.run_id == workflow_input.run_id
+                assert result.exit_code == 0
+                assert result.error is None
+
+    @pytest.mark.asyncio
+    async def test_workflow_with_internal_tarball(self):
+        """Test workflow with internal tarball (oh-internal://)."""
+        config = make_automation_config(
+            tarball_path="oh-internal://uploads/user-123/code.tar.gz"
+        )
+        workflow_input = make_workflow_input(config=config)
+
+        async with await WorkflowEnvironment.start_time_skipping() as env:
+            async with Worker(
+                env.client,
+                task_queue="test-queue",
+                workflows=[AutomationWorkflow],
+                activities=MOCK_ACTIVITIES_SUCCESS,
+            ):
+                result = await env.client.execute_workflow(
+                    AutomationWorkflow.run,
+                    workflow_input,
+                    id=f"test-internal-{workflow_input.run_id}",
+                    task_queue="test-queue",
+                )
+
+                assert result.success is True
+
+    @pytest.mark.asyncio
+    async def test_workflow_execution_failure(self, workflow_input: WorkflowInput):
+        """Test workflow handles execution failure gracefully."""
+        activities_with_failure = [
+            mock_get_api_key,
+            mock_create_sandbox,
+            mock_download_tarball,
+            mock_upload_tarball,
+            create_failing_execute_activity(),
+            mock_cleanup_sandbox,
+        ]
+
+        async with await WorkflowEnvironment.start_time_skipping() as env:
+            async with Worker(
+                env.client,
+                task_queue="test-queue",
+                workflows=[AutomationWorkflow],
+                activities=activities_with_failure,
+            ):
+                result = await env.client.execute_workflow(
+                    AutomationWorkflow.run,
+                    workflow_input,
+                    id=f"test-failure-{workflow_input.run_id}",
+                    task_queue="test-queue",
+                )
+
+                assert result.success is False
+                assert result.exit_code == 1
+                assert result.error is not None
+
+    @pytest.mark.asyncio
+    async def test_cleanup_always_runs(self, workflow_input: WorkflowInput):
+        """Test that cleanup activity runs even when execution fails."""
+        cleanup_calls: list[str] = []
+
+        activities_with_failure_and_tracking = [
+            mock_get_api_key,
+            mock_create_sandbox,
+            mock_download_tarball,
+            mock_upload_tarball,
+            create_failing_execute_activity(),
+            create_tracking_cleanup_activity(cleanup_calls),
+        ]
+
+        async with await WorkflowEnvironment.start_time_skipping() as env:
+            async with Worker(
+                env.client,
+                task_queue="test-queue",
+                workflows=[AutomationWorkflow],
+                activities=activities_with_failure_and_tracking,
+            ):
+                result = await env.client.execute_workflow(
+                    AutomationWorkflow.run,
+                    workflow_input,
+                    id=f"test-cleanup-{workflow_input.run_id}",
+                    task_queue="test-queue",
+                )
+
+                # Execution failed but cleanup still ran
+                assert result.success is False
+                assert len(cleanup_calls) == 1
diff --git a/tests/test_auth.py b/tests/test_auth.py
index aa3e579..0244e48 100644
--- a/tests/test_auth.py
+++ b/tests/test_auth.py
@@ -149,7 +149,9 @@ class TestAuthIntegration:
     call to the OpenHands API (the external dependency).
     """
 
-    async def test_valid_key_through_api(self, async_engine, async_session_factory):
+    async def test_valid_key_through_api(
+        self, async_engine, async_session_factory, mock_temporal_client
+    ):
         """Valid API key flows through auth middleware to endpoint."""
         mock_response = MagicMock()
         mock_response.status_code = 200
@@ -165,10 +167,17 @@ async def override_get_session():
             async with async_session_factory() as session:
                 yield session
 
+        from automation.router import get_client
+
+        async def override_get_client():
+            return mock_temporal_client
+
         # Only override the DB session; auth stays real
         app.dependency_overrides[get_session] = override_get_session
+        app.dependency_overrides[get_client] = override_get_client
         app.state.engine = async_engine
         app.state.session_factory = async_session_factory
+        app.state.temporal_client = mock_temporal_client
 
         # Create a mock http_client in app.state for the DI pattern
         mock_client = AsyncMock()
@@ -192,7 +201,7 @@ async def override_get_session():
             app.dependency_overrides.clear()
 
     async def test_missing_auth_header_through_api(
-        self, async_engine, async_session_factory
+        self, async_engine, async_session_factory, mock_temporal_client
     ):
         """Request without Authorization header is rejected by real auth middleware."""
 
@@ -200,9 +209,16 @@ async def override_get_session():
             async with async_session_factory() as session:
                 yield session
 
+        from automation.router import get_client
+
+        async def override_get_client():
+            return mock_temporal_client
+
         app.dependency_overrides[get_session] = override_get_session
+        app.dependency_overrides[get_client] = override_get_client
         app.state.engine = async_engine
         app.state.session_factory = async_session_factory
+        app.state.temporal_client = mock_temporal_client
 
         # Create a mock http_client in app.state for the DI pattern
         mock_client = AsyncMock()
@@ -219,7 +235,9 @@ async def override_get_session():
         finally:
             app.dependency_overrides.clear()
 
-    async def test_invalid_key_through_api(self, async_engine, async_session_factory):
+    async def test_invalid_key_through_api(
+        self, async_engine, async_session_factory, mock_temporal_client
+    ):
         """Invalid API key is rejected by auth middleware."""
         mock_response = MagicMock()
         mock_response.status_code = 401
@@ -228,9 +246,16 @@ async def override_get_session():
             async with async_session_factory() as session:
                 yield session
 
+        from automation.router import get_client
+
+        async def override_get_client():
+            return mock_temporal_client
+
         app.dependency_overrides[get_session] = override_get_session
+        app.dependency_overrides[get_client] = override_get_client
         app.state.engine = async_engine
         app.state.session_factory = async_session_factory
+        app.state.temporal_client = mock_temporal_client
 
         # Create a mock http_client in app.state for the DI pattern
         mock_client = AsyncMock()
diff --git a/tests/test_disable_automation.py b/tests/test_disable_automation.py
deleted file mode 100644
index 3ad0649..0000000
--- a/tests/test_disable_automation.py
+++ /dev/null
@@ -1,349 +0,0 @@
-"""Tests for automatic disabling of automations with erroneous configurations.
-
-When an automation has a permanent error (e.g., tarball URL doesn't exist),
-the system should automatically disable it to prevent repeated failed runs.
-"""
-
-import uuid
-from unittest.mock import AsyncMock, patch
-
-import pytest
-from sqlalchemy import select
-
-from automation.exceptions import PermanentDispatchError, TarballNotFoundError
-from automation.execution import _is_permanent_http_error
-
-
-# Test UUIDs
-TEST_USER_ID = uuid.UUID("12345678-1234-5678-1234-567812345678")
-TEST_ORG_ID = uuid.UUID("87654321-4321-8765-4321-876543218765")
-
-
-def _docker_available() -> bool:
-    """Check if Docker is available for testcontainers."""
-    try:
-        import socket
-
-        sock = socket.socket(socket.AF_UNIX, socket.SOCK_STREAM)
-        sock.connect("/var/run/docker.sock")
-        sock.close()
-        return True
-    except (FileNotFoundError, ConnectionRefusedError):
-        return False
-
-
-requires_docker = pytest.mark.skipif(
-    not _docker_available(),
-    reason="Docker not available for testcontainers",
-)
-
-
-class TestExceptions:
-    """Tests for the custom exception hierarchy."""
-
-    def test_tarball_not_found_is_permanent_error(self):
-        """TarballNotFoundError is a PermanentDispatchError."""
-        exc = TarballNotFoundError("test")
-        assert isinstance(exc, PermanentDispatchError)
-
-    def test_permanent_dispatch_error_is_exception(self):
-        """PermanentDispatchError is a standard Exception."""
-        exc = PermanentDispatchError("test")
-        assert isinstance(exc, Exception)
-
-
-class TestIsPermanentHttpError:
-    """Tests for _is_permanent_http_error function."""
-
-    def test_404_is_permanent(self):
-        """HTTP 404 Not Found is a permanent error."""
-        stderr = "curl: (22) The requested URL returned error: 404"
-        assert _is_permanent_http_error(stderr) is True
-
-    def test_403_is_permanent(self):
-        """HTTP 403 Forbidden is a permanent error."""
-        stderr = "curl: (22) The requested URL returned error: 403"
-        assert _is_permanent_http_error(stderr) is True
-
-    def test_401_is_permanent(self):
-        """HTTP 401 Unauthorized is a permanent error."""
-        stderr = "curl: (22) The requested URL returned error: 401"
-        assert _is_permanent_http_error(stderr) is True
-
-    def test_400_is_permanent(self):
-        """HTTP 400 Bad Request is a permanent error."""
-        stderr = "curl: (22) The requested URL returned error: 400"
-        assert _is_permanent_http_error(stderr) is True
-
-    def test_410_is_permanent(self):
-        """HTTP 410 Gone is a permanent error."""
-        stderr = "curl: (22) The requested URL returned error: 410"
-        assert _is_permanent_http_error(stderr) is True
-
-    def test_500_is_not_permanent(self):
-        """HTTP 500 Internal Server Error is a transient error."""
-        stderr = "curl: (22) The requested URL returned error: 500"
-        assert _is_permanent_http_error(stderr) is False
-
-    def test_502_is_not_permanent(self):
-        """HTTP 502 Bad Gateway is a transient error."""
-        stderr = "curl: (22) The requested URL returned error: 502"
-        assert _is_permanent_http_error(stderr) is False
-
-    def test_503_is_not_permanent(self):
-        """HTTP 503 Service Unavailable is a transient error."""
-        stderr = "curl: (22) The requested URL returned error: 503"
-        assert _is_permanent_http_error(stderr) is False
-
-    def test_no_status_code_is_not_permanent(self):
-        """Non-HTTP errors are not permanent."""
-        stderr = "curl: (7) Failed to connect to host.example.com"
-        assert _is_permanent_http_error(stderr) is False
-
-    def test_empty_stderr_is_not_permanent(self):
-        """Empty stderr is not permanent."""
-        assert _is_permanent_http_error("") is False
-
-    def test_timeout_error_is_not_permanent(self):
-        """Timeout errors are not permanent."""
-        stderr = "curl: (28) Operation timed out after 30000 milliseconds"
-        assert _is_permanent_http_error(stderr) is False
-
-
-@requires_docker
-class TestDisableAutomation:
-    """Tests for the disable_automation function."""
-
-    async def test_disables_enabled_automation(self, async_session_factory):
-        """An enabled automation is disabled and returns True."""
-        from automation.models import Automation
-        from automation.utils.run import disable_automation
-
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="https://example.com/missing.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-            automation_id = automation.id
-
-        result = await disable_automation(
-            async_session_factory, automation_id, "Tarball not found"
-        )
-
-        assert result is True
-
-        async with async_session_factory() as session:
-            db_result = await session.execute(
-                select(Automation).where(Automation.id == automation_id)
-            )
-            automation = db_result.scalars().first()
-            assert automation.enabled is False
-
-    async def test_returns_false_for_already_disabled(self, async_session_factory):
-        """Already disabled automation returns False."""
-        from automation.models import Automation
-        from automation.utils.run import disable_automation
-
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="https://example.com/missing.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=False,  # Already disabled
-            )
-            session.add(automation)
-            await session.commit()
-            automation_id = automation.id
-
-        result = await disable_automation(
-            async_session_factory, automation_id, "Tarball not found"
-        )
-
-        assert result is False
-
-    async def test_returns_false_for_nonexistent(self, async_session_factory):
-        """Non-existent automation returns False."""
-        from automation.utils.run import disable_automation
-
-        fake_id = uuid.uuid4()
-        result = await disable_automation(
-            async_session_factory, fake_id, "Tarball not found"
-        )
-
-        assert result is False
-
-
-@requires_docker
-class TestDownloadInternalTarball:
-    """Tests for _download_internal_tarball raising TarballNotFoundError."""
-
-    async def test_raises_tarball_not_found_for_missing_upload(
-        self, async_session_factory
-    ):
-        """TarballNotFoundError is raised when upload record doesn't exist."""
-        from automation.dispatcher import _download_internal_tarball
-
-        fake_upload_id = uuid.uuid4()
-
-        async with async_session_factory() as session:
-            with pytest.raises(TarballNotFoundError) as exc_info:
-                await _download_internal_tarball(fake_upload_id, session)
-
-        assert "not found" in str(exc_info.value).lower()
-        assert str(fake_upload_id) in str(exc_info.value)
-
-
-@requires_docker
-class TestExecuteRunDisablesAutomation:
-    """Tests that _execute_run disables automation on permanent errors."""
-
-    @patch("automation.dispatcher.dispatch_automation")
-    @patch("automation.dispatcher.get_api_key_for_automation_run")
-    async def test_disables_automation_on_internal_tarball_not_found(
-        self,
-        mock_get_api_key,
-        mock_dispatch,
-        async_session_factory,
-        mock_settings,
-    ):
-        """Automation is disabled when internal tarball upload is not found."""
-        from automation.dispatcher import _execute_run
-        from automation.models import Automation, AutomationRun, AutomationRunStatus
-
-        mock_get_api_key.return_value = "test-api-key"
-
-        # Create an automation with a non-existent internal tarball
-        fake_upload_id = uuid.uuid4()
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path=f"oh-internal://uploads/{fake_upload_id}",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.RUNNING,
-            )
-            session.add(run)
-            await session.commit()
-            automation_id = automation.id
-
-        # Re-fetch with automation relationship loaded
-        async with async_session_factory() as session:
-            from sqlalchemy.orm import selectinload
-
-            result = await session.execute(
-                select(AutomationRun)
-                .options(selectinload(AutomationRun.automation))
-                .where(AutomationRun.automation_id == automation_id)
-            )
-            run = result.scalars().first()
-
-            await _execute_run(run, mock_settings, async_session_factory)
-
-        # Verify automation was disabled
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(Automation).where(Automation.id == automation_id)
-            )
-            automation = result.scalars().first()
-            assert automation.enabled is False
-
-        # Verify run was marked as FAILED
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(AutomationRun).where(
-                    AutomationRun.automation_id == automation_id
-                )
-            )
-            run = result.scalars().first()
-            assert run.status == AutomationRunStatus.FAILED
-            assert "not found" in run.error_detail.lower()
-
-    @patch("automation.dispatcher.dispatch_automation")
-    @patch("automation.dispatcher.get_api_key_for_automation_run")
-    async def test_does_not_disable_on_transient_error(
-        self,
-        mock_get_api_key,
-        mock_dispatch,
-        async_session_factory,
-        mock_settings,
-    ):
-        """Automation is NOT disabled on transient errors like network failures."""
-        from automation.dispatcher import _execute_run
-        from automation.models import Automation, AutomationRun, AutomationRunStatus
-
-        mock_get_api_key.return_value = "test-api-key"
-        # Simulate a transient dispatch failure (e.g., sandbox creation failed)
-        mock_dispatch.return_value = AsyncMock(
-            success=False, sandbox_id=None, error="Connection timeout"
-        )
-
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="https://example.com/valid.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.RUNNING,
-            )
-            session.add(run)
-            await session.commit()
-            automation_id = automation.id
-
-        # Re-fetch with automation relationship loaded
-        async with async_session_factory() as session:
-            from sqlalchemy.orm import selectinload
-
-            result = await session.execute(
-                select(AutomationRun)
-                .options(selectinload(AutomationRun.automation))
-                .where(AutomationRun.automation_id == automation_id)
-            )
-            run = result.scalars().first()
-
-            await _execute_run(run, mock_settings, async_session_factory)
-
-        # Verify automation is still enabled (transient error)
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(Automation).where(Automation.id == automation_id)
-            )
-            automation = result.scalars().first()
-            assert automation.enabled is True
-
-        # Verify run was marked as FAILED
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(AutomationRun).where(
-                    AutomationRun.automation_id == automation_id
-                )
-            )
-            run = result.scalars().first()
-            assert run.status == AutomationRunStatus.FAILED
diff --git a/tests/test_dispatcher.py b/tests/test_dispatcher.py
deleted file mode 100644
index dee4ddc..0000000
--- a/tests/test_dispatcher.py
+++ /dev/null
@@ -1,539 +0,0 @@
-"""Tests for the dispatcher module.
-
-The dispatcher polls for PENDING automation runs and marks them as RUNNING.
-"""
-
-import asyncio
-import uuid
-from datetime import timedelta
-from unittest.mock import AsyncMock, patch
-
-import pytest
-from sqlalchemy import select
-
-from automation.dispatcher import (
-    dispatch_pending_runs,
-    dispatcher_loop,
-)
-from automation.models import Automation, AutomationRun, AutomationRunStatus
-from automation.utils import utcnow
-from automation.utils.run import mark_run_status
-from automation.utils.tarball_validation import is_http_url
-
-
-# Test UUIDs
-TEST_USER_ID = uuid.UUID("12345678-1234-5678-1234-567812345678")
-TEST_ORG_ID = uuid.UUID("87654321-4321-8765-4321-876543218765")
-
-
-class TestIsHttpUrl:
-    """Tests for is_http_url helper function."""
-
-    def test_https_url_is_http(self):
-        """HTTPS URLs are HTTP URLs (downloadable with curl in sandbox)."""
-        assert is_http_url("https://example.com/file.tar.gz") is True
-        github_url = "https://github.com/user/repo/archive/main.tar.gz"
-        assert is_http_url(github_url) is True
-
-    def test_http_url_is_http(self):
-        """HTTP URLs are HTTP URLs (downloadable with curl in sandbox)."""
-        assert is_http_url("http://example.com/file.tar.gz") is True
-
-    def test_internal_url_is_not_http(self):
-        """Internal URLs (oh-internal://) are not HTTP URLs."""
-        internal_url = "oh-internal://uploads/12345678-1234-5678-1234-567812345678"
-        assert is_http_url(internal_url) is False
-
-    def test_s3_url_is_not_http(self):
-        """S3 URLs are not HTTP URLs (need special handling, not curl)."""
-        assert is_http_url("s3://bucket/key.tar.gz") is False
-
-    def test_gs_url_is_not_http(self):
-        """GCS URLs are not HTTP URLs (need special handling, not curl)."""
-        assert is_http_url("gs://bucket/key.tar.gz") is False
-
-
-class TestMarkRunStatus:
-    """Tests for mark_run_status function."""
-
-    async def test_marks_run_as_running(self, async_session_factory):
-        """Run status is changed to RUNNING."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.PENDING,
-            )
-            session.add(run)
-            await session.commit()
-            run_id = run.id
-
-            await mark_run_status(session, run, AutomationRunStatus.RUNNING)
-            await session.commit()
-
-        # Verify status changed
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(AutomationRun).where(AutomationRun.id == run_id)
-            )
-            updated = result.scalars().first()
-            assert updated.status == AutomationRunStatus.RUNNING
-            assert updated.started_at is not None
-
-    async def test_sets_started_at_timestamp(self, async_session_factory):
-        """started_at is set to current time when transitioning to RUNNING."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.PENDING,
-            )
-            session.add(run)
-            await session.commit()
-
-            before = utcnow()
-            await mark_run_status(session, run, AutomationRunStatus.RUNNING)
-            await session.commit()
-            after = utcnow()
-
-            assert run.started_at is not None
-            # started_at should be between before and after
-            assert before <= run.started_at <= after
-
-    async def test_sets_completed_at_on_completed(self, async_session_factory):
-        """completed_at is set when transitioning to COMPLETED."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.RUNNING,
-                started_at=utcnow(),
-            )
-            session.add(run)
-            await session.commit()
-            run_id = run.id
-
-            before = utcnow()
-            await mark_run_status(session, run, AutomationRunStatus.COMPLETED)
-            await session.commit()
-            after = utcnow()
-
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(AutomationRun).where(AutomationRun.id == run_id)
-            )
-            updated = result.scalars().first()
-            assert updated.status == AutomationRunStatus.COMPLETED
-            assert updated.completed_at is not None
-            assert before <= updated.completed_at <= after
-
-    async def test_sets_completed_at_on_failed(self, async_session_factory):
-        """completed_at is set when transitioning to FAILED."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.RUNNING,
-                started_at=utcnow(),
-            )
-            session.add(run)
-            await session.commit()
-            run_id = run.id
-
-            before = utcnow()
-            await mark_run_status(session, run, AutomationRunStatus.FAILED)
-            await session.commit()
-            after = utcnow()
-
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(AutomationRun).where(AutomationRun.id == run_id)
-            )
-            updated = result.scalars().first()
-            assert updated.status == AutomationRunStatus.FAILED
-            assert updated.completed_at is not None
-            assert before <= updated.completed_at <= after
-
-
-class TestDispatchPendingRuns:
-    """Tests for dispatch_pending_runs function."""
-
-    @patch("automation.dispatcher._execute_run_safe", new_callable=AsyncMock)
-    async def test_dispatches_pending_runs(
-        self, mock_execute, async_session_factory, mock_settings
-    ):
-        """Pending runs are dispatched and marked as RUNNING."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.PENDING,
-            )
-            session.add(run)
-            await session.commit()
-            run_id = run.id
-
-        dispatched = await dispatch_pending_runs(async_session_factory, mock_settings)
-
-        assert len(dispatched) == 1
-        assert dispatched[0].id == run_id
-
-        # Verify status changed in DB
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(AutomationRun).where(AutomationRun.id == run_id)
-            )
-            updated = result.scalars().first()
-            assert updated.status == AutomationRunStatus.RUNNING
-
-    @patch("automation.dispatcher._execute_run_safe", new_callable=AsyncMock)
-    async def test_ignores_running_runs(
-        self, mock_execute, async_session_factory, mock_settings
-    ):
-        """Runs already in RUNNING status are not dispatched."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.RUNNING,
-                started_at=utcnow(),
-            )
-            session.add(run)
-            await session.commit()
-
-        dispatched = await dispatch_pending_runs(async_session_factory, mock_settings)
-
-        assert len(dispatched) == 0
-
-    @patch("automation.dispatcher._execute_run_safe", new_callable=AsyncMock)
-    async def test_ignores_completed_runs(
-        self, mock_execute, async_session_factory, mock_settings
-    ):
-        """Completed runs are not dispatched."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.COMPLETED,
-                started_at=utcnow(),
-                completed_at=utcnow(),
-            )
-            session.add(run)
-            await session.commit()
-
-        dispatched = await dispatch_pending_runs(async_session_factory, mock_settings)
-
-        assert len(dispatched) == 0
-
-    @patch("automation.dispatcher._execute_run_safe", new_callable=AsyncMock)
-    async def test_respects_batch_size(
-        self, mock_execute, async_session_factory, mock_settings
-    ):
-        """Only batch_size runs are dispatched at once."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            # Create 5 pending runs
-            for _ in range(5):
-                run = AutomationRun(
-                    automation_id=automation.id,
-                    status=AutomationRunStatus.PENDING,
-                )
-                session.add(run)
-            await session.commit()
-
-        dispatched = await dispatch_pending_runs(
-            async_session_factory, mock_settings, batch_size=2
-        )
-
-        assert len(dispatched) == 2
-
-    @patch("automation.dispatcher._execute_run_safe", new_callable=AsyncMock)
-    async def test_orders_by_created_at(
-        self, mock_execute, async_session_factory, mock_settings
-    ):
-        """Oldest pending runs are dispatched first."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            now = utcnow()
-            old_run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.PENDING,
-                created_at=now - timedelta(hours=1),
-            )
-            new_run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.PENDING,
-                created_at=now,
-            )
-            session.add_all([new_run, old_run])  # Add in reverse order
-            await session.commit()
-            old_run_id = old_run.id
-
-        dispatched = await dispatch_pending_runs(
-            async_session_factory, mock_settings, batch_size=1
-        )
-
-        assert len(dispatched) == 1
-        assert dispatched[0].id == old_run_id  # Old run should be first
-
-
-class TestDispatcherLoop:
-    """Tests for dispatcher_loop function."""
-
-    @patch("automation.dispatcher._execute_run_safe", new_callable=AsyncMock)
-    async def test_dispatcher_loop_exits_on_shutdown(
-        self, mock_execute, async_session_factory, mock_settings
-    ):
-        """Dispatcher exits gracefully when shutdown event is set."""
-        shutdown_event = asyncio.Event()
-
-        task = asyncio.create_task(
-            dispatcher_loop(
-                async_session_factory,
-                mock_settings,
-                interval_seconds=1,
-                shutdown_event=shutdown_event,
-            )
-        )
-
-        await asyncio.sleep(0.1)
-        shutdown_event.set()
-
-        try:
-            await asyncio.wait_for(task, timeout=2.0)
-        except TimeoutError:
-            task.cancel()
-            pytest.fail("Dispatcher did not exit on shutdown signal")
-
-    @patch("automation.dispatcher._execute_run_safe", new_callable=AsyncMock)
-    async def test_dispatcher_loop_dispatches_runs(
-        self, mock_execute, async_session_factory, mock_settings, caplog
-    ):
-        """Dispatcher polls and dispatches pending runs."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.PENDING,
-            )
-            session.add(run)
-            await session.commit()
-            run_id = run.id
-
-        shutdown_event = asyncio.Event()
-
-        import logging
-
-        with caplog.at_level(logging.INFO, logger="automation.dispatcher"):
-            task = asyncio.create_task(
-                dispatcher_loop(
-                    async_session_factory,
-                    mock_settings,
-                    interval_seconds=60,
-                    shutdown_event=shutdown_event,
-                )
-            )
-
-            await asyncio.sleep(0.2)
-
-            shutdown_event.set()
-            await asyncio.wait_for(task, timeout=2.0)
-
-        # Check logs
-        assert any(
-            "Dispatching automation run" in record.message for record in caplog.records
-        )
-        assert any("Dispatched 1 run" in record.message for record in caplog.records)
-
-        # Verify run status changed
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(AutomationRun).where(AutomationRun.id == run_id)
-            )
-            updated = result.scalars().first()
-            assert updated.status == AutomationRunStatus.RUNNING
-
-
-class TestEffectiveTimeout:
-    """Tests for effective timeout calculation in dispatcher."""
-
-    @patch("automation.dispatcher._execute_run_safe", new_callable=AsyncMock)
-    async def test_uses_automation_timeout_when_set(
-        self, mock_execute, async_session_factory, mock_settings
-    ):
-        """Dispatcher uses automation's timeout when set."""
-
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="With Timeout",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                timeout=120,  # Custom timeout
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.PENDING,
-            )
-            session.add(run)
-            await session.commit()
-
-        await dispatch_pending_runs(async_session_factory, mock_settings)
-
-        # Verify _execute_run_safe was called
-        mock_execute.assert_called_once()
-        # The automation passed should have timeout=120
-        call_args = mock_execute.call_args
-        run_arg = call_args[0][0]
-        assert run_arg.automation.timeout == 120
-
-    @patch("automation.dispatcher._execute_run_safe", new_callable=AsyncMock)
-    async def test_uses_default_timeout_when_not_set(
-        self, mock_execute, async_session_factory, mock_settings
-    ):
-        """Dispatcher uses MAX_RUN_DURATION_SECONDS when automation timeout is None."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="No Timeout",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                timeout=None,  # No custom timeout
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.PENDING,
-            )
-            session.add(run)
-            await session.commit()
-
-        await dispatch_pending_runs(async_session_factory, mock_settings)
-
-        # Verify _execute_run_safe was called
-        mock_execute.assert_called_once()
-        # The automation passed should have timeout=None
-        call_args = mock_execute.call_args
-        run_arg = call_args[0][0]
-        assert run_arg.automation.timeout is None
diff --git a/tests/test_execution.py b/tests/test_execution.py
deleted file mode 100644
index 8785ae7..0000000
--- a/tests/test_execution.py
+++ /dev/null
@@ -1,320 +0,0 @@
-"""Tests for the execution module — build_tarball, _shell_quote, and result types.
-
-Only tests pure logic that can run without a network.  The e2e flow
-(run_automation/dispatch_automation against a real sandbox) lives in
-scripts/test_automation.py.
-"""
-
-import io
-import tarfile
-from unittest.mock import patch
-
-import pytest
-
-from automation.exceptions import PermanentDispatchError, TarballNotFoundError
-from automation.execution import (
-    EXTERNAL_DOWNLOAD_TIMEOUT,
-    EXTERNAL_MAX_FILESIZE,
-    AutomationResult,
-    DispatchResult,
-    _shell_quote,
-    build_tarball,
-    dispatch_automation,
-)
-
-
-class TestBuildTarball:
-    def test_produces_valid_tarball(self):
-        tb = build_tarball({"hello.txt": "world", "bin.dat": b"\x00\x01"})
-        with tarfile.open(fileobj=io.BytesIO(tb), mode="r:gz") as tar:
-            names = sorted(tar.getnames())
-            assert names == ["bin.dat", "hello.txt"]
-            hello = tar.extractfile("hello.txt")
-            assert hello is not None
-            assert hello.read() == b"world"
-            bindat = tar.extractfile("bin.dat")
-            assert bindat is not None
-            assert bindat.read() == b"\x00\x01"
-
-    def test_empty_files(self):
-        tb = build_tarball({})
-        with tarfile.open(fileobj=io.BytesIO(tb), mode="r:gz") as tar:
-            assert tar.getnames() == []
-
-    def test_setup_and_entrypoint(self):
-        tb = build_tarball(
-            {
-                "setup.sh": "#!/bin/bash\npip install requests\n",
-                "run.py": 'print("ok")\n',
-            }
-        )
-        with tarfile.open(fileobj=io.BytesIO(tb), mode="r:gz") as tar:
-            assert "setup.sh" in tar.getnames()
-            assert "run.py" in tar.getnames()
-            setup_file = tar.extractfile("setup.sh")
-            assert setup_file is not None
-            setup = setup_file.read().decode()
-            assert "pip install" in setup
-
-
-class TestShellQuote:
-    def test_simple_string(self):
-        assert _shell_quote("hello") == "'hello'"
-
-    def test_string_with_spaces(self):
-        assert _shell_quote("hello world") == "'hello world'"
-
-    def test_string_with_single_quotes(self):
-        assert _shell_quote("it's") == "'it'\\''s'"
-
-    def test_empty_string(self):
-        assert _shell_quote("") == "''"
-
-    def test_special_characters(self):
-        assert _shell_quote("$HOME") == "'$HOME'"
-
-
-class TestAutomationResult:
-    """Tests for AutomationResult (blocking execution result)."""
-
-    def test_frozen_dataclass(self):
-        r = AutomationResult(success=True, sandbox_id="sb-1", exit_code=0, stdout="ok")
-        assert r.success is True
-        assert r.sandbox_id == "sb-1"
-        assert r.exit_code == 0
-        assert r.stdout == "ok"
-        with pytest.raises(AttributeError):
-            r.success = False  # type: ignore[misc]
-
-    def test_with_error(self):
-        r = AutomationResult(
-            success=False,
-            sandbox_id="sb-1",
-            exit_code=1,
-            stderr="error",
-            error="Failed",
-        )
-        assert r.success is False
-        assert r.exit_code == 1
-        assert r.stderr == "error"
-        assert r.error == "Failed"
-
-
-class TestDispatchResult:
-    """Tests for DispatchResult (fire-and-forget execution result)."""
-
-    def test_frozen_dataclass(self):
-        r = DispatchResult(success=True, sandbox_id="sb-1")
-        assert r.success is True
-        assert r.sandbox_id == "sb-1"
-        with pytest.raises(AttributeError):
-            r.success = False  # type: ignore[misc]
-
-    def test_with_error(self):
-        r = DispatchResult(success=False, sandbox_id="sb-1", error="Failed to start")
-        assert r.success is False
-        assert r.error == "Failed to start"
-
-
-class TestAutomationTarballSource:
-    """Tests for tarball_source parameter."""
-
-    def test_tarball_source_accepts_bytes(self):
-        """tarball_source accepts bytes (will be uploaded)."""
-        # This just validates the type - actual execution would need mocking
-        source: bytes | str = b"test tarball content"
-        assert isinstance(source, bytes)
-
-    def test_tarball_source_accepts_str(self):
-        """tarball_source accepts str URL (will be downloaded in sandbox)."""
-        source: bytes | str = "https://example.com/file.tar.gz"
-        assert isinstance(source, str)
-
-
-class TestExternalDownloadConstants:
-    """Tests for external download configuration constants."""
-
-    def test_timeout_is_reasonable(self):
-        """External download timeout should be reasonable (60-300s)."""
-        assert 60 <= EXTERNAL_DOWNLOAD_TIMEOUT <= 300
-
-    def test_max_filesize_is_reasonable(self):
-        """Max filesize should be reasonable (10MB - 500MB)."""
-        assert 10 * 1024 * 1024 <= EXTERNAL_MAX_FILESIZE <= 500 * 1024 * 1024
-
-
-class TestDispatchAutomationPermanentErrors:
-    """Tests for dispatch_automation handling of PermanentDispatchError."""
-
-    @pytest.mark.asyncio
-    @patch("automation.execution._create_and_wait")
-    @patch("automation.execution.delete_sandbox")
-    @patch("automation.execution._download_in_sandbox")
-    async def test_reraises_permanent_error_after_sandbox_cleanup(
-        self,
-        mock_download_in_sandbox,
-        mock_delete_sandbox,
-        mock_create_and_wait,
-    ):
-        """PermanentDispatchError is re-raised after cleaning up the sandbox."""
-        sandbox_id = "test-sandbox-123"
-        mock_create_and_wait.return_value = (
-            sandbox_id,
-            "session-key",
-            "https://agent.example.com",
-        )
-        mock_download_in_sandbox.side_effect = TarballNotFoundError(
-            "External tarball URL is not accessible"
-        )
-        mock_delete_sandbox.return_value = None
-
-        with pytest.raises(TarballNotFoundError) as exc_info:
-            await dispatch_automation(
-                api_url="https://api.example.com",
-                api_key="test-key",
-                entrypoint="python main.py",
-                tarball_source="https://example.com/missing.tar.gz",
-            )
-
-        assert "not accessible" in str(exc_info.value)
-        # Verify sandbox was deleted before re-raising
-        mock_delete_sandbox.assert_called_once()
-        call_args = mock_delete_sandbox.call_args
-        assert call_args[0][2] == "test-key"  # api_key
-        assert call_args[0][3] == sandbox_id  # sandbox_id
-
-    @pytest.mark.asyncio
-    @patch("automation.execution._create_and_wait")
-    @patch("automation.execution.delete_sandbox")
-    @patch("automation.execution._download_in_sandbox")
-    async def test_transient_error_returns_dispatch_result(
-        self,
-        mock_download_in_sandbox,
-        mock_delete_sandbox,
-        mock_create_and_wait,
-    ):
-        """Non-permanent errors return DispatchResult with success=False."""
-        sandbox_id = "test-sandbox-456"
-        mock_create_and_wait.return_value = (
-            sandbox_id,
-            "session-key",
-            "https://agent.example.com",
-        )
-        mock_download_in_sandbox.side_effect = RuntimeError("Connection timeout")
-        mock_delete_sandbox.return_value = None
-
-        result = await dispatch_automation(
-            api_url="https://api.example.com",
-            api_key="test-key",
-            entrypoint="python main.py",
-            tarball_source="https://example.com/file.tar.gz",
-        )
-
-        # Should return DispatchResult, not raise
-        assert isinstance(result, DispatchResult)
-        assert result.success is False
-        assert result.error is not None
-        assert "Connection timeout" in result.error
-        # Verify sandbox was still cleaned up
-        mock_delete_sandbox.assert_called_once()
-
-    @pytest.mark.asyncio
-    @patch("automation.execution._create_and_wait")
-    @patch("automation.execution.delete_sandbox")
-    @patch("automation.execution._download_in_sandbox")
-    async def test_permanent_error_without_sandbox_still_raises(
-        self,
-        mock_download_in_sandbox,
-        mock_delete_sandbox,
-        mock_create_and_wait,
-    ):
-        """PermanentDispatchError is re-raised even if sandbox_id is None."""
-        # Simulate sandbox creation started but failed before getting ID
-        mock_create_and_wait.return_value = (
-            "test-sandbox",
-            "session-key",
-            "https://agent.example.com",
-        )
-        mock_download_in_sandbox.side_effect = TarballNotFoundError("404 Not Found")
-
-        with pytest.raises(TarballNotFoundError):
-            await dispatch_automation(
-                api_url="https://api.example.com",
-                api_key="test-key",
-                entrypoint="python main.py",
-                tarball_source="https://example.com/missing.tar.gz",
-            )
-
-    @pytest.mark.asyncio
-    @patch("automation.execution._create_and_wait")
-    @patch("automation.execution.delete_sandbox")
-    @patch("automation.execution._upload")
-    async def test_permanent_error_with_bytes_tarball_reraises(
-        self,
-        mock_upload,
-        mock_delete_sandbox,
-        mock_create_and_wait,
-    ):
-        """PermanentDispatchError during upload is also re-raised."""
-        sandbox_id = "test-sandbox-789"
-        mock_create_and_wait.return_value = (
-            sandbox_id,
-            "session-key",
-            "https://agent.example.com",
-        )
-        # Simulate a permanent error during upload (unlikely but possible)
-        mock_upload.side_effect = PermanentDispatchError("Upload permanently failed")
-        mock_delete_sandbox.return_value = None
-
-        with pytest.raises(PermanentDispatchError) as exc_info:
-            await dispatch_automation(
-                api_url="https://api.example.com",
-                api_key="test-key",
-                entrypoint="python main.py",
-                tarball_source=b"fake tarball bytes",
-            )
-
-        assert "permanently failed" in str(exc_info.value)
-        mock_delete_sandbox.assert_called_once()
-
-    @pytest.mark.asyncio
-    @patch("automation.execution._create_and_wait")
-    @patch("automation.execution.delete_sandbox")
-    @patch("automation.execution._download_in_sandbox")
-    async def test_permanent_error_not_masked_by_cleanup_failure(
-        self,
-        mock_download_in_sandbox,
-        mock_delete_sandbox,
-        mock_create_and_wait,
-    ):
-        """PermanentDispatchError is re-raised even if sandbox cleanup fails.
-
-        This tests the fix for review comment about exception masking:
-        if delete_sandbox() raises, we should still re-raise the original
-        PermanentDispatchError so the dispatcher can disable the automation.
-        """
-        sandbox_id = "test-sandbox-cleanup-fail"
-        mock_create_and_wait.return_value = (
-            sandbox_id,
-            "session-key",
-            "https://agent.example.com",
-        )
-        mock_download_in_sandbox.side_effect = TarballNotFoundError(
-            "External tarball URL is not accessible: 404"
-        )
-        # Simulate cleanup failure
-        mock_delete_sandbox.side_effect = RuntimeError("Failed to delete sandbox")
-
-        # Should still raise TarballNotFoundError, not RuntimeError
-        with pytest.raises(TarballNotFoundError) as exc_info:
-            await dispatch_automation(
-                api_url="https://api.example.com",
-                api_key="test-key",
-                entrypoint="python main.py",
-                tarball_source="https://example.com/missing.tar.gz",
-            )
-
-        # Verify we got the original error, not the cleanup error
-        assert "404" in str(exc_info.value)
-        # Cleanup was still attempted
-        mock_delete_sandbox.assert_called_once()
diff --git a/tests/test_health.py b/tests/test_health.py
index 6cbeec9..c603a69 100644
--- a/tests/test_health.py
+++ b/tests/test_health.py
@@ -37,6 +37,6 @@ async def test_ready_endpoint_db_unavailable(self, async_client):
             assert response.status_code == 503
             data = response.json()
             assert data["status"] == "not_ready"
-            assert "error" in data
+            assert "database unavailable" in data.get("errors", [])
         finally:
             app.state.engine = original_engine
diff --git a/tests/test_router.py b/tests/test_router.py
index 70bf438..b8b0b91 100644
--- a/tests/test_router.py
+++ b/tests/test_router.py
@@ -696,7 +696,7 @@ class TestDispatchAutomation:
     """Tests for POST /v1/{id}/dispatch endpoint."""
 
     async def test_dispatch_automation_success(self, async_client, async_session):
-        """Dispatching an automation creates a PENDING run."""
+        """Dispatching an automation creates a RUNNING run and starts a workflow."""
         automation = Automation(
             user_id=TEST_USER_ID,
             org_id=TEST_ORG_ID,
@@ -713,11 +713,13 @@ async def test_dispatch_automation_success(self, async_client, async_session):
         assert response.status_code == 201
         data = response.json()
         assert data["automation_id"] == str(automation.id)
-        assert data["status"] == "PENDING"
+        assert (
+            data["status"] == "RUNNING"
+        )  # Now RUNNING since Temporal starts immediately
         assert data["error_detail"] is None
         assert "id" in data
         assert "created_at" in data
-        assert data["started_at"] is None
+        assert data["started_at"] is not None  # Set when Temporal workflow starts
         assert data["completed_at"] is None
 
     async def test_dispatch_automation_not_found(self, async_client):
@@ -789,12 +791,12 @@ async def test_dispatch_automation_multiple_runs(self, async_client, async_sessi
         # Each dispatch creates a unique run
         assert run1["id"] != run2["id"]
         assert run1["automation_id"] == run2["automation_id"] == str(automation.id)
-        assert run1["status"] == run2["status"] == "PENDING"
+        assert (
+            run1["status"] == run2["status"] == "RUNNING"
+        )  # Temporal starts immediately
 
-    async def test_dispatch_updates_last_triggered_at(
-        self, async_client, async_session
-    ):
-        """Dispatching updates the automation's last_triggered_at."""
+    async def test_dispatch_creates_running_run(self, async_client, async_session):
+        """Dispatching creates a run with RUNNING status and started_at set."""
         automation = Automation(
             user_id=TEST_USER_ID,
             org_id=TEST_ORG_ID,
@@ -806,15 +808,12 @@ async def test_dispatch_updates_last_triggered_at(
         async_session.add(automation)
         await async_session.commit()
 
-        assert automation.last_triggered_at is None
-
         response = await async_client.post(f"/v1/{automation.id}/dispatch")
 
         assert response.status_code == 201
-
-        # Refresh from DB to verify last_triggered_at was updated
-        await async_session.refresh(automation)
-        assert automation.last_triggered_at is not None
+        data = response.json()
+        assert data["status"] == "RUNNING"
+        assert data["started_at"] is not None
 
 
 class TestListAutomationRuns:
diff --git a/tests/test_scheduler.py b/tests/test_scheduler.py
deleted file mode 100644
index d83640f..0000000
--- a/tests/test_scheduler.py
+++ /dev/null
@@ -1,945 +0,0 @@
-"""Tests for the scheduler module."""
-
-import asyncio
-import uuid
-from datetime import UTC, datetime, timedelta
-
-import pytest
-from sqlalchemy import func, select
-
-from automation.models import Automation, AutomationRun, AutomationRunStatus
-from automation.scheduler import (
-    POLL_INTERVAL_SECONDS,
-    poll_and_schedule,
-    scheduler_loop,
-)
-from automation.utils import (
-    get_next_fire_time,
-    get_prev_fire_time,
-    is_automation_due,
-    utcnow,
-)
-from automation.utils.run import create_pending_run
-
-
-UTC = UTC
-
-# Test UUIDs
-TEST_USER_ID = uuid.UUID("12345678-1234-5678-1234-567812345678")
-TEST_ORG_ID = uuid.UUID("87654321-4321-8765-4321-876543218765")
-
-
-def _utc(*args: int) -> datetime:
-    """Create a UTC-aware datetime for test assertions."""
-    return datetime(*args, tzinfo=UTC)
-
-
-class TestGetNextFireTime:
-    """Tests for get_next_fire_time function."""
-
-    def test_next_fire_time_daily(self):
-        """Daily cron schedule returns correct next fire time."""
-        # Every day at 9:00 AM UTC
-        base_time = _utc(2026, 3, 15, 8, 0, 0)
-        next_fire = get_next_fire_time("0 9 * * *", base_time=base_time)
-
-        assert next_fire == _utc(2026, 3, 15, 9, 0, 0)
-
-    def test_next_fire_time_weekly(self):
-        """Weekly cron schedule returns correct next fire time."""
-        # Every Friday at 9:00 AM (Friday = 5)
-        # March 15, 2026 is a Sunday
-        base_time = _utc(2026, 3, 15, 10, 0, 0)
-        next_fire = get_next_fire_time("0 9 * * 5", base_time=base_time)
-
-        # Next Friday is March 20, 2026
-        assert next_fire == _utc(2026, 3, 20, 9, 0, 0)
-
-    def test_next_fire_time_already_past_today(self):
-        """Returns tomorrow if today's fire time has passed."""
-        # Every day at 9:00 AM, but current time is 10:00 AM
-        base_time = _utc(2026, 3, 15, 10, 0, 0)
-        next_fire = get_next_fire_time("0 9 * * *", base_time=base_time)
-
-        # Should be tomorrow at 9:00 AM
-        assert next_fire == _utc(2026, 3, 16, 9, 0, 0)
-
-    def test_next_fire_time_every_minute(self):
-        """Every minute schedule works correctly."""
-        base_time = _utc(2026, 3, 15, 10, 30, 45)
-        next_fire = get_next_fire_time("* * * * *", base_time=base_time)
-
-        assert next_fire == _utc(2026, 3, 15, 10, 31, 0)
-
-    def test_next_fire_time_with_timezone(self):
-        """Timezone is correctly applied to cron schedule."""
-        # Schedule: 9:00 AM America/New_York
-        # Base time: 12:00 UTC on March 15, 2026 (which is 8:00 AM EDT)
-        # March 15 is after DST starts (March 8, 2026), so EDT = UTC-4
-        base_time = _utc(2026, 3, 15, 12, 0, 0)  # 12:00 UTC = 8:00 AM EDT
-        next_fire = get_next_fire_time(
-            "0 9 * * *", timezone="America/New_York", base_time=base_time
-        )
-
-        # Next fire should be 9:00 AM EDT = 13:00 UTC
-        assert next_fire == _utc(2026, 3, 15, 13, 0, 0)
-
-    def test_next_fire_time_timezone_different_day(self):
-        """Timezone conversion can shift the fire time to a different day."""
-        # Schedule: 2:00 AM America/Los_Angeles (UTC-8 in winter, UTC-7 in summer)
-        # Base time: 8:00 UTC on March 15, 2026
-        # March 15 is after DST starts, so PDT = UTC-7
-        # 8:00 UTC = 1:00 AM PDT, so next 2:00 AM PDT is same day
-        base_time = _utc(2026, 3, 15, 8, 0, 0)  # 8:00 UTC = 1:00 AM PDT
-        next_fire = get_next_fire_time(
-            "0 2 * * *", timezone="America/Los_Angeles", base_time=base_time
-        )
-
-        # Next fire: 2:00 AM PDT = 9:00 UTC same day
-        assert next_fire == _utc(2026, 3, 15, 9, 0, 0)
-
-
-class TestGetPrevFireTime:
-    """Tests for get_prev_fire_time function."""
-
-    def test_prev_fire_time_daily(self):
-        """Daily cron schedule returns correct previous fire time."""
-        # Every day at 9:00 AM UTC
-        base_time = _utc(2026, 3, 15, 10, 0, 0)  # 10:00 UTC
-        prev_fire = get_prev_fire_time("0 9 * * *", base_time=base_time)
-
-        # Previous fire was 9:00 UTC same day
-        assert prev_fire == _utc(2026, 3, 15, 9, 0, 0)
-
-    def test_prev_fire_time_with_timezone(self):
-        """Timezone is correctly applied when computing previous fire time."""
-        # Schedule: 9:00 AM America/New_York
-        # Base time: 14:00 UTC on March 15, 2026 (which is 10:00 AM EDT)
-        # March 15 is after DST, so EDT = UTC-4
-        base_time = _utc(2026, 3, 15, 14, 0, 0)  # 14:00 UTC = 10:00 AM EDT
-        prev_fire = get_prev_fire_time(
-            "0 9 * * *", timezone="America/New_York", base_time=base_time
-        )
-
-        # Previous fire was 9:00 AM EDT = 13:00 UTC same day
-        assert prev_fire == _utc(2026, 3, 15, 13, 0, 0)
-
-
-class TestIsAutomationDue:
-    """Tests for is_automation_due function."""
-
-    def test_disabled_automation_not_due(self):
-        """Disabled automations are never due."""
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test",
-            trigger={"type": "cron", "schedule": "* * * * *"},
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=False,
-        )
-
-        assert is_automation_due(automation) is False
-
-    def test_deleted_automation_not_due(self):
-        """Deleted automations are never due."""
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test",
-            trigger={"type": "cron", "schedule": "* * * * *"},
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=True,
-            deleted_at=utcnow(),
-        )
-
-        assert is_automation_due(automation) is False
-
-    def test_non_cron_trigger_not_due(self):
-        """Non-cron trigger types are not due (for now)."""
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test",
-            trigger={"type": "github", "event": "push"},
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=True,
-        )
-
-        assert is_automation_due(automation) is False
-
-    def test_never_triggered_created_before_schedule_is_due(self):
-        """Automation created before a scheduled time is due after that time passes."""
-        # Created at 10:25, schedule is every 30 mins (0,30)
-        # At 10:35, prev_fire_time is 10:30, which is after created_at (10:25)
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test",
-            trigger={"type": "cron", "schedule": "0,30 * * * *", "timezone": "UTC"},
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=True,
-            last_triggered_at=None,
-            created_at=_utc(2026, 3, 15, 10, 25, 0),
-        )
-
-        now = _utc(2026, 3, 15, 10, 35, 0)
-        assert is_automation_due(automation, now) is True
-
-    def test_never_triggered_created_after_schedule_not_due(self):
-        """Automation created after a scheduled time waits for next schedule."""
-        # Created at 10:35, schedule is every 30 mins (0,30)
-        # At 10:40, prev_fire_time is 10:30, which is BEFORE created_at (10:35)
-        # Should NOT be due - wait for 11:00
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test",
-            trigger={"type": "cron", "schedule": "0,30 * * * *", "timezone": "UTC"},
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=True,
-            last_triggered_at=None,
-            created_at=_utc(2026, 3, 15, 10, 35, 0),
-        )
-
-        now = _utc(2026, 3, 15, 10, 40, 0)
-        assert is_automation_due(automation, now) is False
-
-    def test_never_triggered_due_at_next_schedule(self):
-        """Automation created after a scheduled time becomes due at next schedule."""
-        # Created at 10:35, schedule is every 30 mins (0,30)
-        # At 11:05, prev_fire_time is 11:00, which is after created_at (10:35)
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test",
-            trigger={"type": "cron", "schedule": "0,30 * * * *", "timezone": "UTC"},
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=True,
-            last_triggered_at=None,
-            created_at=_utc(2026, 3, 15, 10, 35, 0),
-        )
-
-        now = _utc(2026, 3, 15, 11, 5, 0)
-        assert is_automation_due(automation, now) is True
-
-    def test_recently_triggered_not_due(self):
-        """Automation triggered in current period is not due again."""
-        # Every minute schedule
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test",
-            trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=True,
-            last_triggered_at=_utc(2026, 3, 15, 10, 30, 5),
-        )
-
-        # Same minute, later
-        now = _utc(2026, 3, 15, 10, 30, 30)
-        assert is_automation_due(automation, now) is False
-
-    def test_automation_due_next_period(self):
-        """Automation is due when a new period starts."""
-        # Every minute schedule, last triggered at 10:29:05
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test",
-            trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=True,
-            last_triggered_at=_utc(2026, 3, 15, 10, 29, 5),
-        )
-
-        # Now at 10:30:30 - the 10:30 fire time should make it due
-        now = _utc(2026, 3, 15, 10, 30, 30)
-        assert is_automation_due(automation, now) is True
-
-    def test_daily_automation_not_due_same_day(self):
-        """Daily automation triggered today is not due again today."""
-        # Every day at 9:00 AM
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test",
-            trigger={"type": "cron", "schedule": "0 9 * * *", "timezone": "UTC"},
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=True,
-            last_triggered_at=_utc(2026, 3, 15, 9, 0, 5),
-        )
-
-        # Later the same day
-        now = _utc(2026, 3, 15, 14, 0, 0)
-        assert is_automation_due(automation, now) is False
-
-    def test_daily_automation_due_next_day(self):
-        """Daily automation is due the next day."""
-        # Every day at 9:00 AM
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test",
-            trigger={"type": "cron", "schedule": "0 9 * * *", "timezone": "UTC"},
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=True,
-            last_triggered_at=_utc(2026, 3, 15, 9, 0, 5),
-        )
-
-        # Next day after 9:00 AM
-        now = _utc(2026, 3, 16, 9, 30, 0)
-        assert is_automation_due(automation, now) is True
-
-    def test_automation_due_with_timezone(self):
-        """Automation with non-UTC timezone fires at correct time."""
-        # Schedule: 9:00 AM America/New_York (EDT = UTC-4 in March)
-        # Created at 12:00 UTC (8:00 AM EDT) - before 9 AM EDT
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test",
-            trigger={
-                "type": "cron",
-                "schedule": "0 9 * * *",
-                "timezone": "America/New_York",
-            },
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=True,
-            last_triggered_at=None,
-            created_at=_utc(2026, 3, 15, 12, 0, 0),  # 8:00 AM EDT
-        )
-
-        # At 12:30 UTC (8:30 AM EDT) - before 9 AM EDT, not due
-        now_before = _utc(2026, 3, 15, 12, 30, 0)
-        assert is_automation_due(automation, now_before) is False
-
-        # At 13:30 UTC (9:30 AM EDT) - after 9 AM EDT, should be due
-        now_after = _utc(2026, 3, 15, 13, 30, 0)
-        assert is_automation_due(automation, now_after) is True
-
-    def test_automation_not_due_with_timezone_before_schedule(self):
-        """Automation with timezone is not due before its scheduled time."""
-        # Schedule: 9:00 AM America/Los_Angeles (PDT = UTC-7 in March)
-        # Created at 14:00 UTC (7:00 AM PDT)
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test",
-            trigger={
-                "type": "cron",
-                "schedule": "0 9 * * *",
-                "timezone": "America/Los_Angeles",
-            },
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=True,
-            last_triggered_at=None,
-            created_at=_utc(2026, 3, 15, 14, 0, 0),  # 7:00 AM PDT
-        )
-
-        # At 15:00 UTC (8:00 AM PDT) - still before 9 AM PDT
-        now = _utc(2026, 3, 15, 15, 0, 0)
-        assert is_automation_due(automation, now) is False
-
-        # At 16:30 UTC (9:30 AM PDT) - after 9 AM PDT, should be due
-        now_due = _utc(2026, 3, 15, 16, 30, 0)
-        assert is_automation_due(automation, now_due) is True
-
-
-class TestPollAndSchedule:
-    """Tests for poll_and_schedule function (atomic poll + run creation)."""
-
-    async def test_poll_creates_runs_for_due_automations(self, async_session_factory):
-        """Creates pending runs for automations that are due."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Due Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_triggered_at=None,
-                created_at=utcnow() - timedelta(minutes=5),
-            )
-            session.add(automation)
-            await session.commit()
-            automation_id = automation.id
-
-        runs = await poll_and_schedule(async_session_factory)
-
-        assert len(runs) == 1
-        assert runs[0].automation_id == automation_id
-        assert runs[0].status == AutomationRunStatus.PENDING
-
-    async def test_poll_excludes_disabled(self, async_session_factory):
-        """Disabled automations are not returned."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Disabled Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=False,
-            )
-            session.add(automation)
-            await session.commit()
-
-        runs = await poll_and_schedule(async_session_factory)
-
-        assert len(runs) == 0
-
-    async def test_poll_excludes_deleted(self, async_session_factory):
-        """Deleted automations are not returned."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Deleted Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                deleted_at=utcnow(),
-            )
-            session.add(automation)
-            await session.commit()
-
-        runs = await poll_and_schedule(async_session_factory)
-
-        assert len(runs) == 0
-
-    async def test_poll_excludes_recently_triggered(self, async_session_factory):
-        """Recently triggered automations are not returned as due."""
-        now = utcnow()
-        async with async_session_factory() as session:
-            # Triggered AFTER the most recent cron fire time → not due.
-            # Use 'now' as last_triggered_at so prev_fire_time is always earlier.
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Recently Triggered",
-                trigger={"type": "cron", "schedule": "0 9 * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_triggered_at=now,
-            )
-            session.add(automation)
-            await session.commit()
-
-        runs = await poll_and_schedule(async_session_factory)
-
-        assert len(runs) == 0
-
-    async def test_poll_updates_last_polled_at(self, async_session_factory):
-        """Polling updates last_polled_at for due automations."""
-        async with async_session_factory() as session:
-            # Create an automation that IS due: every-minute schedule,
-            # created well in the past so prev_fire_time > created_at.
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_polled_at=None,
-                created_at=utcnow() - timedelta(minutes=5),
-            )
-            session.add(automation)
-            await session.commit()
-            automation_id = automation.id
-
-        await poll_and_schedule(async_session_factory)
-
-        async with async_session_factory() as session:
-            from sqlalchemy import select
-
-            result = await session.execute(
-                select(Automation).where(Automation.id == automation_id)
-            )
-            updated = result.scalars().first()
-            assert updated.last_polled_at is not None
-
-    async def test_poll_skips_recently_polled(self, async_session_factory):
-        """Automations polled within POLL_INTERVAL_SECONDS are skipped."""
-        now = utcnow()
-        recent_poll_time = now - timedelta(seconds=POLL_INTERVAL_SECONDS // 2)
-
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Recently Polled",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_polled_at=recent_poll_time,
-            )
-            session.add(automation)
-            await session.commit()
-
-        runs = await poll_and_schedule(async_session_factory)
-
-        assert len(runs) == 0
-
-    async def test_poll_returns_old_polled_automations(self, async_session_factory):
-        """Automations polled longer than POLL_INTERVAL_SECONDS ago are returned."""
-        now = utcnow()
-        old_poll_time = now - timedelta(seconds=POLL_INTERVAL_SECONDS + 10)
-
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Old Polled",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_polled_at=old_poll_time,
-                last_triggered_at=None,
-                created_at=now - timedelta(minutes=5),
-            )
-            session.add(automation)
-            await session.commit()
-            automation_id = automation.id
-
-        runs = await poll_and_schedule(async_session_factory)
-
-        assert len(runs) == 1
-        assert runs[0].automation_id == automation_id
-
-    async def test_poll_respects_batch_size(self, async_session_factory):
-        """Polling respects batch_size limit."""
-        now = utcnow()
-        async with async_session_factory() as session:
-            # Create more automations than the batch size
-            for i in range(5):
-                automation = Automation(
-                    user_id=TEST_USER_ID,
-                    org_id=TEST_ORG_ID,
-                    name=f"Automation {i}",
-                    trigger={
-                        "type": "cron",
-                        "schedule": "* * * * *",
-                        "timezone": "UTC",
-                    },
-                    tarball_path="s3://bucket/code.tar.gz",
-                    entrypoint="uv run main.py",
-                    enabled=True,
-                    last_polled_at=None,
-                    last_triggered_at=None,
-                    created_at=now - timedelta(minutes=5),
-                )
-                session.add(automation)
-            await session.commit()
-
-        runs = await poll_and_schedule(async_session_factory, batch_size=2)
-
-        assert len(runs) == 2
-
-    async def test_poll_orders_by_oldest_polled_first(self, async_session_factory):
-        """Polling returns oldest-polled automations first."""
-        now = utcnow()
-        created_at = now - timedelta(minutes=5)
-
-        async with async_session_factory() as session:
-            # Create automations with different last_polled_at times
-            old_automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Old",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_polled_at=now - timedelta(hours=2),
-                last_triggered_at=None,
-                created_at=created_at,
-            )
-            newer_automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Newer",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_polled_at=now - timedelta(hours=1),
-                last_triggered_at=None,
-                created_at=created_at,
-            )
-            never_polled = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Never Polled",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_polled_at=None,
-                last_triggered_at=None,
-                created_at=created_at,
-            )
-            session.add_all([newer_automation, old_automation, never_polled])
-            await session.commit()
-
-        runs = await poll_and_schedule(async_session_factory, batch_size=2)
-
-        assert len(runs) == 2
-
-    async def test_batch_rotates_to_different_automation_after_poll(
-        self, async_session_factory
-    ):
-        """With batch_size=1, consecutive polls pick different automations.
-
-        This verifies that updating last_polled_at moves the automation to the
-        back of the queue, so the next poll picks a different one.
-        """
-        now = utcnow()
-        created_at = now - timedelta(minutes=5)
-
-        async with async_session_factory() as session:
-            # Create two due automations with NULL last_polled_at
-            automation_a = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Automation A",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_polled_at=None,
-                last_triggered_at=None,
-                created_at=created_at,
-            )
-            automation_b = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Automation B",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_polled_at=None,
-                last_triggered_at=None,
-                created_at=created_at,
-            )
-            session.add_all([automation_a, automation_b])
-            await session.commit()
-            id_a = automation_a.id
-            id_b = automation_b.id
-
-        # First poll with batch_size=1: should pick one automation
-        runs_first = await poll_and_schedule(async_session_factory, batch_size=1)
-        assert len(runs_first) == 1
-        first_automation_id = runs_first[0].automation_id
-
-        # Second poll with batch_size=1: should pick the OTHER automation
-        # because the first one now has a recent last_polled_at
-        runs_second = await poll_and_schedule(async_session_factory, batch_size=1)
-        assert len(runs_second) == 1
-        second_automation_id = runs_second[0].automation_id
-
-        # Verify we picked different automations
-        assert first_automation_id != second_automation_id
-        assert {first_automation_id, second_automation_id} == {id_a, id_b}
-
-    async def test_last_polled_at_updated_even_when_not_due(
-        self, async_session_factory
-    ):
-        """last_polled_at is updated for all polled automations, not just due ones.
-
-        This ensures fair batch rotation even when an automation is polled but
-        not triggered (e.g., cron not yet due).
-        """
-        now = utcnow()
-
-        async with async_session_factory() as session:
-            # Create a NOT due automation: recently triggered, so prev_fire_time
-            # is before last_triggered_at
-            not_due_automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Not Due Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_polled_at=None,
-                last_triggered_at=now,  # Just triggered, so not due again yet
-                created_at=now - timedelta(minutes=5),
-            )
-            session.add(not_due_automation)
-            await session.commit()
-            automation_id = not_due_automation.id
-
-        # Poll - should return no runs since the automation is not due
-        runs = await poll_and_schedule(async_session_factory)
-        assert len(runs) == 0
-
-        # But last_polled_at should still be updated
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(Automation).where(Automation.id == automation_id)
-            )
-            updated = result.scalars().first()
-            assert updated.last_polled_at is not None
-
-    async def test_batch_rotates_with_mix_of_due_and_not_due(
-        self, async_session_factory
-    ):
-        """With batch_size=1, rotation works correctly with due and non-due automations.
-
-        First poll picks a non-due automation and updates its last_polled_at.
-        Second poll picks the due automation (not the same non-due one).
-        """
-        now = utcnow()
-        created_at = now - timedelta(minutes=5)
-
-        async with async_session_factory() as session:
-            # Non-due automation (recently triggered)
-            not_due = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Not Due",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_polled_at=None,
-                last_triggered_at=now,  # Just triggered
-                created_at=created_at,
-            )
-            # Due automation (never triggered)
-            due = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Due",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_polled_at=None,
-                last_triggered_at=None,
-                created_at=created_at,
-            )
-            session.add_all([not_due, due])
-            await session.commit()
-            not_due_id = not_due.id
-            due_id = due.id
-
-        # First poll with batch_size=1: picks one automation (order not guaranteed)
-        runs_first = await poll_and_schedule(async_session_factory, batch_size=1)
-
-        # Second poll with batch_size=1: should pick the OTHER automation
-        runs_second = await poll_and_schedule(async_session_factory, batch_size=1)
-
-        # Together, we should have exactly 1 run (from the due automation)
-        all_runs = runs_first + runs_second
-        assert len(all_runs) == 1
-        assert all_runs[0].automation_id == due_id
-
-        # Verify both automations have last_polled_at set
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(Automation).where(Automation.id.in_([not_due_id, due_id]))
-            )
-            automations = result.scalars().all()
-            for automation in automations:
-                assert automation.last_polled_at is not None
-
-
-class TestSchedulerLoop:
-    """Tests for scheduler_loop function."""
-
-    async def test_scheduler_loop_exits_on_shutdown(self, async_session_factory):
-        """Scheduler exits gracefully when shutdown event is set."""
-        shutdown_event = asyncio.Event()
-
-        # Start the scheduler with a short interval
-        task = asyncio.create_task(
-            scheduler_loop(
-                async_session_factory,
-                interval_seconds=1,
-                shutdown_event=shutdown_event,
-            )
-        )
-
-        # Give it a moment to start
-        await asyncio.sleep(0.1)
-
-        # Signal shutdown
-        shutdown_event.set()
-
-        # Should exit within a reasonable time
-        try:
-            await asyncio.wait_for(task, timeout=2.0)
-        except TimeoutError:
-            task.cancel()
-            pytest.fail("Scheduler did not exit on shutdown signal")
-
-    async def test_scheduler_loop_polls_automations(
-        self, async_session_factory, caplog
-    ):
-        """Scheduler polls and creates pending runs for due automations."""
-        # Create a due automation (created in the past so it's due)
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test Due Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_triggered_at=None,
-                created_at=utcnow() - timedelta(minutes=5),
-            )
-            session.add(automation)
-            await session.commit()
-            automation_id = automation.id
-
-        shutdown_event = asyncio.Event()
-
-        # Run scheduler briefly with logging capture
-        import logging
-
-        with caplog.at_level(logging.INFO, logger="automation.scheduler"):
-            task = asyncio.create_task(
-                scheduler_loop(
-                    async_session_factory,
-                    interval_seconds=60,  # Long interval, we'll stop it quickly
-                    shutdown_event=shutdown_event,
-                )
-            )
-
-            # Let it run one poll cycle
-            await asyncio.sleep(0.2)
-
-            # Stop the scheduler
-            shutdown_event.set()
-            await asyncio.wait_for(task, timeout=2.0)
-
-        # Check logs for the due automation
-        assert any("Test Due Automation" in record.message for record in caplog.records)
-        assert any(
-            "Found 1 due automation" in record.message for record in caplog.records
-        )
-        assert any("Created pending run" in record.message for record in caplog.records)
-
-        # Verify a pending run was created
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(AutomationRun).where(
-                    AutomationRun.automation_id == automation_id
-                )
-            )
-            runs = result.scalars().all()
-            assert len(runs) == 1
-            assert runs[0].status == AutomationRunStatus.PENDING
-
-
-class TestCreatePendingRun:
-    """Tests for create_pending_run function."""
-
-    async def test_creates_pending_run(self, async_session_factory):
-        """Creates a run with PENDING status."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            run = await create_pending_run(session, automation)
-            await session.commit()
-
-            assert run.id is not None
-            assert run.automation_id == automation.id
-            assert run.status == AutomationRunStatus.PENDING
-            assert run.error_detail is None
-
-    async def test_updates_last_triggered_at(self, async_session_factory):
-        """Updates automation's last_triggered_at timestamp."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-                last_triggered_at=None,
-            )
-            session.add(automation)
-            await session.commit()
-            automation_id = automation.id
-
-            await create_pending_run(session, automation)
-            await session.commit()
-
-        # Verify last_triggered_at was updated
-        async with async_session_factory() as session:
-            result = await session.execute(
-                select(Automation).where(Automation.id == automation_id)
-            )
-            updated = result.scalars().first()
-            assert updated.last_triggered_at is not None
-
-    async def test_multiple_runs_for_same_automation(self, async_session_factory):
-        """Can create multiple runs for the same automation."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Test Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            run1 = await create_pending_run(session, automation)
-            run2 = await create_pending_run(session, automation)
-            await session.commit()
-
-            assert run1.id != run2.id
-            assert run1.automation_id == run2.automation_id
-
-            # Verify both runs exist
-            result = await session.execute(
-                select(func.count())
-                .select_from(AutomationRun)
-                .where(AutomationRun.automation_id == automation.id)
-            )
-            count = result.scalar()
-            assert count == 2
diff --git a/tests/test_watchdog.py b/tests/test_watchdog.py
deleted file mode 100644
index cfed531..0000000
--- a/tests/test_watchdog.py
+++ /dev/null
@@ -1,373 +0,0 @@
-"""Tests for the watchdog module.
-
-The watchdog processes stale runs (RUNNING but past timeout_at) and marks them
-with appropriate status based on sandbox verification results.
-"""
-
-import uuid
-from datetime import timedelta
-from unittest.mock import AsyncMock, patch
-
-import pytest
-
-from automation.models import Automation, AutomationRun, AutomationRunStatus
-from automation.utils import utcnow
-from automation.utils.sandbox import VerificationResult
-from automation.watchdog import _verify_and_mark_run
-
-
-# Test UUIDs
-TEST_USER_ID = uuid.UUID("12345678-1234-5678-1234-567812345678")
-TEST_ORG_ID = uuid.UUID("87654321-4321-8765-4321-876543218765")
-
-
-@pytest.fixture
-async def automation_with_run(async_session_factory):
-    """Create an automation with a RUNNING run that is past timeout."""
-    async with async_session_factory() as session:
-        automation = Automation(
-            user_id=TEST_USER_ID,
-            org_id=TEST_ORG_ID,
-            name="Test Automation",
-            trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-            tarball_path="s3://bucket/code.tar.gz",
-            entrypoint="uv run main.py",
-            enabled=True,
-            timeout=60,
-        )
-        session.add(automation)
-        await session.commit()
-
-        now = utcnow()
-        run = AutomationRun(
-            automation_id=automation.id,
-            status=AutomationRunStatus.RUNNING,
-            sandbox_id="test-sandbox-123",
-            started_at=now - timedelta(minutes=5),
-            timeout_at=now - timedelta(minutes=1),  # Already past timeout
-        )
-        session.add(run)
-        await session.commit()
-
-        yield {"automation": automation, "run": run, "run_id": run.id}
-
-
-class TestVerifyAndMarkRunExitCodes:
-    """Tests for _verify_and_mark_run handling different exit codes."""
-
-    @pytest.mark.asyncio
-    async def test_exit_code_0_marks_completed(
-        self, async_session_factory, automation_with_run, mock_settings
-    ):
-        """Exit code 0 means command succeeded - mark as COMPLETED."""
-        run_id = automation_with_run["run_id"]
-
-        verification = VerificationResult(
-            verified=True,
-            success=True,
-            exit_code=0,
-            stdout="Success output",
-            stderr="",
-        )
-
-        with (
-            patch(
-                "automation.watchdog.verify_run_status",
-                new_callable=AsyncMock,
-                return_value=verification,
-            ),
-            patch(
-                "automation.watchdog.get_api_key_for_automation_run",
-                new_callable=AsyncMock,
-                return_value="test-api-key",
-            ),
-        ):
-            async with async_session_factory() as session:
-                run = await session.get(AutomationRun, run_id)
-                result = await _verify_and_mark_run(session, run, mock_settings)
-                await session.commit()
-
-        assert result is True
-
-        # Verify the run was marked as COMPLETED
-        async with async_session_factory() as session:
-            run = await session.get(AutomationRun, run_id)
-            assert run.status == AutomationRunStatus.COMPLETED
-            assert run.completed_at is not None
-            assert run.error_detail is None
-
-    @pytest.mark.asyncio
-    async def test_exit_code_minus_1_marks_timed_out(
-        self, async_session_factory, automation_with_run, mock_settings
-    ):
-        """Exit code -1 means command was killed/timed out."""
-        run_id = automation_with_run["run_id"]
-
-        verification = VerificationResult(
-            verified=True,
-            success=False,
-            exit_code=-1,
-            stdout="",
-            stderr="Command timed out after 60 seconds",
-        )
-
-        with (
-            patch(
-                "automation.watchdog.verify_run_status",
-                new_callable=AsyncMock,
-                return_value=verification,
-            ),
-            patch(
-                "automation.watchdog.get_api_key_for_automation_run",
-                new_callable=AsyncMock,
-                return_value="test-api-key",
-            ),
-        ):
-            async with async_session_factory() as session:
-                run = await session.get(AutomationRun, run_id)
-                result = await _verify_and_mark_run(session, run, mock_settings)
-                await session.commit()
-
-        assert result is True
-
-        # Verify the run was marked as FAILED with timeout message
-        async with async_session_factory() as session:
-            run = await session.get(AutomationRun, run_id)
-            assert run.status == AutomationRunStatus.FAILED
-            assert run.completed_at is not None
-            assert "Timed out" in run.error_detail
-            assert "timed out" in run.error_detail.lower()
-
-    @pytest.mark.asyncio
-    async def test_exit_code_none_marks_timed_out(
-        self, async_session_factory, automation_with_run, mock_settings
-    ):
-        """Exit code None means command was killed - mark as FAILED with timeout."""
-        run_id = automation_with_run["run_id"]
-
-        verification = VerificationResult(
-            verified=True,
-            success=False,
-            exit_code=None,
-            stdout="",
-            stderr="",
-        )
-
-        with (
-            patch(
-                "automation.watchdog.verify_run_status",
-                new_callable=AsyncMock,
-                return_value=verification,
-            ),
-            patch(
-                "automation.watchdog.get_api_key_for_automation_run",
-                new_callable=AsyncMock,
-                return_value="test-api-key",
-            ),
-        ):
-            async with async_session_factory() as session:
-                run = await session.get(AutomationRun, run_id)
-                result = await _verify_and_mark_run(session, run, mock_settings)
-                await session.commit()
-
-        assert result is True
-
-        # Verify the run was marked as FAILED with timeout message
-        async with async_session_factory() as session:
-            run = await session.get(AutomationRun, run_id)
-            assert run.status == AutomationRunStatus.FAILED
-            assert run.completed_at is not None
-            assert "Timed out" in run.error_detail
-
-    @pytest.mark.asyncio
-    async def test_nonzero_exit_code_marks_failed_without_timeout(
-        self, async_session_factory, automation_with_run, mock_settings
-    ):
-        """Non-zero exit code (not -1) means command failed."""
-        run_id = automation_with_run["run_id"]
-
-        verification = VerificationResult(
-            verified=True,
-            success=False,
-            exit_code=1,
-            stdout="Some output",
-            stderr="Error: something went wrong",
-        )
-
-        with (
-            patch(
-                "automation.watchdog.verify_run_status",
-                new_callable=AsyncMock,
-                return_value=verification,
-            ),
-            patch(
-                "automation.watchdog.get_api_key_for_automation_run",
-                new_callable=AsyncMock,
-                return_value="test-api-key",
-            ),
-        ):
-            async with async_session_factory() as session:
-                run = await session.get(AutomationRun, run_id)
-                result = await _verify_and_mark_run(session, run, mock_settings)
-                await session.commit()
-
-        assert result is True
-
-        # Verify the run was marked as FAILED with exit code (not timeout)
-        async with async_session_factory() as session:
-            run = await session.get(AutomationRun, run_id)
-            assert run.status == AutomationRunStatus.FAILED
-            assert run.completed_at is not None
-            assert "exit_code=1" in run.error_detail
-            assert "Timed out" not in run.error_detail
-            assert "stderr: Error: something went wrong" in run.error_detail
-
-    @pytest.mark.asyncio
-    async def test_exit_code_127_marks_failed_without_timeout(
-        self, async_session_factory, automation_with_run, mock_settings
-    ):
-        """Exit code 127 (command not found) - mark as FAILED without timeout."""
-        run_id = automation_with_run["run_id"]
-
-        verification = VerificationResult(
-            verified=True,
-            success=False,
-            exit_code=127,
-            stdout="",
-            stderr="bash: command not found",
-        )
-
-        with (
-            patch(
-                "automation.watchdog.verify_run_status",
-                new_callable=AsyncMock,
-                return_value=verification,
-            ),
-            patch(
-                "automation.watchdog.get_api_key_for_automation_run",
-                new_callable=AsyncMock,
-                return_value="test-api-key",
-            ),
-        ):
-            async with async_session_factory() as session:
-                run = await session.get(AutomationRun, run_id)
-                result = await _verify_and_mark_run(session, run, mock_settings)
-                await session.commit()
-
-        assert result is True
-
-        # Verify the run was marked as FAILED with exit code (not timeout)
-        async with async_session_factory() as session:
-            run = await session.get(AutomationRun, run_id)
-            assert run.status == AutomationRunStatus.FAILED
-            assert "exit_code=127" in run.error_detail
-            assert "Timed out" not in run.error_detail
-
-
-class TestVerifyAndMarkRunVerificationFailed:
-    """Tests for _verify_and_mark_run when verification fails."""
-
-    @pytest.mark.asyncio
-    async def test_verification_failed_marks_timed_out(
-        self, async_session_factory, automation_with_run, mock_settings
-    ):
-        """When verification fails (sandbox unavailable), mark as timed out."""
-        run_id = automation_with_run["run_id"]
-
-        verification = VerificationResult(
-            verified=False,
-            error="Sandbox not available",
-        )
-
-        with (
-            patch(
-                "automation.watchdog.verify_run_status",
-                new_callable=AsyncMock,
-                return_value=verification,
-            ),
-            patch(
-                "automation.watchdog.get_api_key_for_automation_run",
-                new_callable=AsyncMock,
-                return_value="test-api-key",
-            ),
-            patch(
-                "automation.watchdog.cleanup_sandbox",
-                new_callable=AsyncMock,
-            ) as mock_cleanup,
-        ):
-            async with async_session_factory() as session:
-                run = await session.get(AutomationRun, run_id)
-                result = await _verify_and_mark_run(session, run, mock_settings)
-                await session.commit()
-
-        assert result is True
-        mock_cleanup.assert_called_once()
-
-        # Verify the run was marked as FAILED with timeout message
-        async with async_session_factory() as session:
-            run = await session.get(AutomationRun, run_id)
-            assert run.status == AutomationRunStatus.FAILED
-            assert run.completed_at is not None
-            assert "Timed out" in run.error_detail
-            assert "Sandbox not available" in run.error_detail
-
-    @pytest.mark.asyncio
-    async def test_verification_failed_no_cleanup_if_keep_alive(
-        self, async_session_factory, mock_settings
-    ):
-        """When keep_alive is True, don't cleanup sandbox on verification failure."""
-        async with async_session_factory() as session:
-            automation = Automation(
-                user_id=TEST_USER_ID,
-                org_id=TEST_ORG_ID,
-                name="Keep Alive Automation",
-                trigger={"type": "cron", "schedule": "* * * * *", "timezone": "UTC"},
-                tarball_path="s3://bucket/code.tar.gz",
-                entrypoint="uv run main.py",
-                enabled=True,
-            )
-            session.add(automation)
-            await session.commit()
-
-            now = utcnow()
-            run = AutomationRun(
-                automation_id=automation.id,
-                status=AutomationRunStatus.RUNNING,
-                sandbox_id="test-sandbox-456",
-                started_at=now - timedelta(minutes=5),
-                timeout_at=now - timedelta(minutes=1),
-                keep_alive=True,
-            )
-            session.add(run)
-            await session.commit()
-            run_id = run.id
-
-        verification = VerificationResult(
-            verified=False,
-            error="Sandbox not available",
-        )
-
-        with (
-            patch(
-                "automation.watchdog.verify_run_status",
-                new_callable=AsyncMock,
-                return_value=verification,
-            ),
-            patch(
-                "automation.watchdog.get_api_key_for_automation_run",
-                new_callable=AsyncMock,
-                return_value="test-api-key",
-            ),
-            patch(
-                "automation.watchdog.cleanup_sandbox",
-                new_callable=AsyncMock,
-            ) as mock_cleanup,
-        ):
-            async with async_session_factory() as session:
-                run = await session.get(AutomationRun, run_id)
-                result = await _verify_and_mark_run(session, run, mock_settings)
-                await session.commit()
-
-        assert result is True
-        # Cleanup should NOT be called when keep_alive is True
-        mock_cleanup.assert_not_called()
diff --git a/uv.lock b/uv.lock
index 67ef337..604a507 100644
--- a/uv.lock
+++ b/uv.lock
@@ -2070,6 +2070,18 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/81/08/7036c080d7117f28a4af526d794aab6a84463126db031b007717c1a6676e/multidict-6.7.1-py3-none-any.whl", hash = "sha256:55d97cc6dae627efa6a6e548885712d4864b81110ac76fa4e534c03819fa4a56", size = 12319, upload-time = "2026-01-26T02:46:44.004Z" },
 ]
 
+[[package]]
+name = "nexus-rpc"
+version = "1.4.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/35/d5/cd1ffb202b76ebc1b33c1332a3416e55a39929006982adc2b1eb069aaa9b/nexus_rpc-1.4.0.tar.gz", hash = "sha256:3b8b373d4865671789cc43623e3dc0bcbf192562e40e13727e17f1c149050fba", size = 82367, upload-time = "2026-02-25T22:01:34.053Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/11/52/6327a5f4fda01207205038a106a99848a41c83e933cd23ea2cab3d2ebc6c/nexus_rpc-1.4.0-py3-none-any.whl", hash = "sha256:14c953d3519113f8ccec533a9efdb6b10c28afef75d11cdd6d422640c40b3a49", size = 29645, upload-time = "2026-02-25T22:01:33.122Z" },
+]
+
 [[package]]
 name = "nodeenv"
 version = "1.10.0"
@@ -2146,6 +2158,7 @@ dependencies = [
     { name = "pydantic-settings" },
     { name = "python-json-logger" },
     { name = "sqlalchemy", extra = ["asyncio"] },
+    { name = "temporalio" },
     { name = "tenacity" },
     { name = "uvicorn", extra = ["standard"] },
 ]
@@ -2181,6 +2194,7 @@ requires-dist = [
     { name = "pydantic-settings", specifier = ">=2" },
     { name = "python-json-logger", specifier = ">=3" },
     { name = "sqlalchemy", extras = ["asyncio"], specifier = ">=2" },
+    { name = "temporalio", specifier = ">=1.9.0" },
     { name = "tenacity", specifier = ">=9.1.4" },
     { name = "uvicorn", extras = ["standard"], specifier = ">=0.30" },
 ]
@@ -3451,6 +3465,25 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/81/0d/13d1d239a25cbfb19e740db83143e95c772a1fe10202dda4b76792b114dd/starlette-0.52.1-py3-none-any.whl", hash = "sha256:0029d43eb3d273bc4f83a08720b4912ea4b071087a3b48db01b7c839f7954d74", size = 74272, upload-time = "2026-01-18T13:34:09.188Z" },
 ]
 
+[[package]]
+name = "temporalio"
+version = "1.24.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "nexus-rpc" },
+    { name = "protobuf" },
+    { name = "types-protobuf" },
+    { name = "typing-extensions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/a7/b1/7d9b3104ab7994e7d49e765b92495aaff44810b1e066c874c284a93ebd55/temporalio-1.24.0.tar.gz", hash = "sha256:e534e2e71b4a721193ec4ff3dae521146d093554bd47a64f5605d4ca33e56718", size = 2040485, upload-time = "2026-03-23T15:33:33.638Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/84/a9/30517c21d6155bce1c3dc0e420db48da0231230dbc683f40ab6d5fe22b37/temporalio-1.24.0-cp310-abi3-macosx_10_12_x86_64.whl", hash = "sha256:7f11e7b4f4d09bafba499b43188353e23dc128b1fe3f3160014476e3dce70760", size = 12223918, upload-time = "2026-03-23T15:33:05.045Z" },
+    { url = "https://files.pythonhosted.org/packages/73/d0/11aa103bde794524008c1850a84e06cde98698395ca1f8b12e1bd2390aa8/temporalio-1.24.0-cp310-abi3-macosx_11_0_arm64.whl", hash = "sha256:5cff75a0ca922575b808a7fca1b0de38f6eea061f49e026664b8be9d5bb06ab8", size = 11708887, upload-time = "2026-03-23T15:33:11.67Z" },
+    { url = "https://files.pythonhosted.org/packages/1d/f4/774b56100e6bb94e3757ec96fb5c2bc62d42defc7d6de0ee35a12273827a/temporalio-1.24.0-cp310-abi3-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:ee7c13b6724dd0c304aa846aecf6da72a8550f4ade40a0a7f6dcc1c92ef35710", size = 12028303, upload-time = "2026-03-23T15:33:18.022Z" },
+    { url = "https://files.pythonhosted.org/packages/e5/91/c05d0e9c2432fe8b1ea0d6fae321866ee49a320ad5e494e6ec9424ca5c28/temporalio-1.24.0-cp310-abi3-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:aa71b9bfa42f951dd04ade97ce7f92ecedee8903047b4b41b122bb8cbd87a337", size = 12375155, upload-time = "2026-03-23T15:33:24.234Z" },
+    { url = "https://files.pythonhosted.org/packages/c4/97/5c939e4609c164c8690a3b5a135eb828d531de8ef63ff447a2a439c0b0fb/temporalio-1.24.0-cp310-abi3-win_amd64.whl", hash = "sha256:52f6833647eceddbebcc376e2ea663a9f73b2b3a42675f503aeb27c98fd4daeb", size = 12720174, upload-time = "2026-03-23T15:33:30.826Z" },
+]
+
 [[package]]
 name = "tenacity"
 version = "9.1.4"
@@ -3581,6 +3614,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/4a/91/48db081e7a63bb37284f9fbcefda7c44c277b18b0e13fbc36ea2335b71e6/typer-0.24.1-py3-none-any.whl", hash = "sha256:112c1f0ce578bfb4cab9ffdabc68f031416ebcc216536611ba21f04e9aa84c9e", size = 56085, upload-time = "2026-02-21T16:54:41.616Z" },
 ]
 
+[[package]]
+name = "types-protobuf"
+version = "7.34.1.20260403"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/ae/b3/c2e407ea36e0e4355c135127cee1b88a2cc9a2c92eafca50a360ab9f2708/types_protobuf-7.34.1.20260403.tar.gz", hash = "sha256:8d7881867888e667eb9563c08a916fccdc12bdb5f9f34c31d217cce876e36765", size = 68782, upload-time = "2026-04-03T04:18:09.428Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/7d/95/24fb0f6fe37b41cf94f9b9912712645e17d8048d4becaf37c1607ddd8e32/types_protobuf-7.34.1.20260403-py3-none-any.whl", hash = "sha256:16d9bbca52ab0f306279958878567df2520f3f5579059419b0ce149a0ad1e332", size = 86011, upload-time = "2026-04-03T04:18:08.245Z" },
+]
+
 [[package]]
 name = "typing-extensions"
 version = "4.15.0"