ci: use self-hosted netty runners for validation jobs

update crates.io link
release: v0.1.14 [skip ci]
2026-04-18 05:01:56 +00:00 · 2026-04-05 11:46:45 -04:00 · 2026-04-02 14:53:56 -04:00 · 2026-03-27 23:46:33 +00:00 · 2026-03-27 19:40:24 -04:00 · 2026-03-27 19:25:26 -04:00
63 changed files with 12315 additions and 647 deletions
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@ -1,18 +1,107 @@
 name: CI

 on:
+  pull_request:
+    branches: [main]
  push:
    branches: [main]
  workflow_dispatch:
+    inputs:
+      bump:
+        description: Version bump type (only for workflow_dispatch)
+        type: choice
+        options:
+          - patch
+          - minor
+          - major
+        default: patch
+      publish_npm:
+        description: Publish to npm
+        type: boolean
+        default: true
+      publish_crates:
+        description: Publish to crates.io
+        type: boolean
+        default: true
+
+env:
+  FORCE_JAVASCRIPT_ACTIONS_TO_NODE24: true

 permissions:
  contents: write
-  packages: write

 jobs:
-  cargo:
-    name: Cargo Build
-    runs-on: ${{ vars.UVA_RUNNER || 'ubuntu-latest' }}
+  changes:
+    name: Changes
+    runs-on: [self-hosted, netty]
+    outputs:
+      rust: ${{ steps.check.outputs.rust }}
+      version: ${{ steps.version.outputs.version }}
+      tag: ${{ steps.version.outputs.tag }}
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+
+      - uses: dorny/paths-filter@v3
+        id: filter
+        with:
+          filters: |
+            rust:
+              - 'src/**'
+              - 'tests/**'
+              - 'Cargo.toml'
+              - 'Cargo.lock'
+              - 'npm/**'
+              - 'flake.nix'
+              - 'flake.lock'
+              - 'docker/**'
+              - '.github/workflows/**'
+              - 'Makefile'
+
+      - name: Set outputs
+        id: check
+        run: |
+          if [ "${{ github.event_name }}" = "workflow_dispatch" ]; then
+            echo "rust=true" >> "$GITHUB_OUTPUT"
+          else
+            echo "rust=${{ steps.filter.outputs.rust }}" >> "$GITHUB_OUTPUT"
+          fi
+
+      - name: Calculate next version
+        id: version
+        if: github.event_name != 'pull_request' && steps.check.outputs.rust == 'true'
+        run: |
+          CURRENT=$(grep '^version' Cargo.toml | head -1 | sed 's/.*"\(.*\)"/\1/')
+          IFS='.' read -r MAJOR MINOR PATCH <<< "$CURRENT"
+
+          BUMP="${{ inputs.bump || 'patch' }}"
+          case "$BUMP" in
+            major) MAJOR=$((MAJOR + 1)); MINOR=0; PATCH=0 ;;
+            minor) MINOR=$((MINOR + 1)); PATCH=0 ;;
+            patch)
+              LATEST=$(git tag -l "v${MAJOR}.${MINOR}.*" | sort -V | tail -1)
+              if [ -z "$LATEST" ]; then
+                NEW_PATCH=$PATCH
+              else
+                LATEST_VER="${LATEST#v}"
+                IFS='.' read -r _ _ LATEST_PATCH <<< "$LATEST_VER"
+                NEW_PATCH=$((LATEST_PATCH + 1))
+              fi
+              PATCH=$NEW_PATCH
+              ;;
+          esac
+
+          NEW="${MAJOR}.${MINOR}.${PATCH}"
+          echo "version=${NEW}" >> "$GITHUB_OUTPUT"
+          echo "tag=v${NEW}" >> "$GITHUB_OUTPUT"
+          echo "Computed version: ${NEW} (v${NEW})"
+
+  validate:
+    name: Validate
+    needs: changes
+    if: needs.changes.outputs.rust == 'true'
+    runs-on: [self-hosted, netty]
    steps:
      - uses: actions/checkout@v4

@ -22,9 +111,141 @@ jobs:

      - uses: Swatinem/rust-cache@v2

+      - uses: pnpm/action-setup@v4
+        with:
+          version: 10
+          run_install: false
+
+      - uses: actions/setup-node@v4
+        with:
+          node-version: 22
+          cache: pnpm
+          cache-dependency-path: site/pnpm-lock.yaml
+
+      - name: Install site dependencies
+        run: pnpm --dir site install --frozen-lockfile
+
+      - name: Format check
+        run: make fmt-check
+
+      - name: Clippy
+        run: make lint
+
+      - name: Unit tests
+        run: make test-unit
+
+      - name: Site format check
+        run: make site-format-check
+
+  integration:
+    name: Integration (Xvfb)
+    needs: changes
+    if: needs.changes.outputs.rust == 'true'
+    runs-on: [self-hosted, netty]
+    steps:
+      - uses: actions/checkout@v4
+
+      - uses: dtolnay/rust-toolchain@stable
+
+      - uses: Swatinem/rust-cache@v2
+
+      - name: Xvfb integration tests
+        run: make test-integration
+
+  distribution:
+    name: Distribution Validate
+    needs: changes
+    if: needs.changes.outputs.rust == 'true'
+    runs-on: [self-hosted, netty]
+    steps:
+      - uses: actions/checkout@v4
+
+      - uses: dtolnay/rust-toolchain@stable
+
+      - uses: Swatinem/rust-cache@v2
+
+      - uses: actions/setup-node@v4
+        with:
+          node-version: 22
+
+      - name: Distribution validation
+        run: make dist-validate
+
+  # --- Release pipeline: update-manifests -> build -> release -> publish ---
+  # These stay on ubuntu-latest for artifact upload/download and registry publishing.
+
+  # Writes the version computed by the `changes` job into Cargo.toml,
+  # Cargo.lock, and the npm package manifest, then commits, tags, and pushes.
+  # Skipped for pull requests and when no release-relevant paths changed.
+  update-manifests:
+    name: Update Manifests
+    needs: [changes, validate, integration, distribution]
+    if: github.event_name != 'pull_request' && needs.changes.outputs.rust == 'true'
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+
+      - uses: dtolnay/rust-toolchain@stable
+
+      - uses: actions/setup-node@v4
+        with:
+          node-version: 22
+
+      - name: Update versions
+        run: |
+          CURRENT=$(grep '^version' Cargo.toml | head -1 | sed 's/.*"\(.*\)"/\1/')
+          NEW="${{ needs.changes.outputs.version }}"
+          if [ "$CURRENT" != "$NEW" ]; then
+            # The 0,/re/ address limits the substitution to the first match.
+            sed -i "0,/^version = \"${CURRENT}\"/s//version = \"${NEW}\"/" Cargo.toml
+            # Sync only the workspace package entry in Cargo.lock.
+            # `cargo generate-lockfile` would rebuild the lockfile with the
+            # latest version of every dependency, so the release would ship
+            # dependency versions the validation jobs never exercised.
+            cargo update --workspace
+          fi
+          # Always rewrite the npm manifest so it matches the release version.
+          node -e '
+            const fs = require("node:fs");
+            const p = "npm/deskctl/package.json";
+            const pkg = JSON.parse(fs.readFileSync(p, "utf8"));
+            pkg.version = process.argv[1];
+            fs.writeFileSync(p, JSON.stringify(pkg, null, 2) + "\n");
+          ' "$NEW"
+
+      - name: Commit, tag, and push
+        run: |
+          git config user.name "github-actions[bot]"
+          git config user.email "github-actions[bot]@users.noreply.github.com"
+          git add Cargo.toml Cargo.lock npm/deskctl/package.json
+          # Commit only when the manifests actually changed; the tag is
+          # created either way.
+          if ! git diff --cached --quiet; then
+            git commit -m "release: ${{ needs.changes.outputs.tag }} [skip ci]"
+          fi
+          git tag "${{ needs.changes.outputs.tag }}"
+          git push origin main --tags
+
+  build:
+    name: Build Release Asset
+    needs: [changes, update-manifests]
+    if: github.event_name != 'pull_request' && needs.changes.outputs.rust == 'true'
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          ref: ${{ needs.changes.outputs.tag }}
+
+      - uses: dtolnay/rust-toolchain@stable
+        with:
+          components: clippy
+
+      - uses: Swatinem/rust-cache@v2
+
      - name: Install system dependencies
        run: sudo apt-get update && sudo apt-get install -y libx11-dev libxtst-dev

+      - name: Verify version
+        run: |
+          CARGO_VER=$(grep '^version' Cargo.toml | head -1 | sed 's/.*"\(.*\)"/\1/')
+          EXPECTED="${{ needs.changes.outputs.version }}"
+          if [ "$CARGO_VER" != "$EXPECTED" ]; then
+            echo "Version mismatch: Cargo.toml=$CARGO_VER expected=$EXPECTED"
+            exit 1
+          fi
+          echo "Building version $CARGO_VER"
+
      - name: Clippy
        run: cargo clippy -- -D warnings

@ -37,72 +258,107 @@ jobs:
          path: target/release/deskctl
          retention-days: 7

-  docker:
-    name: Docker Build
-    runs-on: ${{ vars.UVA_RUNNER || 'ubuntu-latest' }}
-    steps:
-      - uses: actions/checkout@v4
-
-      - name: Get version
-        id: version
-        run: echo "version=$(grep '^version' Cargo.toml | head -1 | sed 's/.*"\(.*\)"/\1/')" >> "$GITHUB_OUTPUT"
-
-      - uses: docker/setup-buildx-action@v3
-
-      - uses: docker/login-action@v3
-        with:
-          registry: ghcr.io
-          username: ${{ github.actor }}
-          password: ${{ secrets.GITHUB_TOKEN }}
-
-      - uses: docker/build-push-action@v6
-        with:
-          context: .
-          file: docker/Dockerfile
-          push: true
-          tags: |
-            ghcr.io/${{ github.repository }}:latest
-            ghcr.io/${{ github.repository }}:v${{ steps.version.outputs.version }}
-          cache-from: type=gha
-          cache-to: type=gha,mode=max
-
  release:
    name: Release
-    needs: [cargo, docker]
+    needs: [changes, build, update-manifests]
+    if: github.event_name != 'pull_request' && needs.changes.outputs.rust == 'true'
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4

-      - name: Get version
-        id: version
-        run: echo "version=$(grep '^version' Cargo.toml | head -1 | sed 's/.*"\(.*\)"/\1/')" >> "$GITHUB_OUTPUT"
-
      - uses: actions/download-artifact@v4
        with:
          name: deskctl-linux-x86_64
          path: artifacts/

-      - name: Prepare release assets
-        run: |
-          chmod +x artifacts/deskctl
-          mv artifacts/deskctl artifacts/deskctl-linux-x86_64
-
-      - name: Create or update release
+      - name: Create release
        env:
          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
        run: |
-          TAG="v${{ steps.version.outputs.version }}"
-          IMAGE="ghcr.io/${{ github.repository }}:${TAG}"
-
-          BODY="## Artifacts
-          - **Binary:** \`deskctl-linux-x86_64\` (attached)
-          - **Docker:** \`docker pull ${IMAGE}\`"
-
-          if gh release view "$TAG" &>/dev/null; then
-            gh release upload "$TAG" artifacts/deskctl-linux-x86_64 --clobber
+          chmod +x artifacts/deskctl
+          mv artifacts/deskctl artifacts/deskctl-linux-x86_64
+          cd artifacts && sha256sum deskctl-linux-x86_64 > checksums.txt && cd ..
+          if gh release view "${{ needs.changes.outputs.tag }}" >/dev/null 2>&1; then
+            gh release upload "${{ needs.changes.outputs.tag }}" \
+              artifacts/deskctl-linux-x86_64 \
+              artifacts/checksums.txt \
+              --clobber
          else
-            gh release create "$TAG" \
-              --title "$TAG" \
-              --notes "${BODY}" \
-              artifacts/deskctl-linux-x86_64
+            gh release create "${{ needs.changes.outputs.tag }}" \
+              --title "${{ needs.changes.outputs.tag }}" \
+              --generate-notes \
+              artifacts/deskctl-linux-x86_64 \
+              artifacts/checksums.txt
          fi
+
+  publish-npm:
+    name: Publish npm
+    needs: [changes, update-manifests, release]
+    if: >-
+      github.event_name != 'pull_request'
+      && needs.changes.outputs.rust == 'true'
+      && (inputs.publish_npm == true || inputs.publish_npm == '')
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          ref: ${{ needs.changes.outputs.tag }}
+
+      - uses: actions/setup-node@v4
+        with:
+          node-version: 22
+          registry-url: https://registry.npmjs.org
+
+      - name: Check if already published
+        id: published
+        run: |
+          VERSION="${{ needs.changes.outputs.version }}"
+          if npm view "deskctl@${VERSION}" version >/dev/null 2>&1; then
+            echo "npm=true" >> "$GITHUB_OUTPUT"
+          else
+            echo "npm=false" >> "$GITHUB_OUTPUT"
+          fi
+
+      - name: Validate npm package
+        if: steps.published.outputs.npm != 'true'
+        run: node npm/deskctl/scripts/validate-package.js
+
+      - name: Publish npm
+        if: steps.published.outputs.npm != 'true'
+        env:
+          NODE_AUTH_TOKEN: ${{ secrets.NPM_TOKEN }}
+        run: npm publish ./npm/deskctl --access public
+
+  publish-crates:
+    name: Publish crates.io
+    needs: [changes, update-manifests, release]
+    if: >-
+      github.event_name != 'pull_request'
+      && needs.changes.outputs.rust == 'true'
+      && (inputs.publish_crates == true || inputs.publish_crates == '')
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          ref: ${{ needs.changes.outputs.tag }}
+
+      - uses: dtolnay/rust-toolchain@stable
+
+      - name: Install system dependencies
+        run: sudo apt-get update && sudo apt-get install -y libx11-dev libxtst-dev
+
+      - name: Check if already published
+        id: published
+        run: |
+          VERSION="${{ needs.changes.outputs.version }}"
+          if curl -fsSL "https://crates.io/api/v1/crates/deskctl/${VERSION}" >/dev/null 2>&1; then
+            echo "crates=true" >> "$GITHUB_OUTPUT"
+          else
+            echo "crates=false" >> "$GITHUB_OUTPUT"
+          fi
+
+      - name: Publish crates.io
+        if: steps.published.outputs.crates != 'true'
+        env:
+          CARGO_REGISTRY_TOKEN: ${{ secrets.CARGO_REGISTRY_TOKEN }}
+        run: cargo publish --locked
--- a/.gitignore
+++ b/.gitignore
@ -1,2 +1,9 @@
 target/
-.humanlayer/
+tmp/
+.vercel
+secret/
+.claude/
+.codex/
+openspec/
+npm/deskctl/vendor/
+npm/deskctl/*.tgz
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@ -0,0 +1,15 @@
+repos:
+  - repo: local
+    hooks:
+      - id: rustfmt
+        name: rustfmt
+        entry: cargo fmt --
+        language: system
+        files: \.rs$
+        pass_filenames: true
+      - id: site-format-check
+        name: site format check
+        entry: make site-format-check
+        language: system
+        files: ^site/
+        pass_filenames: false
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@ -0,0 +1,89 @@
+# Contributing
+
+## Prerequisites
+
+- Rust toolchain
+- `make`
+- `pre-commit` for commit-time hooks
+- `pnpm` for site formatting checks
+- Linux with `xvfb-run` for integration tests
+
+Install site dependencies before running site checks:
+
+```bash
+pnpm --dir site install
+```
+
+## Repository Layout
+
+- `src/lib.rs` exposes the library target used by integration tests
+- `src/main.rs` is the thin CLI binary wrapper
+- `src/` holds production code and unit tests
+- `tests/` holds integration tests
+- `tests/support/` holds shared X11 and daemon helpers for integration coverage
+- `docs/runtime-contract.md` is the stable-vs-best-effort runtime output contract for agent-facing CLI work
+
+Keep integration-only helpers out of `src/`.
+
+## Local Validation
+
+The repo uses one local validation surface through `make`:
+
+```bash
+make fmt-check
+make lint
+make test-unit
+make test-integration
+make site-format-check
+make cargo-publish-dry-run
+make npm-package-check
+make nix-flake-check
+make dist-validate
+make validate
+```
+
+`make validate` runs the full Phase 2 validation stack. It requires Linux, `xvfb-run`, and site dependencies to be installed.
+`make dist-validate` runs the distribution validation stack. It requires `npm`, `nix`, and Linux for the full npm runtime smoke path.
+
+## Pre-commit Hooks
+
+Install the hook workflow once:
+
+```bash
+pre-commit install
+```
+
+Run hooks across the repo on demand:
+
+```bash
+pre-commit run --all-files
+```
+
+The hook config intentionally stays small:
+
+- Rust files use default `rustfmt`
+- Site files reuse the existing `site/` Prettier setup
+- Slower checks stay in CI or `make validate`
+
+## Distribution Work
+
+Distribution support currently ships through:
+
+- crate: `deskctl`
+- npm package: `deskctl`
+- repo flake: `flake.nix`
+- command name on every channel: `deskctl`
+
+For maintainer release and publish steps, see [docs/releasing.md](docs/releasing.md).
+
+Source-build and packaging work should keep Docker as a local Linux build convenience, not as the canonical registry release path.
+
+## Integration Tests
+
+Integration coverage is Linux/X11-only in this phase. The supported local entrypoint is:
+
+```bash
+make test-integration
+```
+
+That command runs the top-level X11 integration tests under `xvfb-run` with one test thread so the shared display/session environment stays deterministic.
--- a/Cargo.lock
+++ b/Cargo.lock
@ -1,6 +1,6 @@
 # This file is automatically @generated by Cargo.
 # It is not intended for manual editing.
-version = 4
+version = 3

 [[package]]
 name = "ab_glyph"
@ -241,9 +241,9 @@ checksum = "1e748733b7cbc798e1434b6ac524f0c1ff2ab456fe201501e6497c8417a4fc33"

 [[package]]
 name = "cc"
-version = "1.2.57"
+version = "1.2.58"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "7a0dd1ca384932ff3641c8718a02769f1698e7563dc6974ffd03346116310423"
+checksum = "e1e928d4b69e3077709075a938a05ffbedfa53a84c8f766efbf8220bb1ff60e1"
 dependencies = [
 "find-msvc-tools",
 "jobserver",
@ -400,7 +400,7 @@ checksum = "460fbee9c2c2f33933d720630a6a0bac33ba7053db5344fac858d4b8952d77d5"

 [[package]]
 name = "deskctl"
-version = "0.1.0"
+version = "0.1.14"
 dependencies = [
 "ab_glyph",
 "anyhow",
@ -911,9 +911,9 @@ dependencies = [

 [[package]]
 name = "js-sys"
-version = "0.3.91"
+version = "0.3.92"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "b49715b7073f385ba4bc528e5747d02e66cb39c6146efb66b781f131f0fb399c"
+checksum = "cc4c90f45aa2e6eacbe8645f77fdea542ac97a494bcd117a67df9ff4d611f995"
 dependencies = [
 "once_cell",
 "wasm-bindgen",
@ -1039,9 +1039,9 @@ dependencies = [

 [[package]]
 name = "mio"
-version = "1.1.1"
+version = "1.2.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "a69bcab0ad47271a0234d9422b131806bf3968021e5dc9328caf2d4cd58557fc"
+checksum = "50b7e5b27aa02a74bac8c3f23f448f8d87ff11f92d3aac1a6ed369ee08cc56c1"
 dependencies = [
 "libc",
 "wasi",
@ -1699,9 +1699,9 @@ dependencies = [

 [[package]]
 name = "simd-adler32"
-version = "0.3.8"
+version = "0.3.9"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "e320a6c5ad31d271ad523dcf3ad13e2767ad8b1cb8f047f75a8aeaf8da139da2"
+checksum = "703d5c7ef118737c72f1af64ad2f6f8c5e1921f818cdcb97b8fe6fc69bf66214"

 [[package]]
 name = "simd_helpers"
@ -1861,9 +1861,9 @@ checksum = "06abde3611657adf66d383f00b093d7faecc7fa57071cce2578660c9f1010821"

 [[package]]
 name = "uuid"
-version = "1.22.0"
+version = "1.23.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "a68d3c8f01c0cfa54a75291d83601161799e4a89a39e0929f4b0354d88757a37"
+checksum = "5ac8b6f42ead25368cf5b098aeb3dc8a1a2c05a3eee8a9a1a68c640edbfc79d9"
 dependencies = [
 "getrandom 0.4.2",
 "js-sys",
@ -1907,9 +1907,9 @@ dependencies = [

 [[package]]
 name = "wasm-bindgen"
-version = "0.2.114"
+version = "0.2.115"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "6532f9a5c1ece3798cb1c2cfdba640b9b3ba884f5db45973a6f442510a87d38e"
+checksum = "6523d69017b7633e396a89c5efab138161ed5aafcbc8d3e5c5a42ae38f50495a"
 dependencies = [
 "cfg-if",
 "once_cell",
@ -1920,9 +1920,9 @@ dependencies = [

 [[package]]
 name = "wasm-bindgen-macro"
-version = "0.2.114"
+version = "0.2.115"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "18a2d50fcf105fb33bb15f00e7a77b772945a2ee45dcf454961fd843e74c18e6"
+checksum = "4e3a6c758eb2f701ed3d052ff5737f5bfe6614326ea7f3bbac7156192dc32e67"
 dependencies = [
 "quote",
 "wasm-bindgen-macro-support",
@ -1930,9 +1930,9 @@ dependencies = [

 [[package]]
 name = "wasm-bindgen-macro-support"
-version = "0.2.114"
+version = "0.2.115"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "03ce4caeaac547cdf713d280eda22a730824dd11e6b8c3ca9e42247b25c631e3"
+checksum = "921de2737904886b52bcbb237301552d05969a6f9c40d261eb0533c8b055fedf"
 dependencies = [
 "bumpalo",
 "proc-macro2",
@ -1943,9 +1943,9 @@ dependencies = [

 [[package]]
 name = "wasm-bindgen-shared"
-version = "0.2.114"
+version = "0.2.115"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "75a326b8c223ee17883a4251907455a2431acc2791c98c26279376490c378c16"
+checksum = "a93e946af942b58934c604527337bad9ae33ba1d5c6900bbb41c2c07c2364a93"
 dependencies = [
 "unicode-ident",
 ]
@ -2297,9 +2297,9 @@ dependencies = [

 [[package]]
 name = "zune-jpeg"
-version = "0.5.14"
+version = "0.5.15"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "0b7a1c0af6e5d8d1363f4994b7a091ccf963d8b694f7da5b0b9cceb82da2c0a6"
+checksum = "27bc9d5b815bc103f142aa054f561d9187d191692ec7c2d1e2b4737f8dbd7296"
 dependencies = [
 "zune-core",
 ]
--- a/Cargo.toml
+++ b/Cargo.toml
@ -1,10 +1,23 @@
 [package]
 name = "deskctl"
-version = "0.1.0"
+version = "0.1.14"
 edition = "2021"
 description = "X11 desktop control CLI for agents"
 license = "MIT"
 repository = "https://github.com/harivansh-afk/deskctl"
+homepage = "https://github.com/harivansh-afk/deskctl"
+readme = "README.md"
+keywords = ["x11", "desktop", "automation", "cli", "agent"]
+categories = ["command-line-utilities"]
+rust-version = "1.75"
+include = [
+  "/Cargo.toml",
+  "/Cargo.lock",
+  "/README.md",
+  "/LICENCE",
+  "/assets/**",
+  "/src/**",
+]

 [dependencies]
 clap = { version = "4", features = ["derive", "env"] }
--- a/21
+++ b/21
@ -0,0 +1,21 @@
+MIT License
+
+Copyright (c) 2026 Harivansh Rathi
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
--- a/63
+++ b/63
@ -0,0 +1,63 @@
+.PHONY: fmt fmt-check lint test-unit test-integration site-format-check cargo-publish-dry-run npm-package-check nix-flake-check dist-validate validate
+
+fmt:
+	cargo fmt --all
+
+fmt-check:
+	cargo fmt --all --check
+
+lint:
+	cargo clippy --all-targets -- -D warnings
+
+test-unit:
+	cargo test --lib
+
+test-integration:
+	@if [ "$$(uname -s)" != "Linux" ]; then \
+		echo "Integration tests require Linux and xvfb-run."; \
+		exit 1; \
+	fi
+	@if ! command -v xvfb-run >/dev/null 2>&1; then \
+		echo "xvfb-run is required to execute integration tests."; \
+		exit 1; \
+	fi
+	XDG_SESSION_TYPE=x11 xvfb-run -a cargo test --test x11_runtime -- --test-threads=1
+
+site-format-check:
+	@if ! command -v pnpm >/dev/null 2>&1; then \
+		echo "pnpm is required for site formatting checks."; \
+		exit 1; \
+	fi
+	pnpm --dir site format:check
+
+cargo-publish-dry-run:
+	cargo publish --dry-run --allow-dirty --locked
+
+npm-package-check:
+	@if ! command -v npm >/dev/null 2>&1; then \
+		echo "npm is required for npm packaging validation."; \
+		exit 1; \
+	fi
+	node npm/deskctl/scripts/validate-package.js
+	rm -rf tmp/npm-pack tmp/npm-install
+	mkdir -p tmp/npm-pack tmp/npm-install/bin
+	npm pack ./npm/deskctl --pack-destination ./tmp/npm-pack >/dev/null
+	@if [ "$$(uname -s)" != "Linux" ]; then \
+		echo "Skipping npm package runtime smoke test on non-Linux host."; \
+	else \
+		cargo build && \
+		PACK_TGZ=$$(ls ./tmp/npm-pack/*.tgz | head -n 1) && \
+		DESKCTL_BINARY_PATH="$$(pwd)/target/debug/deskctl" npm install --prefix ./tmp/npm-install "$${PACK_TGZ}" && \
+		./tmp/npm-install/node_modules/.bin/deskctl --version; \
+	fi
+
+nix-flake-check:
+	@if ! command -v nix >/dev/null 2>&1; then \
+		echo "nix is required for flake validation."; \
+		exit 1; \
+	fi
+	nix flake check
+
+dist-validate: test-unit cargo-publish-dry-run npm-package-check nix-flake-check
+
+validate: fmt-check lint test-unit test-integration site-format-check
--- a/README.md
+++ b/README.md
@ -1,75 +1,46 @@
 # deskctl
+[![npm](https://img.shields.io/npm/v/deskctl?label=npm)](https://www.npmjs.com/package/deskctl)
+[![skill](https://img.shields.io/badge/skills.sh-deskctl-111827)](skills/deskctl)
+
+Desktop control CLI for AI agents on X11.
+
+https://github.com/user-attachments/assets/e820787e-4d1a-463f-bdcf-a829588778bf

-Desktop control CLI for AI agents on Linux X11. 

 ## Install

 ```bash
-cargo install deskctl
+npm install -g deskctl
 ```

-Build a Linux binary with Docker:
-
 ```bash
-docker compose -f docker/docker-compose.yml run --rm build
+deskctl doctor
+deskctl snapshot --annotate
 ```

-This writes `dist/deskctl-linux-x86_64`.
-
-Copy it to an SSH machine where `scp` is unavailable:
+## Skill

 ```bash
-ssh -p 443 deskctl@ssh.agentcomputer.ai 'cat > ~/deskctl && chmod +x ~/deskctl' < dist/deskctl-linux-x86_64
+npx skills add harivansh-afk/deskctl
 ```

-Run it on an X11 session:
+## Docs
+
+- runtime contract: [docs/runtime-contract.md](docs/runtime-contract.md)
+- releasing: [docs/releasing.md](docs/releasing.md)
+- contributing: [CONTRIBUTING.md](CONTRIBUTING.md)
+
+## Install paths
+
+Nix:

 ```bash
-DISPLAY=:1 XDG_SESSION_TYPE=x11 ~/deskctl --json snapshot --annotate
+nix run github:harivansh-afk/deskctl -- --help
+nix profile install github:harivansh-afk/deskctl
 ```

-Local source build requirements:
+Rust:
+
 ```bash
 cargo build
 ```
-
-At the moment there are no extra native build dependencies beyond a Rust toolchain.
-
-## Quick Start
-
-```bash
-# See the desktop
-deskctl snapshot
-
-# Click a window
-deskctl click @w1
-
-# Type text
-deskctl type "hello world"
-
-# Focus by name
-deskctl focus "firefox"
-```
-
-## Architecture
-
-Client-daemon architecture over Unix sockets (NDJSON wire protocol). 
-The daemon starts automatically on first command and keeps the X11 connection alive for fast repeated calls.
-
-## Runtime Requirements
-
- Linux with X11 session
- Rust 1.75+ (for build)
-
-The binary itself only links the standard glibc runtime on Linux (`libc`, `libm`, `libgcc_s`).
-
-For deskctl to be fully functional on a fresh VM you still need:
-
- an X11 server and an active `DISPLAY`
- `XDG_SESSION_TYPE=x11` or an equivalent X11 session environment
- a window manager or desktop environment that exposes standard EWMH properties such as `_NET_CLIENT_LIST_STACKING` and `_NET_ACTIVE_WINDOW`
- an X server with the extensions needed for input simulation and screen metadata, which is standard on normal desktop X11 setups
-
-## Wayland Support
-
-Coming soon. The trait-based backend design means adding Hyprland/Wayland support is a single trait implementation with zero refactoring of the core which is good.
--- a/SKILL.md
+++ b/SKILL.md
@ -1,116 +0,0 @@
---
-name: deskctl
-description: Desktop control CLI for AI agents 
-allowed-tools: Bash(deskctl:*)
---
-
-# deskctl
-
-Desktop control CLI for AI agents on Linux X11. Provides a unified interface for screenshots, mouse/keyboard input, and window management with compact `@wN` window references.
-
-## Core Workflow
-
-1. **Snapshot** to see the desktop and get window refs
-2. **Act** using refs or coordinates (click, type, focus)
-3. **Repeat** as needed
-
-## Quick Reference
-
-### See the Desktop
-
-```bash
-deskctl snapshot              # Screenshot + window tree with @wN refs
-deskctl snapshot --annotate   # Screenshot with bounding boxes and labels
-deskctl snapshot --json       # Structured JSON output
-deskctl list-windows          # Window tree without screenshot
-deskctl screenshot /tmp/s.png # Screenshot only (no window tree)
-```
-
-### Click and Type
-
-```bash
-deskctl click @w1             # Click center of window @w1
-deskctl click 500,300         # Click absolute coordinates
-deskctl dblclick @w2          # Double-click window @w2
-deskctl type "hello world"    # Type text into focused window
-deskctl press enter           # Press a key
-deskctl hotkey ctrl c         # Send Ctrl+C
-deskctl hotkey ctrl shift t   # Send Ctrl+Shift+T
-```
-
-### Mouse Control
-
-```bash
-deskctl mouse move 500 300    # Move cursor to coordinates
-deskctl mouse scroll 3        # Scroll down 3 units
-deskctl mouse scroll -3       # Scroll up 3 units
-deskctl mouse drag 100 100 500 500  # Drag from (100,100) to (500,500)
-```
-
-### Window Management
-
-```bash
-deskctl focus @w2             # Focus window by ref
-deskctl focus "firefox"       # Focus window by name (substring match)
-deskctl close @w3             # Close window gracefully
-deskctl move-window @w1 100 200     # Move window to position
-deskctl resize-window @w1 800 600   # Resize window
-```
-
-### Utilities
-
-```bash
-deskctl get-screen-size       # Screen resolution
-deskctl get-mouse-position    # Current cursor position
-deskctl launch firefox        # Launch an application
-deskctl launch code -- --new-window  # Launch with arguments
-```
-
-### Daemon
-
-```bash
-deskctl daemon start          # Start daemon manually
-deskctl daemon stop           # Stop daemon
-deskctl daemon status         # Check daemon status
-```
-
-## Global Options
-
- `--json` : Output as structured JSON (all commands)
- `--session NAME` : Session name for multiple daemon instances (default: "default")
- `--socket PATH` : Custom Unix socket path
-
-## Window Refs
-
-After `snapshot` or `list-windows`, windows are assigned short refs:
- `@w1` is the topmost (usually focused) window
- `@w2`, `@w3`, etc. follow z-order (front to back)
- Refs reset on each `snapshot` call
- Use `--json` to see stable `xcb_id` for programmatic tracking
-
-## Example Agent Workflow
-
-```bash
-# 1. See what's on screen
-deskctl snapshot --annotate
-
-# 2. Focus the browser
-deskctl focus "firefox"
-
-# 3. Navigate to a URL
-deskctl hotkey ctrl l
-deskctl type "https://example.com"
-deskctl press enter
-
-# 4. Take a new snapshot to see the result
-deskctl snapshot
-```
-
-## Key Names for press/hotkey
-
-Modifiers: `ctrl`, `alt`, `shift`, `super`
-Navigation: `enter`, `tab`, `escape`, `backspace`, `delete`, `space`
-Arrows: `up`, `down`, `left`, `right`
-Page: `home`, `end`, `pageup`, `pagedown`
-Function: `f1` through `f12`
-Characters: any single character (e.g. `a`, `1`, `/`)
--- a/demo/index.html
+++ b/demo/index.html
@ -0,0 +1,969 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<meta name="viewport" content="width=device-width, initial-scale=1.0">
+<title>deskctl - Desktop Control for AI Agents</title>
+<style>
+  *, *::before, *::after { margin: 0; padding: 0; box-sizing: border-box; }
+
+  :root {
+    /* cozybox light */
+    --page-bg: #f2f2f2;
+    --bg: #e7e7e7;
+    --surface: #dcdcdc;
+    --surface-2: #e1e1e1;
+    --border: #c3c7c9;
+    --text: #282828;
+    --text-dim: #504945;
+    --text-muted: #928374;
+    --selection: #c3c7c9;
+    --accent: #4261a5;
+    --green: #427b58;
+    --red: #c5524a;
+    --yellow: #d79921;
+    --orange: #af3a03;
+    --purple: #8f3f71;
+    --aqua: #427b58;
+    --cyan: #3c7678;
+    --gray: #928374;
+    --mono: 'Berkeley Mono', 'JetBrains Mono', 'Fira Code', 'SF Mono', Consolas, monospace;
+    --sans: -apple-system, BlinkMacSystemFont, 'Segoe UI', system-ui, sans-serif;
+  }
+
+  body {
+    font-family: var(--sans);
+    background: var(--page-bg);
+    color: var(--text);
+    overflow: hidden;
+    height: 100vh;
+    display: flex;
+    flex-direction: column;
+    align-items: center;
+    justify-content: center;
+  }
+
+  .hero {
+    text-align: center;
+    margin-bottom: 28px;
+    z-index: 10;
+  }
+
+  .hero h1 {
+    font-family: var(--mono);
+    font-size: 28px;
+    font-weight: 700;
+    letter-spacing: -0.5px;
+    margin-bottom: 4px;
+  }
+
+  .hero p { font-size: 14px; color: var(--text-dim); }
+
+  .demo-container {
+    display: flex;
+    gap: 16px;
+    width: 1140px;
+    max-width: 96vw;
+    height: 580px;
+  }
+
+  /* ── Desktop ──────────────────────────────────────── */
+  .desktop-panel {
+    flex: 1;
+    position: relative;
+    border-radius: 12px;
+    overflow: hidden;
+    background: var(--bg);
+    box-shadow: 0 4px 24px rgba(0,0,0,0.08), 0 0 0 1px rgba(0,0,0,0.04);
+  }
+
+  .desktop-titlebar {
+    height: 30px;
+    background: var(--surface);
+    display: flex;
+    align-items: center;
+    padding: 0 12px;
+    gap: 6px;
+  }
+
+  .dot { width: 10px; height: 10px; border-radius: 50%; }
+
+  .viewport {
+    position: relative;
+    height: calc(100% - 30px);
+    background: var(--bg);
+    overflow: hidden;
+  }
+
+  .wallpaper {
+    position: absolute;
+    inset: 0;
+    background:
+      radial-gradient(ellipse at 25% 35%, rgba(66,97,165,0.04) 0%, transparent 55%),
+      radial-gradient(ellipse at 75% 65%, rgba(66,123,88,0.03) 0%, transparent 55%),
+      var(--bg);
+  }
+
+  /* ── Taskbar ──────────────────────────────────────── */
+  .taskbar {
+    position: absolute;
+    bottom: 0; left: 0; right: 0;
+    height: 28px;
+    background: var(--surface);
+    display: flex;
+    align-items: center;
+    padding: 0 8px;
+    gap: 2px;
+    z-index: 15;
+  }
+
+  .tb-item {
+    height: 20px;
+    padding: 0 10px;
+    font-family: var(--mono);
+    font-size: 9px;
+    color: var(--text-dim);
+    display: flex;
+    align-items: center;
+    border-radius: 3px;
+    opacity: 0;
+    transform: translateX(-4px);
+    transition: opacity 0.3s, transform 0.3s, background 0.15s;
+  }
+
+  .tb-item.visible { opacity: 1; transform: translateX(0); }
+  .tb-item.active { background: rgba(0,0,0,0.06); color: var(--text); }
+
+  /* ── Windows ──────────────────────────────────────── */
+  .win {
+    position: absolute;
+    border-radius: 8px;
+    overflow: hidden;
+    box-shadow: 0 2px 12px rgba(0,0,0,0.08), 0 0 0 1px rgba(0,0,0,0.04);
+    transition: box-shadow 0.2s, opacity 0.4s ease, transform 0.4s ease;
+    opacity: 0;
+    transform: scale(0.92) translateY(14px);
+  }
+
+  .win.visible { opacity: 1; transform: scale(1) translateY(0); }
+  .win.focused { box-shadow: 0 4px 20px rgba(0,0,0,0.12), 0 0 0 1px rgba(66,97,165,0.15); z-index: 10; }
+
+  .wbar {
+    height: 26px;
+    background: var(--surface);
+    display: flex;
+    align-items: center;
+    padding: 0 8px;
+    gap: 5px;
+    font-size: 10px;
+    font-family: var(--mono);
+    color: var(--text-dim);
+  }
+
+  .wbar .dots { display: flex; gap: 3px; }
+  .wbar .dots span { width: 7px; height: 7px; border-radius: 50%; }
+
+  .wbody {
+    background: #f8f8f8;
+    height: calc(100% - 26px);
+    overflow: hidden;
+    position: relative;
+  }
+
+  /* ── File Manager ─────────────────────────────────── */
+  .file-list { padding: 8px; }
+
+  .file-row {
+    display: flex;
+    align-items: center;
+    gap: 8px;
+    padding: 5px 8px;
+    border-radius: 4px;
+    font-family: var(--mono);
+    font-size: 10px;
+    color: var(--text-dim);
+    transition: background 0.15s;
+  }
+
+  .file-row.selected { background: var(--selection); color: var(--text); }
+  .file-row .ficon { font-size: 13px; width: 18px; text-align: center; }
+  .file-row .fmeta { margin-left: auto; font-size: 8px; color: var(--text-muted); }
+
+  .file-preview {
+    position: absolute;
+    bottom: 0; left: 0; right: 0;
+    height: 0;
+    background: var(--surface);
+    overflow: hidden;
+    transition: height 0.3s ease;
+    font-family: var(--mono);
+    font-size: 9px;
+    line-height: 1.5;
+    color: var(--text-dim);
+    padding: 0 10px;
+  }
+
+  .file-preview.open { height: 58px; padding: 8px 10px; }
+
+  /* ── Stock Chart ──────────────────────────────────── */
+  .chart-header {
+    display: flex;
+    align-items: baseline;
+    gap: 8px;
+    padding: 8px 12px 2px;
+    font-family: var(--mono);
+  }
+
+  .chart-ticker { font-size: 14px; font-weight: 700; color: var(--text); }
+  .chart-price { font-size: 12px; color: var(--green); }
+  .chart-change { font-size: 9px; color: var(--green); }
+  .chart-period { font-size: 8px; color: var(--text-muted); margin-left: auto; }
+
+  .chart-area { padding: 4px 12px 8px; height: calc(100% - 60px); }
+  .chart-area svg { width: 100%; height: 100%; }
+
+  .chart-vol {
+    display: flex;
+    align-items: flex-end;
+    gap: 2px;
+    height: 20px;
+    padding: 0 12px;
+  }
+
+  .chart-vol div {
+    flex: 1;
+    background: var(--border);
+    border-radius: 1px 1px 0 0;
+    min-height: 2px;
+  }
+
+  /* ── Google Docs ──────────────────────────────────── */
+  .gdoc-toolbar {
+    height: 24px;
+    background: #f1f3f4;
+    display: flex;
+    align-items: center;
+    padding: 0 8px;
+    gap: 3px;
+  }
+
+  .gdoc-toolbar .tb { width: 16px; height: 12px; background: #dadce0; border-radius: 2px; }
+  .gdoc-toolbar .tb.wide { width: 28px; }
+  .gdoc-toolbar .sep { width: 1px; height: 14px; background: #dadce0; margin: 0 3px; }
+
+  .gdoc-page {
+    background: #ffffff;
+    margin: 10px auto;
+    width: 88%;
+    height: calc(100% - 44px);
+    border-radius: 2px;
+    box-shadow: 0 1px 4px rgba(0,0,0,0.06);
+    padding: 20px 24px;
+    overflow: hidden;
+  }
+
+  .gdoc-title { font-family: var(--sans); font-size: 16px; font-weight: 700; color: #202124; min-height: 22px; margin-bottom: 4px; }
+  .gdoc-subtitle { font-family: var(--sans); font-size: 9px; color: #5f6368; margin-bottom: 10px; min-height: 12px; }
+  .gdoc-body { font-family: var(--sans); font-size: 9px; line-height: 1.6; color: #3c4043; min-height: 14px; }
+
+  .gdoc-chart-img {
+    margin-top: 8px;
+    width: 100%;
+    height: 80px;
+    background: #fafafa;
+    border: 1px solid #e0e0e0;
+    border-radius: 4px;
+    overflow: hidden;
+    opacity: 0;
+    transform: scale(0.95);
+    transition: opacity 0.3s, transform 0.3s;
+    display: flex;
+    align-items: center;
+    justify-content: center;
+  }
+
+  .gdoc-chart-img.visible { opacity: 1; transform: scale(1); }
+  .gdoc-chart-img svg { width: 95%; height: 80%; }
+
+  @keyframes blink { 50% { opacity: 0; } }
+
+  /* ── Annotations ──────────────────────────────────── */
+  .annot {
+    position: absolute;
+    border: 2px solid;
+    border-radius: 4px;
+    pointer-events: none;
+    opacity: 0;
+    transition: opacity 0.3s;
+    z-index: 20;
+  }
+
+  .annot.visible { opacity: 1; }
+
+  .annot-label {
+    position: absolute;
+    top: -16px;
+    left: -2px;
+    font-family: var(--mono);
+    font-size: 8px;
+    font-weight: 700;
+    padding: 1px 5px;
+    border-radius: 3px 3px 0 0;
+    color: #fff;
+  }
+
+  .annot.c1 { border-color: var(--accent); }
+  .annot.c1 .annot-label { background: var(--accent); }
+  .annot.c2 { border-color: var(--green); }
+  .annot.c2 .annot-label { background: var(--green); }
+  .annot.c3 { border-color: var(--orange); }
+  .annot.c3 .annot-label { background: var(--orange); }
+
+  .flash {
+    position: absolute;
+    inset: 0;
+    background: white;
+    opacity: 0;
+    pointer-events: none;
+    z-index: 50;
+    transition: opacity 0.05s;
+  }
+
+  .flash.fire { opacity: 0.3; }
+
+  /* ── Cursor ───────────────────────────────────────── */
+  .agent-cursor {
+    position: absolute;
+    width: 18px;
+    height: 22px;
+    z-index: 100;
+    pointer-events: none;
+    filter: drop-shadow(0 1px 2px rgba(0,0,0,0.15));
+  }
+
+  .agent-cursor svg { width: 100%; height: 100%; }
+  .agent-cursor.clicking { transform: scale(0.85); transition: transform 0.06s ease-out; }
+
+  .click-ripple {
+    position: absolute;
+    width: 24px; height: 24px;
+    border-radius: 50%;
+    border: 2px solid var(--accent);
+    opacity: 0;
+    pointer-events: none;
+    z-index: 99;
+    transform: translate(-50%, -50%) scale(0.3);
+  }
+
+  .click-ripple.animate { animation: ripple 0.4s ease-out forwards; }
+
+  @keyframes ripple {
+    0% { opacity: 0.6; transform: translate(-50%, -50%) scale(0.3); }
+    100% { opacity: 0; transform: translate(-50%, -50%) scale(1.5); }
+  }
+
+  /* ── Command Panel (light) ────────────────────────── */
+  .cmd-panel {
+    width: 340px;
+    border-radius: 12px;
+    overflow: hidden;
+    background: var(--bg);
+    box-shadow: 0 4px 24px rgba(0,0,0,0.08), 0 0 0 1px rgba(0,0,0,0.04);
+    display: flex;
+    flex-direction: column;
+  }
+
+  .cmd-titlebar {
+    height: 30px;
+    background: var(--surface);
+    display: flex;
+    align-items: center;
+    padding: 0 12px;
+    gap: 6px;
+  }
+
+  .cmd-titlebar .label {
+    font-family: var(--mono);
+    font-size: 10px;
+    color: var(--text-dim);
+    margin-left: 6px;
+  }
+
+  .cmd-body {
+    flex: 1;
+    padding: 12px;
+    font-family: var(--mono);
+    font-size: 11px;
+    line-height: 1.7;
+    overflow-y: auto;
+    scrollbar-width: none;
+  }
+
+  .cmd-body::-webkit-scrollbar { display: none; }
+
+  .cmd-line {
+    opacity: 0;
+    transform: translateY(4px);
+    transition: opacity 0.25s, transform 0.25s;
+    margin-bottom: 2px;
+  }
+
+  .cmd-line.visible { opacity: 1; transform: translateY(0); }
+  .cmd-line .ps { color: var(--green); user-select: none; }
+  .cmd-line .c { color: var(--text); }
+  .cmd-line .f { color: var(--orange); }
+  .cmd-line .s { color: var(--accent); }
+  .cmd-line .o { color: var(--text-dim); font-size: 10px; padding-left: 2px; }
+  .cmd-line .ok { color: var(--green); }
+  .cmd-line .jk { color: var(--purple); }
+  .cmd-line .jv { color: var(--accent); }
+  .cmd-line .link { color: var(--accent); text-decoration: underline; }
+  .cmd-line .agent-msg { color: var(--text); font-size: 10px; line-height: 1.5; padding-left: 2px; }
+
+  .cmd-divider {
+    height: 1px;
+    background: var(--border);
+    margin: 8px 0;
+    opacity: 0;
+    transition: opacity 0.3s;
+  }
+
+  .cmd-divider.visible { opacity: 1; }
+
+  .step-ind {
+    display: flex;
+    align-items: center;
+    gap: 6px;
+    margin-bottom: 4px;
+    opacity: 0;
+    transform: translateY(4px);
+    transition: opacity 0.25s, transform 0.25s;
+  }
+
+  .step-ind.visible { opacity: 1; transform: translateY(0); }
+
+  .badge {
+    font-size: 8px;
+    font-weight: 700;
+    text-transform: uppercase;
+    letter-spacing: 0.5px;
+    padding: 2px 5px;
+    border-radius: 3px;
+    font-family: var(--mono);
+  }
+
+  .badge.observe { background: rgba(66,97,165,0.12); color: var(--accent); }
+  .badge.act { background: rgba(66,123,88,0.12); color: var(--green); }
+  .badge.wait { background: rgba(175,58,3,0.1); color: var(--orange); }
+  .badge.verify { background: rgba(143,63,113,0.1); color: var(--purple); }
+  .badge.done { background: rgba(66,123,88,0.15); color: var(--green); }
+
+  .step-lbl { font-size: 9px; color: var(--text-muted); }
+
+  .caption {
+    text-align: center;
+    margin-top: 20px;
+    z-index: 10;
+  }
+
+  .caption p { font-size: 11px; color: var(--text-muted); font-family: var(--mono); }
+
+  .caption .replay-btn {
+    display: inline-flex;
+    align-items: center;
+    gap: 6px;
+    margin-top: 8px;
+    padding: 5px 12px;
+    border-radius: 6px;
+    border: 1px solid var(--border);
+    background: #fff;
+    color: var(--text-dim);
+    font-family: var(--mono);
+    font-size: 10px;
+    cursor: pointer;
+    transition: color 0.2s, background 0.2s;
+  }
+
+  .caption .replay-btn:hover { background: var(--bg); color: var(--text); }
+</style>
+</head>
+<body>
+
+<div class="hero">
+  <h1>deskctl</h1>
+  <p>desktop control CLI for AI agents</p>
+</div>
+
+<div class="demo-container">
+  <div class="desktop-panel">
+    <div class="desktop-titlebar">
+      <div class="dot" style="background:#c5524a"></div>
+      <div class="dot" style="background:#d79921"></div>
+      <div class="dot" style="background:#427b58"></div>
+    </div>
+    <div class="viewport" id="vp">
+      <div class="wallpaper"></div>
+
+      <!-- File Manager -->
+      <div class="win" id="w-files" style="left:16px; top:16px; width:200px; height:220px;">
+        <div class="wbar">
+          <div class="dots"><span style="background:#c5524a"></span><span style="background:#d79921"></span><span style="background:#427b58"></span></div>
+          <span>Files ~/reports</span>
+        </div>
+        <div class="wbody">
+          <div class="file-list">
+            <div class="file-row" id="f-notes">
+              <span class="ficon">&#128221;</span>
+              <span>task_brief.txt</span>
+              <span class="fmeta">2.1 KB</span>
+            </div>
+            <div class="file-row" id="f-csv">
+              <span class="ficon">&#128202;</span>
+              <span>nvda_q1_data.csv</span>
+              <span class="fmeta">48 KB</span>
+            </div>
+            <div class="file-row" id="f-prev">
+              <span class="ficon">&#128196;</span>
+              <span>prev_report.pdf</span>
+              <span class="fmeta">1.2 MB</span>
+            </div>
+            <div class="file-row">
+              <span class="ficon">&#128193;</span>
+              <span>archive/</span>
+              <span class="fmeta">--</span>
+            </div>
+          </div>
+          <div class="file-preview" id="file-preview">
+            <span style="color:#427b58">task:</span> Prepare NVDA Q1 earnings summary<br>
+            <span style="color:#427b58">source:</span> finance.yahoo.com, local csv<br>
+            <span style="color:#427b58">output:</span> Google Docs report with chart
+          </div>
+        </div>
+      </div>
+
+      <!-- Stock Chart -->
+      <div class="win" id="w-chart" style="left:140px; top:40px; width:380px; height:260px;">
+        <div class="wbar">
+          <div class="dots"><span style="background:#c5524a"></span><span style="background:#d79921"></span><span style="background:#427b58"></span></div>
+          <span>Chrome - Yahoo Finance</span>
+        </div>
+        <div class="wbody">
+          <div class="chart-header">
+            <span class="chart-ticker">NVDA</span>
+            <span class="chart-price">$924.68</span>
+            <span class="chart-change">+3.42%</span>
+            <span class="chart-period">1Y</span>
+          </div>
+          <div class="chart-area">
+            <svg viewBox="0 0 360 140" preserveAspectRatio="none">
+              <defs>
+                <linearGradient id="cg" x1="0" y1="0" x2="0" y2="1">
+                  <stop offset="0%" stop-color="#427b58" stop-opacity="0.2"/>
+                  <stop offset="100%" stop-color="#427b58" stop-opacity="0"/>
+                </linearGradient>
+              </defs>
+              <line x1="0" y1="35" x2="360" y2="35" stroke="#dcdcdc" stroke-width="0.5"/>
+              <line x1="0" y1="70" x2="360" y2="70" stroke="#dcdcdc" stroke-width="0.5"/>
+              <line x1="0" y1="105" x2="360" y2="105" stroke="#dcdcdc" stroke-width="0.5"/>
+              <path d="M0,120 L20,115 40,118 60,110 80,105 100,95 120,100 140,85 160,75 180,80 200,65 220,55 240,60 260,45 280,35 300,40 320,28 340,22 360,18 L360,140 L0,140 Z" fill="url(#cg)"/>
+              <path d="M0,120 L20,115 40,118 60,110 80,105 100,95 120,100 140,85 160,75 180,80 200,65 220,55 240,60 260,45 280,35 300,40 320,28 340,22 360,18" fill="none" stroke="#427b58" stroke-width="2" stroke-linecap="round" stroke-linejoin="round"/>
+              <text x="352" y="33" fill="#928374" font-size="7" font-family="monospace" text-anchor="end">$950</text>
+              <text x="352" y="68" fill="#928374" font-size="7" font-family="monospace" text-anchor="end">$800</text>
+              <text x="352" y="103" fill="#928374" font-size="7" font-family="monospace" text-anchor="end">$650</text>
+            </svg>
+          </div>
+          <div class="chart-vol" id="chart-vol"></div>
+        </div>
+      </div>
+
+      <!-- Google Docs -->
+      <div class="win" id="w-docs" style="left:80px; top:60px; width:440px; height:340px;">
+        <div class="wbar">
+          <div class="dots"><span style="background:#c5524a"></span><span style="background:#d79921"></span><span style="background:#427b58"></span></div>
+          <span>Chrome - Google Docs</span>
+        </div>
+        <div class="wbody" style="background:#f1f3f4">
+          <div class="gdoc-toolbar">
+            <div class="tb"></div><div class="tb"></div><div class="tb wide"></div>
+            <div class="sep"></div>
+            <div class="tb"></div><div class="tb"></div><div class="tb"></div>
+            <div class="sep"></div>
+            <div class="tb wide"></div><div class="tb"></div>
+          </div>
+          <div class="gdoc-page">
+            <div class="gdoc-title" id="doc-title"></div>
+            <div class="gdoc-subtitle" id="doc-subtitle"></div>
+            <div class="gdoc-body" id="doc-body"></div>
+            <div class="gdoc-chart-img" id="doc-chart">
+              <svg viewBox="0 0 360 80" preserveAspectRatio="none">
+                <defs>
+                  <linearGradient id="cg2" x1="0" y1="0" x2="0" y2="1">
+                    <stop offset="0%" stop-color="#427b58" stop-opacity="0.15"/>
+                    <stop offset="100%" stop-color="#427b58" stop-opacity="0"/>
+                  </linearGradient>
+                </defs>
+                <rect width="360" height="80" fill="#fafafa"/>
+                <path d="M0,65 L20,62 40,64 60,58 80,55 100,48 120,52 140,42 160,36 180,39 200,30 220,24 240,27 260,19 280,14 300,17 320,10 340,7 360,5 L360,80 L0,80 Z" fill="url(#cg2)"/>
+                <path d="M0,65 L20,62 40,64 60,58 80,55 100,48 120,52 140,42 160,36 180,39 200,30 220,24 240,27 260,19 280,14 300,17 320,10 340,7 360,5" fill="none" stroke="#427b58" stroke-width="1.5" stroke-linecap="round" stroke-linejoin="round"/>
+                <text x="8" y="12" fill="#928374" font-size="7" font-family="monospace">NVDA 1Y</text>
+              </svg>
+            </div>
+          </div>
+        </div>
+      </div>
+
+      <!-- Annotations -->
+      <div class="annot c1" id="a1"><div class="annot-label">@w1</div></div>
+      <div class="annot c2" id="a2"><div class="annot-label">@w2</div></div>
+      <div class="annot c3" id="a3"><div class="annot-label">@w3</div></div>
+
+      <div class="flash" id="flash"></div>
+
+      <div class="agent-cursor" id="cur" style="left:380px; top:260px;">
+        <svg viewBox="0 0 24 24" fill="none"><path d="M5.5 3.21V20.8c0 .45.54.67.85.35l4.86-4.86a.5.5 0 0 1 .35-.15h6.87a.5.5 0 0 0 .35-.85L6.35 2.86a.5.5 0 0 0-.85.35Z" fill="#282828" stroke="#fff" stroke-width="1"/></svg>
+      </div>
+      <div class="click-ripple" id="rip"></div>
+
+      <!-- Taskbar -->
+      <div class="taskbar">
+        <div class="tb-item" id="tb-files">Files</div>
+        <div class="tb-item" id="tb-chart">Yahoo Finance</div>
+        <div class="tb-item" id="tb-docs">Google Docs</div>
+      </div>
+    </div>
+  </div>
+
+  <div class="cmd-panel">
+    <div class="cmd-titlebar">
+      <div class="dot" style="background:#c5524a"></div>
+      <div class="dot" style="background:#d79921"></div>
+      <div class="dot" style="background:#427b58"></div>
+      <span class="label">agent computer</span>
+    </div>
+    <div class="cmd-body" id="cb"></div>
+  </div>
+</div>
+
+<div class="caption">
+  <p>AI agent controlling a live desktop via deskctl</p>
+  <button class="replay-btn" id="replay" style="display:none" onclick="run()">&#8634; Replay</button>
+</div>
+
+<script>
+// Shorthand for document.getElementById.
+const $ = s => document.getElementById(s);
+// Promise-based sleep: resolves after `ms` milliseconds (via setTimeout).
+const W = ms => new Promise(r => setTimeout(r, ms));
+// Cached elements: agent cursor (#cur), click ripple (#rip), command-panel body (#cb).
+const cur = $('cur'), rip = $('rip'), cb = $('cb');
+// Logical cursor position in px; same values as #cur's initial inline left/top.
+let cx = 380, cy = 260;
+
+(() => {
+  const v = $('chart-vol');
+  [8,12,6,14,10,18,8,15,20,12,7,16,10,22,14,8,18,12,9,16].forEach(h => {
+    const d = document.createElement('div'); d.style.height = h + 'px'; v.appendChild(d);
+  });
+})();
+
+function move(x, y, dur = 500) {
+  return new Promise(res => {
+    const sx = cx, sy = cy, dx = x - sx, dy = y - sy, t0 = performance.now();
+    (function f(n) {
+      const t = Math.min((n - t0) / dur, 1), e = 1 - (1 - t) ** 3;
+      const arc = -Math.sin(t * Math.PI) * Math.min(Math.abs(dy) * 0.25, 25);
+      cur.style.left = (sx + dx * e) + 'px';
+      cur.style.top = (sy + dy * e + arc) + 'px';
+      if (t < 1) requestAnimationFrame(f); else { cx = x; cy = y; res(); }
+    })(performance.now());
+  });
+}
+
+async function clk() {
+  cur.classList.add('clicking');
+  rip.style.left = (cx + 4) + 'px'; rip.style.top = (cy + 4) + 'px';
+  rip.classList.remove('animate'); void rip.offsetWidth; rip.classList.add('animate');
+  await W(80); cur.classList.remove('clicking');
+}
+
+async function flash() {
+  const f = $('flash'); f.classList.add('fire'); await W(80); f.classList.remove('fire');
+}
+
+function show(id) { $(id).classList.add('visible'); }
+function hide(id) { $(id).classList.remove('visible'); }
+
+function tbShow(id) { const el = $(id); el.classList.add('visible'); }
+function tbActive(id) {
+  document.querySelectorAll('.tb-item').forEach(t => t.classList.remove('active'));
+  if (id) $(id).classList.add('active');
+}
+
+function focus(id) {
+  document.querySelectorAll('.win').forEach(w => { w.classList.remove('focused'); w.style.zIndex = ''; });
+  if (id) { $(id).classList.add('focused'); $(id).style.zIndex = '10'; }
+}
+
+function posAnnot(aid, wid) {
+  const w = $(wid), a = $(aid);
+  a.style.left = (parseInt(w.style.left) - 2) + 'px';
+  a.style.top = (parseInt(w.style.top) + 26) + 'px';
+  a.style.width = (parseInt(w.style.width) + 4) + 'px';
+  a.style.height = (parseInt(w.style.height) - 22) + 'px';
+}
+
+function hideAnnots() { document.querySelectorAll('.annot').forEach(a => a.classList.remove('visible')); }
+
+function typeEl(el, text, ms = 40) {
+  return new Promise(async res => {
+    for (const c of text) { el.textContent += c; await W(ms); }
+    res();
+  });
+}
+
+function step(type, label) {
+  const d = document.createElement('div'); d.className = 'step-ind';
+  d.innerHTML = `<span class="badge ${type}">${type}</span><span class="step-lbl">${label}</span>`;
+  cb.appendChild(d); void d.offsetWidth; d.classList.add('visible'); cb.scrollTop = cb.scrollHeight;
+}
+
+function ln(html) {
+  const d = document.createElement('div'); d.className = 'cmd-line';
+  d.innerHTML = `<span class="ps">$ </span>${html}`;
+  cb.appendChild(d); void d.offsetWidth; d.classList.add('visible'); cb.scrollTop = cb.scrollHeight;
+}
+
+function out(html) {
+  const d = document.createElement('div'); d.className = 'cmd-line';
+  d.innerHTML = `<span class="o">${html}</span>`;
+  cb.appendChild(d); void d.offsetWidth; d.classList.add('visible'); cb.scrollTop = cb.scrollHeight;
+}
+
+function agentMsg(html) {
+  const d = document.createElement('div'); d.className = 'cmd-line';
+  d.innerHTML = `<span class="agent-msg">${html}</span>`;
+  cb.appendChild(d); void d.offsetWidth; d.classList.add('visible'); cb.scrollTop = cb.scrollHeight;
+}
+
+function div() {
+  const d = document.createElement('div'); d.className = 'cmd-divider';
+  cb.appendChild(d); void d.offsetWidth; d.classList.add('visible'); cb.scrollTop = cb.scrollHeight;
+}
+
+function cm(c, f, s) {
+  let h = `<span class="c">${c}</span>`;
+  if (f) h += ` <span class="f">${f}</span>`;
+  if (s) h += ` <span class="s">${s}</span>`;
+  return h;
+}
+
+// Play the scripted demo once, from a clean state.
+// Resets the windows, taskbar, annotations, document text and cursor, then walks
+// through steps 1-11 below, pairing each command-panel line with the matching
+// desktop change. Also invoked by the Replay button's onclick; that button is
+// hidden while the script runs and shown again at the end.
+async function run() {
+  // Reset everything a previous run may have changed.
+  $('replay').style.display = 'none';
+  cb.innerHTML = '';
+  ['w-files','w-chart','w-docs'].forEach(id => { hide(id); $(id).classList.remove('focused'); $(id).style.zIndex = ''; });
+  document.querySelectorAll('.tb-item').forEach(t => { t.classList.remove('visible','active'); });
+  hideAnnots();
+  $('f-notes').classList.remove('selected');
+  $('f-csv').classList.remove('selected');
+  $('file-preview').classList.remove('open');
+  $('doc-title').textContent = '';
+  $('doc-subtitle').textContent = '';
+  $('doc-body').textContent = '';
+  $('doc-chart').classList.remove('visible');
+  cur.style.left = '380px'; cur.style.top = '260px'; cur.style.opacity = '0';
+  cx = 380; cy = 260;
+
+  // Fade the cursor in, then clear the inline transition again.
+  await W(500);
+  cur.style.transition = 'opacity 0.3s'; cur.style.opacity = '1';
+  await W(400); cur.style.transition = 'none';
+
+  // 1: Empty desktop
+  step('observe', 'Scan desktop');
+  await W(250);
+  ln(cm('deskctl snapshot'));
+  await W(400);
+  out('<span class="jk">"windows"</span>: <span class="o">[]</span>');
+  out('<span class="ok">empty desktop</span>');
+  await W(400); div();
+
+  // 2: Launch file manager
+  step('act', 'Open local files');
+  await W(250);
+  ln(cm('deskctl launch', '', 'nautilus ~/reports'));
+  await W(350);
+  show('w-files'); focus('w-files');
+  tbShow('tb-files'); tbActive('tb-files');
+  await W(300);
+  out('<span class="ok">launched nautilus (pid 3841)</span>');
+  await W(300);
+
+  step('wait', 'Wait for window');
+  ln(cm('deskctl wait window', "--selector 'title=Files'", '--timeout 5'));
+  await W(500);
+  out('<span class="ok">window ready: "Files ~/reports"</span>');
+  await W(300); div();
+
+  // 3: Read task brief
+  step('observe', 'Read task brief');
+  await W(250);
+  ln(cm('deskctl click', '', "'title=Files'"));
+  await move(100, 62, 450);
+  await clk();
+  $('f-notes').classList.add('selected');
+  await W(200);
+  out('<span class="ok">clicked "task_brief.txt"</span>');
+  await W(200);
+
+  ln(cm('deskctl hotkey', '', 'space'));
+  await W(300);
+  $('file-preview').classList.add('open');
+  await W(400);
+  out('<span class="o">task: Prepare NVDA Q1 earnings summary</span>');
+  out('<span class="o">source: finance.yahoo.com, local csv</span>');
+  out('<span class="o">output: Google Docs report with chart</span>');
+  await W(500); div();
+
+  // 4: Launch browser
+  step('act', 'Research stock data');
+  await W(250);
+  ln(cm('deskctl launch', '', 'google-chrome finance.yahoo.com/NVDA'));
+  await W(400);
+  show('w-chart'); focus('w-chart');
+  tbShow('tb-chart'); tbActive('tb-chart');
+  await W(350);
+  out('<span class="ok">launched chrome (pid 3912)</span>');
+
+  step('wait', 'Wait for page');
+  ln(cm('deskctl wait window', "--selector 'title=Yahoo'", '--timeout 8'));
+  await W(600);
+  out('<span class="ok">window ready: "Yahoo Finance - NVDA"</span>');
+  await W(300); div();
+
+  // 5: Snapshot chart
+  step('observe', 'Capture chart screenshot');
+  await W(250);
+  ln(cm('deskctl snapshot', '--annotate'));
+  await W(300);
+  await flash();
+  posAnnot('a1', 'w-files'); posAnnot('a2', 'w-chart');
+  show('a1'); show('a2');
+  await W(200);
+  out('<span class="jk">"windows"</span>: [');
+  out('&nbsp;&nbsp;{ <span class="jv">"@w1"</span>: <span class="jv">"Files"</span> }');
+  out('&nbsp;&nbsp;{ <span class="jv">"@w2"</span>: <span class="jv">"Yahoo Finance"</span> }');
+  out(']');
+  out('<span class="ok">screenshot saved: chart_nvda.png</span>');
+  await W(600);
+  hideAnnots(); div();
+
+  // 6: Open Google Docs
+  step('act', 'Create report document');
+  await W(250);
+  ln(cm('deskctl hotkey', '', 'ctrl t'));
+  await W(300);
+  out('<span class="ok">new tab opened</span>');
+  await W(200);
+
+  ln(cm('deskctl type', '', '"docs.google.com/document/new"'));
+  await W(200);
+  ln(cm('deskctl press', '', 'enter'));
+  await W(400);
+  show('w-docs'); focus('w-docs');
+  tbShow('tb-docs'); tbActive('tb-docs');
+  await W(350);
+  out('<span class="ok">navigated to Google Docs</span>');
+
+  step('wait', 'Wait for Docs');
+  ln(cm('deskctl wait window', "--selector 'title=Google Docs'", '--timeout 8'));
+  await W(500);
+  out('<span class="ok">document ready</span>');
+  await W(300); div();
+
+  // 7: Type title
+  step('act', 'Write report');
+  await W(250);
+  await move(310, 140, 450);
+  await clk();
+  await W(200);
+
+  ln(cm('deskctl type', '', '"NVDA Q1 2025 Earnings Summary"'));
+  await W(200);
+  await typeEl($('doc-title'), 'NVDA Q1 2025 Earnings Summary', 35);
+  out('<span class="ok">typed title</span>');
+  await W(200);
+
+  ln(cm('deskctl press', '', 'enter'));
+  await W(150);
+  ln(cm('deskctl type', '', '"Prepared by AI Agent via deskctl"'));
+  await W(200);
+  await typeEl($('doc-subtitle'), 'Prepared by AI Agent via deskctl', 28);
+  await W(200);
+  ln(cm('deskctl press', '', 'enter enter'));
+  await W(200); div();
+
+  // 8: Type body
+  step('act', 'Write analysis');
+  await W(250);
+  // The full text is typed into the document; the command panel shows only a shortened form.
+  const body = "NVIDIA reported strong Q1 results driven by data center revenue growth of 427% YoY. The stock is up 3.42% today at $924.68. Key drivers include H100/H200 GPU demand from hyperscalers and continued AI infrastructure buildout.";
+  ln(cm('deskctl type', '', '"NVIDIA reported strong Q1..."'));
+  await W(200);
+  await typeEl($('doc-body'), body, 12);
+  out('<span class="ok">typed analysis (224 chars)</span>');
+  await W(400); div();
+
+  // 9: Paste chart
+  step('act', 'Insert chart screenshot');
+  await W(250);
+  ln(cm('deskctl press', '', 'enter enter'));
+  await W(200);
+  ln(cm('deskctl hotkey', '', 'ctrl v'));
+  await W(400);
+  $('doc-chart').classList.add('visible');
+  await W(300);
+  out('<span class="ok">pasted chart_nvda.png into document</span>');
+  await W(500); div();
+
+  // 10: Final verify
+  step('verify', 'Verify completed report');
+  await W(250);
+  ln(cm('deskctl snapshot', '--annotate'));
+  await W(300);
+  await flash();
+  posAnnot('a1', 'w-files'); posAnnot('a2', 'w-chart'); posAnnot('a3', 'w-docs');
+  show('a1'); show('a2'); show('a3');
+  await W(200);
+  out('<span class="jk">"windows"</span>: [');
+  out('&nbsp;&nbsp;{ <span class="jv">"@w1"</span>: <span class="jv">"Files"</span>, <span class="jv">"@w2"</span>: <span class="jv">"Yahoo Finance"</span>, <span class="jv">"@w3"</span>: <span class="jv">"Google Docs"</span> }');
+  out(']');
+  await W(600);
+  hideAnnots();
+  await W(300); div();
+
+  // 11: Agent summary (Claude-style)
+  step('done', 'Task complete');
+  await W(400);
+  agentMsg('I\'ve completed the NVDA Q1 earnings report.');
+  await W(300);
+  agentMsg('');
+  await W(100);
+  agentMsg('Here\'s what I did:');
+  await W(200);
+  agentMsg('  - Read task_brief.txt from ~/reports for context');
+  await W(150);
+  agentMsg('  - Pulled the NVDA 1Y chart from Yahoo Finance');
+  await W(150);
+  agentMsg('  - Created a new Google Doc with title, analysis,');
+  await W(100);
+  agentMsg('    and embedded the stock chart screenshot');
+  await W(300);
+  agentMsg('');
+  agentMsg('Document: <span class="link">docs.google.com/d/1xK9m...r4/edit</span>');
+
+  // Cursor exits
+  await W(500);
+  await move(600, 10, 700);
+  cur.style.transition = 'opacity 0.5s'; cur.style.opacity = '0';
+  await W(600);
+  // Script finished: show the Replay button again.
+  $('replay').style.display = 'inline-flex';
+}
+
+window.addEventListener('load', () => setTimeout(run, 300));
+</script>
+</body>
+</html>
--- a/docs/releasing.md
+++ b/docs/releasing.md
@ -0,0 +1,110 @@
+# Releasing deskctl
+
+This document covers the operator flow for shipping `deskctl` across:
+
+- GitHub Releases
+- crates.io
+- npm
+- the repo flake
+
+GitHub Releases are the canonical binary source. The npm package consumes those release assets instead of building a separate binary.
+
+## Package Names
+
+- crate: `deskctl`
+- npm package: `deskctl`
+- installed command: `deskctl`
+
+## Prerequisites
+
+Before the first live publish on each registry:
+
+- npm ownership for `deskctl`
+- crates.io ownership for `deskctl`
+- repository secrets:
+  - `NPM_TOKEN`
+  - `CARGO_REGISTRY_TOKEN`
+
+These are user-owned prerequisites. The repo can validate and automate the rest, but it cannot create registry ownership for you.
+
+## Normal Release Flow
+
+1. Merge release-ready changes to `main`.
+2. Let CI run:
+   - validation
+   - integration
+   - distribution validation
+   - release asset build
+3. Confirm the GitHub Release exists for the version tag and includes:
+   - `deskctl-linux-x86_64`
+   - `checksums.txt`
+4. Trigger the `Publish Registries` workflow with:
+   - `tag`
+   - `publish_npm`
+   - `publish_crates`
+5. Confirm the publish summary for each channel.
+
+## What CI Validates
+
+The repository validates:
+
+- `cargo publish --dry-run --locked`
+- npm package metadata and packability
+- npm install smoke path on Linux using the packaged `deskctl` command
+- repo flake evaluation/build
+
+The repository release workflow:
+
+- builds the Linux release binary
+- publishes the canonical GitHub Release asset
+- uploads `checksums.txt`
+
+The registry publish jobs (npm and crates.io run in parallel):
+
+- target an existing release tag
+- check whether that version is already published on the respective registry
+- skip already-published versions
+- both default to enabled; can be toggled via workflow_dispatch inputs
+
+## Rerun Safety
+
+Registry publishing is intentionally separate from release asset creation.
+
+If a partial failure happens:
+
+- GitHub Release assets remain the source of truth
+- rerun the `Publish Registries` workflow for the same tag
+- already-published channels are reported and skipped
+- remaining channels can still be published
+
+## Local Validation
+
+Run the distribution checks locally with:
+
+```bash
+make cargo-publish-dry-run
+make npm-package-check
+make nix-flake-check
+make dist-validate
+```
+
+Notes:
+
+- `make npm-package-check` does a runtime smoke test only on Linux
+- `make nix-flake-check` requires a local Nix installation
+- Docker remains a local Linux build convenience, not the canonical release path
+
+## Nix Boundary
+
+The repo-owned `flake.nix` is the supported Nix surface in this phase.
+
+In scope:
+
+- `nix run github:harivansh-afk/deskctl`
+- `nix profile install github:harivansh-afk/deskctl`
+- CI validation for the repo flake
+
+Out of scope for this phase:
+
+- `nixpkgs` upstreaming
+- extra distro packaging outside the repo
--- a/docs/runtime-contract.md
+++ b/docs/runtime-contract.md
@ -0,0 +1,70 @@
+# deskctl runtime contract
+
+All commands support `--json` and use the same top-level envelope:
+
+```json
+{
+  "success": true,
+  "data": {},
+  "error": null
+}
+```
+
+Use `--json` whenever you need to parse output programmatically.
+
+## Stable window fields
+
+Whenever a response includes a window payload, these fields are stable:
+
+- `ref_id`
+- `window_id`
+- `title`
+- `app_name`
+- `x`
+- `y`
+- `width`
+- `height`
+- `focused`
+- `minimized`
+
+Use `window_id` for stable targeting inside a live daemon session. Use
+`ref_id` or `@wN` for short-lived follow-up actions after `snapshot` or
+`list-windows`.
+
+## Stable grouped reads
+
+- `deskctl get active-window` -> `data.window`
+- `deskctl get monitors` -> `data.count`, `data.monitors`
+- `deskctl get version` -> `data.version`, `data.backend`
+- `deskctl get systeminfo` -> runtime-scoped diagnostic fields such as
+  `backend`, `display`, `session_type`, `session`, `socket_path`, `screen`,
+  `monitor_count`, and `monitors`
+
+## Stable waits
+
+- `deskctl wait window` -> `data.wait`, `data.selector`, `data.elapsed_ms`,
+  `data.window`
+- `deskctl wait focus` -> `data.wait`, `data.selector`, `data.elapsed_ms`,
+  `data.window`
+
+## Stable structured error kinds
+
+When a command fails with structured JSON data, these `kind` values are stable:
+
+- `selector_not_found`
+- `selector_ambiguous`
+- `selector_invalid`
+- `timeout`
+- `not_found`
+
+Wait failures may also include `window_not_focused` in the last observation
+payload.
+
+## Best-effort fields
+
+Treat these as useful but non-contractual:
+
+- exact monitor names
+- incidental text formatting in non-JSON mode
+- default screenshot file names when no explicit path was provided
+- environment-dependent ordering details from the window manager
--- a/flake.lock
+++ b/flake.lock
@ -0,0 +1,61 @@
+{
+  "nodes": {
+    "flake-utils": {
+      "inputs": {
+        "systems": "systems"
+      },
+      "locked": {
+        "lastModified": 1731533236,
+        "narHash": "sha256-l0KFg5HjrsfsO/JpG+r7fRrqm12kzFHyUHqHCVpMMbI=",
+        "owner": "numtide",
+        "repo": "flake-utils",
+        "rev": "11707dc2f618dd54ca8739b309ec4fc024de578b",
+        "type": "github"
+      },
+      "original": {
+        "owner": "numtide",
+        "repo": "flake-utils",
+        "type": "github"
+      }
+    },
+    "nixpkgs": {
+      "locked": {
+        "lastModified": 1774386573,
+        "narHash": "sha256-4hAV26quOxdC6iyG7kYaZcM3VOskcPUrdCQd/nx8obc=",
+        "owner": "NixOS",
+        "repo": "nixpkgs",
+        "rev": "46db2e09e1d3f113a13c0d7b81e2f221c63b8ce9",
+        "type": "github"
+      },
+      "original": {
+        "owner": "NixOS",
+        "ref": "nixos-unstable",
+        "repo": "nixpkgs",
+        "type": "github"
+      }
+    },
+    "root": {
+      "inputs": {
+        "flake-utils": "flake-utils",
+        "nixpkgs": "nixpkgs"
+      }
+    },
+    "systems": {
+      "locked": {
+        "lastModified": 1681028828,
+        "narHash": "sha256-Vy1rq5AaRuLzOxct8nz4T6wlgyUR7zLU309k9mBC768=",
+        "owner": "nix-systems",
+        "repo": "default",
+        "rev": "da67096a3b9bf56a91d16901293e51ba5b49a27e",
+        "type": "github"
+      },
+      "original": {
+        "owner": "nix-systems",
+        "repo": "default",
+        "type": "github"
+      }
+    }
+  },
+  "root": "root",
+  "version": 7
+}
--- a/flake.nix
+++ b/flake.nix
@ -0,0 +1,77 @@
+# Nix flake for deskctl: exposes the package, a runnable app, a build check,
+# a formatter, and a development shell.
+{
+  description = "deskctl - Desktop control CLI for AI agents on Linux X11";
+
+  inputs = {
+    nixpkgs.url = "github:NixOS/nixpkgs/nixos-unstable";
+    flake-utils.url = "github:numtide/flake-utils";
+  };
+
+  outputs =
+    { self, nixpkgs, flake-utils }:
+    # Outputs are generated once per system in flake-utils' default system list.
+    flake-utils.lib.eachDefaultSystem (
+      system:
+      let
+        pkgs = import nixpkgs { inherit system; };
+        lib = pkgs.lib;
+        # Parse Cargo.toml so the package name, version, and metadata below
+        # come from the crate manifest instead of being duplicated here.
+        cargoToml = builtins.fromTOML (builtins.readFile ./Cargo.toml);
+
+        deskctl =
+          pkgs.rustPlatform.buildRustPackage {
+            pname = cargoToml.package.name;
+            version = cargoToml.package.version;
+            src = ./.;
+            # Dependency sources are pinned by the committed Cargo.lock.
+            cargoLock.lockFile = ./Cargo.lock;
+            nativeBuildInputs = [ pkgs.pkg-config ];
+            # X11 client libraries are only added on Linux.
+            buildInputs = lib.optionals pkgs.stdenv.isLinux [
+              pkgs.libx11
+              pkgs.libxtst
+            ];
+            # The check phase is skipped during the Nix build.
+            # NOTE(review): presumably because the tests need a live X11
+            # display -- confirm.
+            doCheck = false;
+
+            meta = with lib; {
+              description = cargoToml.package.description;
+              homepage = cargoToml.package.homepage;
+              license = licenses.mit;
+              mainProgram = "deskctl";
+              platforms = platforms.linux;
+            };
+          };
+      in
+      {
+        formatter = pkgs.nixfmt;
+
+        # packages, apps, and checks are only populated on Linux; on other
+        # systems each of them is an empty attribute set.
+        packages = lib.optionalAttrs pkgs.stdenv.isLinux {
+          inherit deskctl;
+          default = deskctl;
+        };
+
+        apps = lib.optionalAttrs pkgs.stdenv.isLinux {
+          default = flake-utils.lib.mkApp { drv = deskctl; };
+          deskctl = flake-utils.lib.mkApp { drv = deskctl; };
+        };
+
+        checks = lib.optionalAttrs pkgs.stdenv.isLinux {
+          build = deskctl;
+        };
+
+        # The dev shell is defined for every system; the X11 libraries and the
+        # X server package are appended on Linux only.
+        devShells.default = pkgs.mkShell {
+          packages =
+            [
+              pkgs.cargo
+              pkgs.clippy
+              pkgs.nodejs
+              pkgs.nixfmt
+              pkgs.pkg-config
+              pkgs.pnpm
+              pkgs.rustc
+              pkgs.rustfmt
+            ]
+            ++ lib.optionals pkgs.stdenv.isLinux [
+              pkgs.libx11
+              pkgs.libxtst
+              pkgs.xorg.xorgserver
+            ];
+        };
+      }
+    );
+}
--- a/npm/deskctl/README.md
+++ b/npm/deskctl/README.md
@ -0,0 +1,48 @@
+# deskctl
+
+`deskctl` installs the command for Linux X11 systems.
+
+## Install
+
+```bash
+npm install -g deskctl
+```
+
+After install, run:
+
+```bash
+deskctl --help
+```
+
+To upgrade to a newer published version:
+
+```bash
+deskctl upgrade
+```
+
+For non-interactive use:
+
+```bash
+deskctl upgrade --yes
+```
+
+One-shot usage is also supported:
+
+```bash
+npx deskctl --help
+```
+
+## Runtime Support
+
+- Linux
+- X11 session
+- currently packaged release asset: `linux-x64`
+
+`deskctl` downloads the matching GitHub Release binary during install.
+Unsupported targets fail during install with a clear runtime support error instead of installing a broken command.
+
+If you want the Rust source-install path instead, use:
+
+```bash
+cargo install deskctl
+```
--- a/npm/deskctl/bin/deskctl.js
+++ b/npm/deskctl/bin/deskctl.js
@ -0,0 +1,36 @@
+#!/usr/bin/env node
+
+const fs = require("node:fs");
+const { spawn } = require("node:child_process");
+
+const { readPackageJson, releaseTag, supportedTarget, vendorBinaryPath } = require("../scripts/support");
+
+function main() {
+  const pkg = readPackageJson();
+  const target = supportedTarget();
+  const binaryPath = vendorBinaryPath(target);
+
+  if (!fs.existsSync(binaryPath)) {
+    console.error(
+      [
+        "deskctl binary is missing from the npm package install.",
+        `Expected: ${binaryPath}`,
+        `Package version: ${pkg.version}`,
+        `Release tag: ${releaseTag(pkg)}`,
+        "Try reinstalling deskctl or check that your target is supported."
+      ].join("\n")
+    );
+    process.exit(1);
+  }
+
+  const child = spawn(binaryPath, process.argv.slice(2), { stdio: "inherit" });
+  child.on("exit", (code, signal) => {
+    if (signal) {
+      process.kill(process.pid, signal);
+      return;
+    }
+    process.exit(code ?? 1);
+  });
+}
+
+main();
--- a/npm/deskctl/package.json
+++ b/npm/deskctl/package.json
@ -0,0 +1,36 @@
+{
+  "name": "deskctl",
+  "version": "0.1.14",
+  "description": "Installable deskctl package for Linux X11 agents",
+  "license": "MIT",
+  "homepage": "https://github.com/harivansh-afk/deskctl",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/harivansh-afk/deskctl.git"
+  },
+  "bugs": {
+    "url": "https://github.com/harivansh-afk/deskctl/issues"
+  },
+  "engines": {
+    "node": ">=18"
+  },
+  "bin": {
+    "deskctl": "bin/deskctl.js"
+  },
+  "files": [
+    "README.md",
+    "bin",
+    "scripts"
+  ],
+  "scripts": {
+    "postinstall": "node scripts/postinstall.js",
+    "validate": "node scripts/validate-package.js"
+  },
+  "keywords": [
+    "deskctl",
+    "x11",
+    "desktop",
+    "automation",
+    "cli"
+  ]
+}
--- a/npm/deskctl/scripts/postinstall.js
+++ b/npm/deskctl/scripts/postinstall.js
@ -0,0 +1,49 @@
+const fs = require("node:fs");
+
+const {
+  checksumsUrl,
+  checksumForAsset,
+  download,
+  ensureVendorDir,
+  installLocalBinary,
+  readPackageJson,
+  releaseAssetUrl,
+  releaseTag,
+  sha256,
+  supportedTarget,
+  vendorBinaryPath
+} = require("./support");
+
+async function main() {
+  const pkg = readPackageJson();
+  const target = supportedTarget();
+  const targetPath = vendorBinaryPath(target);
+
+  ensureVendorDir();
+
+  if (process.env.DESKCTL_BINARY_PATH) {
+    installLocalBinary(process.env.DESKCTL_BINARY_PATH, targetPath);
+    return;
+  }
+
+  const tag = releaseTag(pkg);
+  const assetUrl = releaseAssetUrl(tag, target.assetName);
+  const checksumText = (await download(checksumsUrl(tag))).toString("utf8");
+  const expectedSha = checksumForAsset(checksumText, target.assetName);
+  const asset = await download(assetUrl);
+  const actualSha = sha256(asset);
+
+  if (actualSha !== expectedSha) {
+    throw new Error(
+      `Checksum mismatch for ${target.assetName}. Expected ${expectedSha}, got ${actualSha}.`
+    );
+  }
+
+  fs.writeFileSync(targetPath, asset);
+  fs.chmodSync(targetPath, 0o755);
+}
+
+main().catch((error) => {
+  console.error(`deskctl install failed: ${error.message}`);
+  process.exit(1);
+});
--- a/npm/deskctl/scripts/support.js
+++ b/npm/deskctl/scripts/support.js
@ -0,0 +1,120 @@
+const crypto = require("node:crypto");
+const fs = require("node:fs");
+const path = require("node:path");
+const https = require("node:https");
+
+const PACKAGE_ROOT = path.resolve(__dirname, "..");
+const VENDOR_DIR = path.join(PACKAGE_ROOT, "vendor");
+const PACKAGE_JSON = path.join(PACKAGE_ROOT, "package.json");
+
+function readPackageJson() {
+  return JSON.parse(fs.readFileSync(PACKAGE_JSON, "utf8"));
+}
+
+function releaseTag(pkg) {
+  return process.env.DESKCTL_RELEASE_TAG || `v${pkg.version}`;
+}
+
+function supportedTarget(platform = process.platform, arch = process.arch) {
+  if (platform === "linux" && arch === "x64") {
+    return {
+      platform,
+      arch,
+      assetName: "deskctl-linux-x86_64",
+      binaryName: "deskctl-linux-x86_64"
+    };
+  }
+
+  throw new Error(
+    `deskctl currently supports linux-x64 only. Received ${platform}-${arch}.`
+  );
+}
+
+function vendorBinaryPath(target) {
+  return path.join(VENDOR_DIR, target.binaryName);
+}
+
+function releaseBaseUrl(tag) {
+  return (
+    process.env.DESKCTL_RELEASE_BASE_URL ||
+    `https://github.com/harivansh-afk/deskctl/releases/download/${tag}`
+  );
+}
+
+function releaseAssetUrl(tag, assetName) {
+  return process.env.DESKCTL_DOWNLOAD_URL || `${releaseBaseUrl(tag)}/${assetName}`;
+}
+
+function checksumsUrl(tag) {
+  return `${releaseBaseUrl(tag)}/checksums.txt`;
+}
+
+/**
+ * Creates the package's vendor directory, including missing parents.
+ * With `recursive: true` the call does not fail when the directory exists.
+ */
+function ensureVendorDir() {
+  fs.mkdirSync(VENDOR_DIR, { recursive: true });
+}
+
+function checksumForAsset(contents, assetName) {
+  const line = contents
+    .split("\n")
+    .map((value) => value.trim())
+    .find((value) => value.endsWith(`  ${assetName}`) || value.endsWith(` *${assetName}`));
+
+  if (!line) {
+    throw new Error(`Could not find checksum entry for ${assetName}.`);
+  }
+
+  return line.split(/\s+/)[0];
+}
+
+function sha256(buffer) {
+  return crypto.createHash("sha256").update(buffer).digest("hex");
+}
+
+function download(url) {
+  return new Promise((resolve, reject) => {
+    https
+      .get(url, (response) => {
+        if (
+          response.statusCode &&
+          response.statusCode >= 300 &&
+          response.statusCode < 400 &&
+          response.headers.location
+        ) {
+          response.resume();
+          resolve(download(response.headers.location));
+          return;
+        }
+
+        if (response.statusCode !== 200) {
+          reject(new Error(`Download failed for ${url}: HTTP ${response.statusCode}`));
+          return;
+        }
+
+        const chunks = [];
+        response.on("data", (chunk) => chunks.push(chunk));
+        response.on("end", () => resolve(Buffer.concat(chunks)));
+      })
+      .on("error", reject);
+  });
+}
+
+/**
+ * Copies a binary from `sourcePath` to `targetPath` and sets mode 0755 on
+ * the copy. The copy happens first, so the chmod applies to the new file.
+ */
+function installLocalBinary(sourcePath, targetPath) {
+  fs.copyFileSync(sourcePath, targetPath);
+  fs.chmodSync(targetPath, 0o755);
+}
+
+module.exports = {
+  PACKAGE_ROOT,
+  VENDOR_DIR,
+  checksumsUrl,
+  checksumForAsset,
+  download,
+  ensureVendorDir,
+  installLocalBinary,
+  readPackageJson,
+  releaseAssetUrl,
+  releaseTag,
+  sha256,
+  supportedTarget,
+  vendorBinaryPath
+};
--- a/npm/deskctl/scripts/validate-package.js
+++ b/npm/deskctl/scripts/validate-package.js
@ -0,0 +1,40 @@
+const fs = require("node:fs");
+const path = require("node:path");
+
+const { readPackageJson, supportedTarget, vendorBinaryPath } = require("./support");
+
+function readCargoVersion() {
+  const cargoToml = fs.readFileSync(
+    path.resolve(__dirname, "..", "..", "..", "Cargo.toml"),
+    "utf8"
+  );
+  const match = cargoToml.match(/^version = "([^"]+)"/m);
+  if (!match) {
+    throw new Error("Could not determine Cargo.toml version.");
+  }
+  return match[1];
+}
+
+function main() {
+  const pkg = readPackageJson();
+  const cargoVersion = readCargoVersion();
+
+  if (pkg.version !== cargoVersion) {
+    throw new Error(
+      `Version mismatch: npm package is ${pkg.version}, Cargo.toml is ${cargoVersion}.`
+    );
+  }
+
+  if (pkg.bin?.deskctl !== "bin/deskctl.js") {
+    throw new Error("deskctl must expose the deskctl bin entrypoint.");
+  }
+
+  const target = supportedTarget("linux", "x64");
+  const targetPath = vendorBinaryPath(target);
+  const vendorDir = path.dirname(targetPath);
+  if (!vendorDir.endsWith(path.join("deskctl", "vendor"))) {
+    throw new Error("Vendor binary directory resolved unexpectedly.");
+  }
+}
+
+main();
--- a/site/.gitignore
+++ b/site/.gitignore
@ -0,0 +1,4 @@
+node_modules/
+dist/
+.astro/
+.vercel/
--- a/site/.prettierrc
+++ b/site/.prettierrc
@ -0,0 +1,11 @@
+{
+  "plugins": ["prettier-plugin-astro"],
+  "overrides": [
+    {
+      "files": "*.astro",
+      "options": {
+        "parser": "astro"
+      }
+    }
+  ]
+}
--- a/site/astro.config.mjs
+++ b/site/astro.config.mjs
@ -0,0 +1,22 @@
+import { defineConfig } from "astro/config";
+import mdx from "@astrojs/mdx";
+import vercel from "@astrojs/vercel";
+import { midnight, daylight } from "./src/themes.mjs";
+
+// Astro site configuration: static output with the Vercel adapter, MDX
+// pages, and light/dark Shiki themes for code blocks.
+export default defineConfig({
+  output: "static",
+  adapter: vercel(),
+  build: {
+    // "file" build format; see Astro's `build.format` option for the
+    // resulting output layout.
+    format: "file",
+  },
+  integrations: [mdx()],
+  markdown: {
+    shikiConfig: {
+      // Custom themes imported from ./src/themes.mjs.
+      themes: {
+        light: daylight,
+        dark: midnight,
+      },
+      wrap: true,
+    },
+  },
+});
--- a/site/package.json
+++ b/site/package.json
@ -0,0 +1,24 @@
+{
+  "name": "deskctl-site",
+  "type": "module",
+  "version": "0.0.1",
+  "private": true,
+  "scripts": {
+    "dev": "astro dev",
+    "build": "astro build",
+    "preview": "astro preview",
+    "check": "astro check",
+    "format:check": "prettier --check 'src/**/*.{astro,mdx,css}' astro.config.mjs"
+  },
+  "dependencies": {
+    "@astrojs/mdx": "^4.3.14",
+    "@astrojs/vercel": "^9.0.5",
+    "astro": "^5.18.1"
+  },
+  "devDependencies": {
+    "@astrojs/check": "^0.9.8",
+    "prettier": "^3.8.1",
+    "prettier-plugin-astro": "^0.14.1",
+    "typescript": "^5.9.3"
+  }
+}
--- a/site/pnpm-lock.yaml
+++ b/site/pnpm-lock.yaml
--- a/site/public/favicon.png
+++ b/site/public/favicon.png
--- a/site/public/favicon.svg
+++ b/site/public/favicon.svg
@ -0,0 +1,6 @@
+<svg xmlns="http://www.w3.org/2000/svg" width="256" height="256" viewBox="0 0 256 256">
+  <rect width="256" height="256" rx="40" fill="#2a2a2a"/>
+  <g fill="#ffffff" transform="translate(28,28) scale(0.78)">
+    <path d="M200,80v32a8,8,0,0,1-16,0V88H160a8,8,0,0,1,0-16h32A8,8,0,0,1,200,80ZM96,168H72V144a8,8,0,0,0-16,0v32a8,8,0,0,0,8,8H96a8,8,0,0,0,0-16ZM232,56V200a16,16,0,0,1-16,16H40a16,16,0,0,1-16-16V56A16,16,0,0,1,40,40H216A16,16,0,0,1,232,56ZM216,200V56H40V200H216Z"/>
+  </g>
+</svg>
--- a/site/src/layouts/DocLayout.astro
+++ b/site/src/layouts/DocLayout.astro
@ -0,0 +1,115 @@
+---
+import "../styles/base.css";
+import type { MarkdownHeading } from "astro";
+const fm = Astro.props.frontmatter || Astro.props;
+const title = fm.title;
+const description = fm.description || "desktop control for AI agents";
+const toc = fm.toc ?? false;
+const headings: MarkdownHeading[] = Astro.props.headings ?? [];
+const isIndex =
+  Astro.url.pathname === "/" || Astro.url.pathname === "/index.html";
+const h2s = headings.filter((h) => h.depth === 2);
+
+// Builds the HTML for one table-of-contents entry; the result is injected
+// with `set:html`, so it must already be safe markup.
+//
+// The heading text is HTML-escaped first so that `&`, `<` and `>` in a
+// heading are shown literally instead of being parsed as tags. Then:
+//   - a heading with no spaces that contains `-` or `.` is wrapped in <code>;
+//   - otherwise each parenthesised segment is wrapped in <code>.
+function formatTocText(text: string): string {
+  const escaped = text
+    .replace(/&/g, "&amp;")
+    .replace(/</g, "&lt;")
+    .replace(/>/g, "&gt;");
+
+  if (!text.includes(" ") && /[-.]/.test(text)) {
+    return `<code>${escaped}</code>`;
+  }
+  return escaped.replace(/\(([^)]+)\)/g, "(<code>$1</code>)");
+}
+---
+
+<!doctype html>
+<html lang="en">
+  <head>
+    <meta charset="UTF-8" />
+    <meta name="viewport" content="width=device-width, initial-scale=1" />
+    <meta name="description" content={description} />
+    <link rel="icon" type="image/svg+xml" href="/favicon.svg" />
+    <title>{title ? `${title} — deskctl` : "deskctl"}</title>
+  </head>
+  <body>
+    {
+      !isIndex && (
+        <nav class="breadcrumbs">
+          <a class="title" href="/">
+            deskctl
+          </a>
+          <span class="sep">/</span>
+          <a href={Astro.url.pathname}>{title}</a>
+        </nav>
+      )
+    }
+
+    {
+      toc && (
+        <aside class="toc-nav">
+          <ul>
+            {h2s.map((h) => (
+              <li>
+                <a href={`#${h.slug}`} set:html={formatTocText(h.text)} />
+              </li>
+            ))}
+          </ul>
+        </aside>
+      )
+    }
+
+    <main>
+      <slot />
+    </main>
+
+    <script>
+      // Table-of-contents highlighting: keeps the "active" class on the TOC
+      // link whose section is currently in view. Does nothing when the page
+      // has no TOC links.
+      const links = document.querySelectorAll(".toc-nav a");
+      if (links.length) {
+        // Each link's href is "#<id>"; strip the "#" to get the section id.
+        const ids = Array.from(links).map((a) =>
+          a.getAttribute("href")!.slice(1),
+        );
+        // Ids with no matching element in the document are dropped.
+        const sections = ids
+          .map((id) => document.getElementById(id))
+          .filter(Boolean) as HTMLElement[];
+
+        // While true, observer updates are ignored so the link that was just
+        // clicked stays highlighted.
+        let clickLock = false;
+        let scrollTimer: number;
+
+        // Marks the link pointing at `id` as active and clears all others.
+        function activate(id: string) {
+          links.forEach((a) => {
+            a.classList.toggle("active", a.getAttribute("href") === `#${id}`);
+          });
+        }
+
+        links.forEach((a) => {
+          a.addEventListener("click", () => {
+            activate(a.getAttribute("href")!.slice(1));
+            clickLock = true;
+          });
+        });
+
+        const observer = new IntersectionObserver(
+          (entries) => {
+            if (clickLock) return;
+            // Only the first intersecting entry in the batch is activated.
+            for (const entry of entries) {
+              if (entry.isIntersecting) {
+                activate(entry.target.id);
+                break;
+              }
+            }
+          },
+          // The negative bottom margin shrinks the observed area to the top
+          // 40% of the viewport.
+          { rootMargin: "0px 0px -60% 0px" },
+        );
+
+        sections.forEach((s) => observer.observe(s));
+
+        // Debounce: release the click lock once no scroll event has fired
+        // for 150 ms.
+        window.addEventListener(
+          "scroll",
+          () => {
+            clearTimeout(scrollTimer);
+            scrollTimer = window.setTimeout(() => {
+              clickLock = false;
+            }, 150);
+          },
+          { passive: true },
+        );
+      }
+    </script>
+  </body>
+</html>
--- a/site/src/pages/commands.mdx
+++ b/site/src/pages/commands.mdx
@ -0,0 +1,114 @@
+---
+layout: ../layouts/DocLayout.astro
+title: Commands
+toc: true
+---
+
+# Commands
+
+The public CLI is intentionally small. Most workflows boil down to grouped
+reads, grouped waits, selector-driven actions, and a few input primitives.
+
+## Observe and inspect
+
+```sh
+deskctl doctor
+deskctl upgrade
+deskctl snapshot
+deskctl snapshot --annotate
+deskctl list-windows
+deskctl screenshot
+deskctl screenshot /tmp/screen.png
+deskctl get active-window
+deskctl get monitors
+deskctl get version
+deskctl get systeminfo
+deskctl get-screen-size
+deskctl get-mouse-position
+```
+
+`doctor` checks the runtime before daemon startup. `upgrade` checks for a newer
+published version, shows a short confirmation prompt when an update is
+available, and supports `--yes` for non-interactive use. `snapshot` produces a
+screenshot plus window refs. `list-windows` is the same window tree without the
+side effect of writing a screenshot. The grouped `get` commands are the
+preferred read surface for focused state queries.
+
+## Wait for state transitions
+
+```sh
+deskctl wait window --selector 'title=Chromium' --timeout 10
+deskctl wait focus --selector 'id=win3' --timeout 5
+deskctl --json wait window --selector 'class=chromium' --poll-ms 100
+```
+
+Wait commands return the matched window payload on success. In `--json` mode,
+timeouts and selector failures expose structured `kind` values.
+
+## Act on windows
+
+```sh
+deskctl launch chromium
+deskctl focus @w1
+deskctl focus 'title=Chromium'
+deskctl click @w1
+deskctl click 960,540
+deskctl dblclick @w2
+deskctl close @w3
+deskctl move-window @w1 100 120
+deskctl resize-window @w1 1280 720
+```
+
+Selector-driven actions accept refs, explicit selector modes, or absolute
+coordinates where appropriate.
+
+## Keyboard and mouse input
+
+```sh
+deskctl type "hello world"
+deskctl press enter
+deskctl hotkey ctrl shift t
+deskctl mouse move 100 200
+deskctl mouse scroll 3
+deskctl mouse scroll 3 --axis horizontal
+deskctl mouse drag 100 200 500 600
+```
+
+Supported key names include `enter`, `tab`, `escape`, `backspace`, `delete`,
+`space`, arrow keys, paging keys, `f1` through `f12`, and any single
+character.
+
+## Selectors
+
+Prefer explicit selectors when the target matters. They are clearer in logs,
+more deterministic for automation, and easier to retry safely.
+
+```sh
+ref=w1
+id=win1
+title=Chromium
+class=chromium
+focused
+```
+
+Legacy shorthand is still supported:
+
+```sh
+@w1
+w1
+win1
+```
+
+Bare strings like `chromium` are fuzzy matches. They resolve when there is one
+match and fail with candidate windows when there are multiple matches.
+
+## Global options
+
+| Flag               | Env              | Description                                            |
+| ------------------ | ---------------- | ------------------------------------------------------ |
+| `--json`           |                  | Output as JSON                                         |
+| `--socket <path>`  | `DESKCTL_SOCKET` | Path to daemon Unix socket                             |
+| `--session <name>` |                  | Session name for multiple daemons (default: `default`) |
+
+`deskctl` manages the daemon automatically. Most users never need to think
+about it beyond `--session` and `--socket`.
--- a/site/src/pages/index.astro
+++ b/site/src/pages/index.astro
@ -0,0 +1,53 @@
+---
+import DocLayout from "../layouts/DocLayout.astro";
+---
+
+<DocLayout title="" description="desktop control for AI agents">
+  <header style="justify-content: flex-start;">
+    <h1>deskctl</h1>
+    <img src="/favicon.svg" alt="" width="40" height="40" />
+  </header>
+
+  <p class="tagline">non-interactive desktop control cli for AI agents</p>
+
+  <p class="lede">
+    A thin X11 control primitive for agent loops: diagnose the runtime, observe
+    the desktop, wait for state transitions, act deterministically, then verify.
+  </p>
+
+  <h2>Start</h2>
+
+  <ul>
+    <li>
+      <a href="/installation">Installation</a>
+    </li>
+    <li>
+      <a href="/quick-start">Quick start</a>
+    </li>
+  </ul>
+
+  <h2>Reference</h2>
+
+  <ul>
+    <li>
+      <a href="/commands">Commands</a>
+    </li>
+    <li>
+      <a href="/runtime-contract">Runtime contract</a>
+    </li>
+  </ul>
+
+  <h2>Links</h2>
+
+  <ul>
+    <li>
+      <a href="https://github.com/harivansh-afk/deskctl">GitHub</a>
+    </li>
+    <li>
+      <a href="https://crates.io/crates/deskctl">crates.io</a>
+    </li>
+    <li>
+      <a href="https://www.npmjs.com/package/deskctl">npm</a>
+    </li>
+  </ul>
+</DocLayout>
--- a/site/src/pages/installation.mdx
+++ b/site/src/pages/installation.mdx
@ -0,0 +1,76 @@
+---
+layout: ../layouts/DocLayout.astro
+title: Installation
+toc: true
+---
+
+# Installation
+
+Install the public `deskctl` command first, then validate the desktop runtime
+with `deskctl doctor` before trying to automate anything.
+
+## Recommended path
+
+```sh
+npm install -g deskctl
+deskctl doctor
+```
+
+The `deskctl` npm package is the default install path. It installs the command
+by downloading the matching GitHub Release asset for the supported runtime target.
+
+This path does not require a Rust toolchain. The installed command is always
+`deskctl`, even though the release asset itself is target-specific.
+
+## Skill install
+
+The repo skill lives under `skills/deskctl`, so you can install it
+directly using `skills.sh`:
+
+```sh
+npx skills add harivansh-afk/deskctl
+```
+
+## Other install paths
+
+### Nix
+
+```sh
+nix run github:harivansh-afk/deskctl -- --help
+nix profile install github:harivansh-afk/deskctl
+```
+
+### Rust
+
+```sh
+git clone https://github.com/harivansh-afk/deskctl
+cd deskctl
+cargo build
+```
+
+Source builds on Linux require:
+
+- Rust 1.75+
+- `pkg-config`
+- X11 development libraries such as `libx11-dev` and `libxtst-dev`
+
+## Runtime requirements
+
+- Linux with an active X11 session
+- `DISPLAY` set to a usable X11 display, such as `DISPLAY=:1`
+- `XDG_SESSION_TYPE=x11` or an equivalent X11 session environment
+- a window manager or desktop environment that exposes standard EWMH properties
+  such as `_NET_CLIENT_LIST_STACKING` and `_NET_ACTIVE_WINDOW`
+
+The binary itself only depends on the standard Linux glibc runtime.
+
+## Verification
+
+If setup fails for any reason, start here:
+
+```sh
+deskctl doctor
+```
+
+`doctor` checks X11 connectivity, window enumeration, screenshot viability, and
+daemon/socket health before normal command execution.
--- a/site/src/pages/quick-start.mdx
+++ b/site/src/pages/quick-start.mdx
@ -0,0 +1,105 @@
+---
+layout: ../layouts/DocLayout.astro
+title: Quick start
+toc: true
+---
+
+# Quick start
+
+The fastest way to use `deskctl` is to follow the same four-step loop: observe, wait, act, verify.
+
+## 1. Install and diagnose
+
+```sh
+npm install -g deskctl
+deskctl doctor
+```
+
+Run `deskctl doctor` first. It checks X11 connectivity, basic enumeration,
+screenshot viability, and socket health before you start driving the desktop.
+
+## 2. Observe the desktop
+
+```sh
+deskctl snapshot --annotate
+deskctl list-windows
+deskctl get active-window
+deskctl get monitors
+```
+
+Use `snapshot` when you want a screenshot artifact plus window refs. Use
+`list-windows` when you only need the current window tree without writing a
+screenshot.
+
+## 3. Pick selectors that stay readable
+
+Prefer explicit selectors when you need deterministic targeting:
+
+```sh
+ref=w1
+id=win1
+title=Chromium
+class=chromium
+focused
+```
+
+Legacy refs such as `@w1` still work after `snapshot` or `list-windows`. Bare
+strings like `chromium` are fuzzy matches and now fail on ambiguity.
+
+## 4. Wait, act, verify
+
+The core loop is:
+
+```sh
+# observe
+deskctl snapshot --annotate
+
+# wait
+deskctl wait window --selector 'title=Chromium' --timeout 10
+
+# act
+deskctl focus 'title=Chromium'
+deskctl hotkey ctrl l
+deskctl type "https://example.com"
+deskctl press enter
+
+# verify
+deskctl wait focus --selector 'title=Chromium' --timeout 5
+deskctl snapshot
+```
+
+The wait commands return the matched window payload on success, so they compose
+cleanly into the next action.
+
+## 5. Use `--json` when parsing matters
+
+Every command supports `--json` and uses the same top-level envelope:
+
+```json
+{
+  "success": true,
+  "data": {
+    "screenshot": "/tmp/deskctl-1234567890.png",
+    "windows": [
+      {
+        "ref_id": "w1",
+        "window_id": "win1",
+        "title": "Chromium",
+        "app_name": "chromium",
+        "x": 0,
+        "y": 0,
+        "width": 1920,
+        "height": 1080,
+        "focused": true,
+        "minimized": false
+      }
+    ]
+  }
+}
+```
+
+Use `window_id` for stable targeting inside a live daemon session. The exact
+text formatting is intentionally compact, but JSON is the parsing contract.
+
+The full stable-vs-best-effort contract lives on the
+[runtime contract](/runtime-contract) page.
--- a/site/src/pages/runtime-contract.mdx
+++ b/site/src/pages/runtime-contract.mdx
@ -0,0 +1,177 @@
+---
+layout: ../layouts/DocLayout.astro
+title: Runtime contract
+toc: true
+---
+
+# Runtime contract
+
+This page defines the current public output contract for `deskctl`.
+
+It is intentionally scoped to the current Linux X11 runtime surface. It does
+not promise stability for future Wayland or window-manager-specific features.
+
+## Stable top-level envelope
+
+Every command supports `--json` and uses the same top-level envelope:
+
+```json
+{
+  "success": true,
+  "data": {},
+  "error": null
+}
+```
+
+Stable top-level fields:
+
+- `success`
+- `data`
+- `error`
+
+If `success` is `false`, the command exits non-zero in both text mode and JSON
+mode.
+
+## Stable window payload
+
+Whenever a response includes a window payload, these fields are stable:
+
+- `ref_id`
+- `window_id`
+- `title`
+- `app_name`
+- `x`
+- `y`
+- `width`
+- `height`
+- `focused`
+- `minimized`
+
+`window_id` is the public session-scoped identifier for programmatic targeting.
+`ref_id` is a short-lived convenience handle from the current ref map.
+
+## Stable grouped reads
+
+`deskctl get active-window`
+
+- stable: `data.window`
+
+`deskctl get monitors`
+
+- stable: `data.count`
+- stable: `data.monitors`
+
+Stable per-monitor fields:
+
+- `name`
+- `x`
+- `y`
+- `width`
+- `height`
+- `width_mm`
+- `height_mm`
+- `primary`
+- `automatic`
+
+`deskctl get version`
+
+- stable: `data.version`
+- stable: `data.backend`
+
+`deskctl get systeminfo`
+
+- stable: `data.backend`
+- stable: `data.display`
+- stable: `data.session_type`
+- stable: `data.session`
+- stable: `data.socket_path`
+- stable: `data.screen`
+- stable: `data.monitor_count`
+- stable: `data.monitors`
+
+## Stable waits
+
+`deskctl wait window`
+`deskctl wait focus`
+
+- stable: `data.wait`
+- stable: `data.selector`
+- stable: `data.elapsed_ms`
+- stable: `data.window`
+
+## Stable selector-driven action fields
+
+When selector-driven actions return resolved window data, these fields are
+stable when present:
+
+- `data.ref_id`
+- `data.window_id`
+- `data.title`
+- `data.selector`
+
+This applies to:
+
+- `click`
+- `dblclick`
+- `focus`
+- `close`
+- `move-window`
+- `resize-window`
+
+## Stable artifact fields
+
+For `snapshot` and `screenshot`:
+
+- stable: `data.screenshot`
+
+When a command also returns windows, `data.windows` uses the stable window
+payload documented above.
+
+## Stable structured error kinds
+
+When a command fails with structured JSON data, these error kinds are stable:
+
+- `selector_not_found`
+- `selector_ambiguous`
+- `selector_invalid`
+- `timeout`
+- `not_found`
+- `window_not_focused` in `data.last_observation.kind` or an equivalent wait
+  observation payload
+
+Stable structured failure fields include:
+
+- `data.kind`
+- `data.selector`
+- `data.mode`
+- `data.candidates`
+- `data.message`
+- `data.wait`
+- `data.timeout_ms`
+- `data.poll_ms`
+- `data.last_observation`
+
+## Best-effort fields
+
+These values are useful but environment-dependent and should not be treated as
+strict parsing guarantees:
+
+- exact monitor naming conventions
+- EWMH/window-manager-dependent ordering details
+- cosmetic text formatting in non-JSON mode
+- default screenshot file names when no explicit path was provided
+- stderr wording outside the structured `kind` classifications above
+
+## Text mode expectations
+
+Text mode is intended to stay compact and useful for follow-up commands.
+
+The exact whitespace and alignment are not stable. The stable behavioral
+expectations are:
+
+- important reads print actionable identifiers or geometry
+- selector failures print enough detail to recover without `--json`
+- artifact-producing commands print the artifact path
+- window listings print both `@wN` refs and `window_id` values
+
+If you need strict parsing, use `--json`.
--- a/site/src/styles/base.css
+++ b/site/src/styles/base.css
@ -0,0 +1,303 @@
+@import url("https://fonts.googleapis.com/css2?family=Manrope:wght@300;400;500;700&display=swap");
+
+@font-face {
+  font-family: "Berkeley Mono";
+  src: url("https://www.barrettruth.com/fonts/berkeley-mono/BerkeleyMono-Regular.ttf")
+    format("truetype");
+  font-weight: 400;
+  font-style: normal;
+  font-display: swap;
+}
+
+@font-face {
+  font-family: "Berkeley Mono";
+  src: url("https://www.barrettruth.com/fonts/berkeley-mono/BerkeleyMono-Bold.ttf")
+    format("truetype");
+  font-weight: 700;
+  font-style: normal;
+  font-display: swap;
+}
+
+@font-face {
+  font-family: "Berkeley Mono";
+  src: url("https://www.barrettruth.com/fonts/berkeley-mono/BerkeleyMono-Italic.ttf")
+    format("truetype");
+  font-weight: 400;
+  font-style: italic;
+  font-display: swap;
+}
+
+*,
+*::before,
+*::after {
+  margin: 0;
+  padding: 0;
+  box-sizing: border-box;
+}
+
+html,
+body {
+  font-family: "Manrope", sans-serif;
+  line-height: 1.65;
+  color: #1a1a1a;
+  background: #f5f5f5;
+}
+
+@media (prefers-color-scheme: dark) {
+  html,
+  body {
+    background: #121212;
+    color: #e0e0e0;
+  }
+}
+
+main {
+  max-width: 50rem;
+  margin: 0 auto;
+  padding: 3rem clamp(1.25rem, 5vw, 3rem) 6rem;
+}
+
+.tagline {
+  font-size: 1.1rem;
+  opacity: 0.5;
+  margin-top: -0.75rem;
+  margin-bottom: 1.75rem;
+  font-style: italic;
+}
+
+.lede {
+  font-size: 1.05rem;
+  max-width: 42rem;
+}
+
+header {
+  display: flex;
+  align-items: center;
+  justify-content: space-between;
+  flex-wrap: nowrap;
+  gap: 20px;
+  margin-bottom: 1.5rem;
+}
+
+header h1 {
+  margin-bottom: 0;
+}
+
+header code {
+  font-size: clamp(1.75rem, 5vw, 2.5rem);
+}
+
+h1 {
+  font-weight: 300;
+  font-size: clamp(1.75rem, 5vw, 2.5rem);
+  line-height: 1.2;
+  margin-bottom: 1.5rem;
+}
+
+h2 {
+  font-weight: 400;
+  font-size: 1.35rem;
+  margin-top: 2.5rem;
+  margin-bottom: 0.75rem;
+}
+
+h3 {
+  font-weight: 500;
+  font-size: 1.1rem;
+  margin-top: 2rem;
+  margin-bottom: 0.5rem;
+}
+
+p {
+  margin-bottom: 1rem;
+}
+
+a {
+  color: inherit;
+  text-decoration-thickness: 1px;
+  text-underline-offset: 0.15em;
+}
+
+a:hover {
+  text-decoration-thickness: 2px;
+}
+
+img {
+  max-width: 100%;
+}
+
+ul,
+ol {
+  padding-left: 1.25em;
+  margin-bottom: 1rem;
+}
+
+li {
+  margin-bottom: 0.35rem;
+}
+
+pre,
+code,
+.astro-code {
+  font-family: "Berkeley Mono", monospace !important;
+  font-variant-ligatures: none;
+}
+
+code {
+  font-size: 0.88em;
+  padding: 0.15em 0.35em;
+  border-radius: 3px;
+  background: #e8e8e8;
+}
+
+@media (prefers-color-scheme: dark) {
+  code {
+    background: #222222;
+  }
+}
+
+pre {
+  padding: 1rem 1.25rem;
+  border-radius: 4px;
+  overflow-x: auto;
+  white-space: pre;
+  word-wrap: normal;
+  margin-bottom: 1.25rem;
+  line-height: 1.5;
+  background: #ebebeb;
+}
+
+@media (prefers-color-scheme: dark) {
+  pre {
+    background: #222222;
+  }
+}
+
+pre code {
+  padding: 0;
+  background: none;
+  font-size: 0.85em;
+}
+
+@media (prefers-color-scheme: dark) {
+  .astro-code,
+  .astro-code span {
+    color: var(--shiki-dark) !important;
+    background-color: var(--shiki-dark-bg) !important;
+  }
+}
+
+table {
+  width: 100%;
+  border-collapse: collapse;
+  margin-bottom: 1.25rem;
+  font-size: 0.95em;
+}
+
+th,
+td {
+  text-align: left;
+  padding: 0.5rem 0.75rem;
+  border-bottom: 1px solid #d0d0d0;
+}
+
+@media (prefers-color-scheme: dark) {
+  th,
+  td {
+    border-bottom-color: #2d2d2d;
+  }
+}
+
+th {
+  font-weight: 500;
+}
+
+hr {
+  border: none;
+  border-top: 1px solid #d0d0d0;
+  margin: 2.5rem 0;
+}
+
+@media (prefers-color-scheme: dark) {
+  hr {
+    border-top-color: #2d2d2d;
+  }
+}
+
+.breadcrumbs {
+  max-width: 50rem;
+  margin: 0 auto;
+  padding: 1.5rem clamp(1.25rem, 5vw, 3rem) 0;
+  font-size: 0.9rem;
+}
+
+.breadcrumbs a {
+  color: inherit;
+  text-decoration: none;
+  opacity: 0.6;
+  transition: opacity 0.15s;
+}
+
+.breadcrumbs a:hover {
+  opacity: 1;
+}
+
+.breadcrumbs .title {
+  font-weight: 500;
+  opacity: 1;
+}
+
+.breadcrumbs .sep {
+  opacity: 0.3;
+  margin: 0 0.5em;
+}
+
+/*
+ * Table-of-contents sidebar, pinned to the viewport in the gutter to the left
+ * of the centred content column.
+ */
+.toc-nav {
+  position: fixed;
+  top: 6.5rem;
+  /* 50vw - 25rem is the left edge of a centred 50rem column (the max-width of
+     `main`); subtracting a 2rem gap and the nav's own 11rem width places the
+     nav just outside that column. max() keeps it at least 1rem from the
+     viewport edge. */
+  left: max(1rem, calc(50vw - 25rem - 2rem - 11rem));
+  width: 11rem;
+  font-size: 0.9rem;
+  line-height: 1.5;
+}
+
+.toc-nav code {
+  font-size: 0.85em;
+  padding: 0.1em 0.25em;
+  border-radius: 2px;
+  background: #e8e8e8;
+}
+
+@media (prefers-color-scheme: dark) {
+  .toc-nav code {
+    background: #222222;
+  }
+}
+
+@media (max-width: 64em) {
+  .toc-nav {
+    display: none;
+  }
+}
+
+.toc-nav ul {
+  list-style: none;
+  padding: 0;
+  margin: 0;
+}
+
+.toc-nav li {
+  margin-bottom: 0.45rem;
+}
+
+.toc-nav a {
+  color: inherit;
+  text-decoration: none;
+  opacity: 0.6;
+  transition: opacity 0.15s;
+}
+
+.toc-nav a:hover,
+.toc-nav a.active {
+  opacity: 1;
+}
--- a/site/src/themes.mjs
+++ b/site/src/themes.mjs
@ -0,0 +1,59 @@
+/**
+ * Dark syntax-highlighting theme ("midnight").
+ *
+ * The editor background (#222222) matches the dark-mode `pre` background in
+ * `site/src/styles/base.css`. Only the two scope groups below are given
+ * explicit colours.
+ * NOTE(review): presumably consumed by the site's code highlighter (the CSS
+ * references Shiki variables) - confirm against the Astro config.
+ */
+export const midnight = {
+  name: "midnight",
+  type: "dark",
+  colors: {
+    "editor.background": "#222222",
+    "editor.foreground": "#e0e0e0",
+  },
+  tokenColors: [
+    {
+      // Storage and keyword scopes.
+      scope: [
+        "storage.type",
+        "storage.modifier",
+        "keyword.control",
+        "keyword.operator.new",
+      ],
+      settings: { foreground: "#7aa2f7" },
+    },
+    {
+      // String, numeric and constant scopes.
+      scope: [
+        "string.quoted",
+        "constant.numeric",
+        "constant.language",
+        "constant.character",
+        "number",
+      ],
+      settings: { foreground: "#98c379" },
+    },
+  ],
+};
+
+/**
+ * Light syntax-highlighting theme ("daylight").
+ *
+ * The editor background (#ebebeb) matches the light-mode `pre` background in
+ * `site/src/styles/base.css`. It colours the same two scope groups as the
+ * `midnight` theme, using darker foregrounds.
+ * NOTE(review): presumably consumed by the site's code highlighter (the CSS
+ * references Shiki variables) - confirm against the Astro config.
+ */
+export const daylight = {
+  name: "daylight",
+  type: "light",
+  colors: {
+    "editor.background": "#ebebeb",
+    "editor.foreground": "#1a1a1a",
+  },
+  tokenColors: [
+    {
+      // Storage and keyword scopes.
+      scope: [
+        "storage.type",
+        "storage.modifier",
+        "keyword.control",
+        "keyword.operator.new",
+      ],
+      settings: { foreground: "#3b5bdb" },
+    },
+    {
+      // String, numeric and constant scopes.
+      scope: [
+        "string.quoted",
+        "constant.numeric",
+        "constant.language",
+        "constant.character",
+        "number",
+      ],
+      settings: { foreground: "#2d7f3e" },
+    },
+  ],
+};
--- a/site/tsconfig.json
+++ b/site/tsconfig.json
@ -0,0 +1,10 @@
+{
+  "extends": "astro/tsconfigs/strict",
+  "compilerOptions": {
+    "baseUrl": ".",
+    "paths": {
+      "@layouts/*": ["src/layouts/*"],
+      "@components/*": ["src/components/*"]
+    }
+  }
+}
--- a/skills/deskctl/SKILL.md
+++ b/skills/deskctl/SKILL.md
@ -0,0 +1,60 @@
+---
+name: deskctl
+description: Non-interactive X11 desktop control for AI agents. Use when the task involves controlling a Linux desktop - clicking, typing, reading windows, waiting for UI state, or taking screenshots inside a sandbox or VM.
+allowed-tools: Bash(deskctl:*), Bash(npx deskctl:*), Bash(npm:*), Bash(which:*), Bash(printenv:*), Bash(echo:*)
+---
+
+# deskctl
+
+Non-interactive desktop control CLI for Linux X11 agents.
+
+All output follows the runtime contract defined in [references/runtime-contract.md](references/runtime-contract.md). Every command returns a stable JSON envelope when called with `--json`. Use `--json` whenever you need to parse output programmatically.
+
+## Quick start
+
+```bash
+npm install -g deskctl
+deskctl doctor
+deskctl snapshot --annotate
+```
+
+If `deskctl` was installed through npm, refresh it later with:
+
+```bash
+deskctl upgrade --yes
+```
+
+## Agent loop
+
+Every desktop interaction follows: **observe -> wait -> act -> verify**.
+
+```bash
+deskctl snapshot --annotate        # observe
+deskctl wait window --selector 'title=Chromium' --timeout 10  # wait
+deskctl click 'title=Chromium'      # act
+deskctl snapshot                   # verify
+```
+
+See [workflows/observe-act.sh](workflows/observe-act.sh) for a reusable script. See [workflows/poll-condition.sh](workflows/poll-condition.sh) for polling loops.
+
+## Selectors
+
+```bash
+ref=w1          # snapshot ref (short-lived)
+id=win1         # stable window ID (session-scoped)
+title=Chromium   # match by title
+class=chromium   # match by WM class
+focused         # currently focused window
+```
+
+Bare strings like `chromium` do fuzzy matching but fail on ambiguity. Prefer explicit selectors.
+
+## References
+
+- [references/runtime-contract.md](references/runtime-contract.md) - output contract, stable fields, error kinds
+- [references/commands.md](references/commands.md) - all available commands
+
+## Workflows
+
+- [workflows/observe-act.sh](workflows/observe-act.sh) - main observe-act loop
+- [workflows/poll-condition.sh](workflows/poll-condition.sh) - poll for a condition on screen
--- a/skills/deskctl/agents/openai.yaml
+++ b/skills/deskctl/agents/openai.yaml
@ -0,0 +1,7 @@
+interface:
+  display_name: "deskctl"
+  short_description: "Control Linux X11 desktops from agent loops"
+  default_prompt: "Use $deskctl to diagnose the desktop, observe state, wait for UI changes, act deterministically, and verify the result."
+
+policy:
+  allow_implicit_invocation: true
--- a/skills/deskctl/references/commands.md
+++ b/skills/deskctl/references/commands.md
@ -0,0 +1,66 @@
+# deskctl commands
+
+All commands support `--json` for machine-parseable output following the
+runtime contract.
+
+## Observe
+
+```bash
+deskctl doctor
+deskctl upgrade
+deskctl snapshot
+deskctl snapshot --annotate
+deskctl list-windows
+deskctl screenshot /tmp/screen.png
+deskctl get active-window
+deskctl get monitors
+deskctl get version
+deskctl get systeminfo
+deskctl get-screen-size
+deskctl get-mouse-position
+```
+
+## Wait
+
+```bash
+deskctl wait window --selector 'title=Chromium' --timeout 10
+deskctl wait focus --selector 'class=chromium' --timeout 5
+```
+
+Returns the matched window payload on success. Failures include structured
+`kind` values in `--json` mode.
+
+## Selectors
+
+```bash
+ref=w1
+id=win1
+title=Chromium
+class=chromium
+focused
+```
+
+Legacy shorthand: `@w1`, `w1`, `win1`. Bare strings do fuzzy matching but fail
+on ambiguity.
+
+## Act
+
+```bash
+deskctl focus 'class=chromium'
+deskctl click @w1
+deskctl dblclick @w2
+deskctl type "hello world"
+deskctl press enter
+deskctl hotkey ctrl shift t
+deskctl mouse move 500 300
+deskctl mouse scroll 3
+deskctl mouse scroll 3 --axis horizontal
+deskctl mouse drag 100 100 500 500
+deskctl move-window @w1 100 120
+deskctl resize-window @w1 1280 720
+deskctl close @w3
+deskctl launch chromium
+```
+
+The daemon starts automatically on first command. In normal usage you should
+not need to manage it directly.
--- a/skills/deskctl/references/runtime-contract.md
+++ b/skills/deskctl/references/runtime-contract.md
@ -0,0 +1,73 @@
+# deskctl runtime contract
+
+This copy ships inside the installable skill so `npx skills add ...` installs a
+self-contained reference bundle.
+
+All commands support `--json` and use the same top-level envelope:
+
+```json
+{
+  "success": true,
+  "data": {},
+  "error": null
+}
+```
+
+Use `--json` whenever you need to parse output programmatically.
+
+## Stable window fields
+
+Whenever a response includes a window payload, these fields are stable:
+
+- `ref_id`
+- `window_id`
+- `title`
+- `app_name`
+- `x`
+- `y`
+- `width`
+- `height`
+- `focused`
+- `minimized`
+
+Use `window_id` for stable targeting inside a live daemon session. Use
+`ref_id` or `@wN` for short-lived follow-up actions after `snapshot` or
+`list-windows`.
+
+## Stable grouped reads
+
+- `deskctl get active-window` -> `data.window`
+- `deskctl get monitors` -> `data.count`, `data.monitors`
+- `deskctl get version` -> `data.version`, `data.backend`
+- `deskctl get systeminfo` -> runtime-scoped diagnostic fields such as
+  `backend`, `display`, `session_type`, `session`, `socket_path`, `screen`,
+  `monitor_count`, and `monitors`
+
+## Stable waits
+
+- `deskctl wait window` -> `data.wait`, `data.selector`, `data.elapsed_ms`,
+  `data.window`
+- `deskctl wait focus` -> `data.wait`, `data.selector`, `data.elapsed_ms`,
+  `data.window`
+
+## Stable structured error kinds
+
+When a command fails with structured JSON data, these `kind` values are stable:
+
+- `selector_not_found`
+- `selector_ambiguous`
+- `selector_invalid`
+- `timeout`
+- `not_found`
+
+Wait failures may also include `window_not_focused` in the last observation
+payload.
+
+## Best-effort fields
+
+Treat these as useful but non-contractual:
+
+- exact monitor names
+- incidental text formatting in non-JSON mode
+- default screenshot file names when no explicit path was provided
+- environment-dependent ordering details from the window manager
--- a/skills/deskctl/workflows/observe-act.sh
+++ b/skills/deskctl/workflows/observe-act.sh
@ -0,0 +1,37 @@
+#!/usr/bin/env bash
+# observe-act.sh - main desktop interaction loop
+# usage: ./observe-act.sh <selector> [action] [action-args...]
+# example: ./observe-act.sh 'title=Chromium' click
+# example: ./observe-act.sh 'class=terminal' type "ls -la"
+#
+# runs observe -> wait -> act -> verify against one selector.
+# action defaults to `click`; type/press/hotkey focus the target first and
+# forward the remaining arguments to deskctl.
+# exits non-zero when any deskctl step fails or the action is unknown.
+set -euo pipefail
+
+SELECTOR="${1:?usage: observe-act.sh <selector> [action] [action-args...]}"
+ACTION="${2:-click}"
+# drop selector and action so "$@" holds only the action args; shift at most
+# $# positions so a selector-only call leaves "$@" empty instead of failing
+shift "$(( $# < 2 ? $# : 2 ))"
+
+# 1. observe - snapshot the desktop, get current state
+echo "--- observe ---"
+deskctl snapshot --annotate --json | head -1
+deskctl get active-window
+
+# 2. wait - ensure target exists
+echo "--- wait ---"
+deskctl wait window --selector "$SELECTOR" --timeout 10
+
+# 3. act - perform the action on the target
+echo "--- act ---"
+case "$ACTION" in
+  click)    deskctl click "$SELECTOR" ;;
+  dblclick) deskctl dblclick "$SELECTOR" ;;
+  focus)    deskctl focus "$SELECTOR" ;;
+  type)     deskctl focus "$SELECTOR" && deskctl type "$@" ;;
+  press)    deskctl focus "$SELECTOR" && deskctl press "$@" ;;
+  hotkey)   deskctl focus "$SELECTOR" && deskctl hotkey "$@" ;;
+  close)    deskctl close "$SELECTOR" ;;
+  # diagnostics go to stderr so stdout carries only deskctl output
+  *)        echo "unknown action: $ACTION" >&2; exit 1 ;;
+esac
+
+# 4. verify - snapshot again to confirm result
+echo "--- verify ---"
+# brief pause before the verification snapshot
+sleep 0.5
+deskctl snapshot --json | head -1
--- a/skills/deskctl/workflows/poll-condition.sh
+++ b/skills/deskctl/workflows/poll-condition.sh
@ -0,0 +1,42 @@
+#!/usr/bin/env bash
+# poll-condition.sh - poll the desktop until a condition is met
+# usage: ./poll-condition.sh <match-string> [interval-seconds] [max-attempts]
+# example: ./poll-condition.sh "Tickets Available" 5 60
+# example: ./poll-condition.sh "Order Confirmed" 3 20
+# example: ./poll-condition.sh "Download Complete" 10 30
+#
+# checks window titles for the match string every N seconds.
+# exits 0 when found, exits 1 after max attempts.
+set -euo pipefail
+
+MATCH="${1:?usage: poll-condition.sh <match-string> [interval] [max-attempts]}"
+INTERVAL="${2:-5}"
+MAX="${3:-60}"
+
+attempt=0
+while [ "$attempt" -lt "$MAX" ]; do
+  attempt=$((attempt + 1))
+
+  # snapshot and check window titles
+  windows=$(deskctl list-windows --json 2>/dev/null || echo '{"success":false}')
+  if echo "$windows" | grep -qi "$MATCH"; then
+    echo "FOUND: '$MATCH' detected on attempt $attempt"
+    deskctl snapshot --annotate
+    exit 0
+  fi
+
+  # also check screenshot text via active window title
+  active=$(deskctl get active-window --json 2>/dev/null || echo '{}')
+  if echo "$active" | grep -qi "$MATCH"; then
+    echo "FOUND: '$MATCH' in active window on attempt $attempt"
+    deskctl snapshot --annotate
+    exit 0
+  fi
+
+  echo "attempt $attempt/$MAX - '$MATCH' not found, waiting ${INTERVAL}s..."
+  sleep "$INTERVAL"
+done
+
+echo "NOT FOUND: '$MATCH' after $MAX attempts"
+deskctl snapshot --annotate
+exit 1
--- a/src/backend/annotate.rs
+++ b/src/backend/annotate.rs
@ -5,7 +5,7 @@ use imageproc::rect::Rect;

 use crate::core::types::WindowInfo;

-// Embedded font - DejaVu Sans Mono for guaranteed availability
+// Embedded font
 const FONT_BYTES: &[u8] = include_bytes!("../../assets/DejaVuSansMono.ttf");

 const COLORS: &[Rgba<u8>] = &[
--- a/src/backend/mod.rs
+++ b/src/backend/mod.rs
@ -1,25 +1,60 @@
 pub mod annotate;
 pub mod x11;

-use crate::core::types::Snapshot;
 use anyhow::Result;
+use image::RgbaImage;
+
+/// Window description produced by a desktop backend.
+///
+/// Identifies the window only by the backend's native handle; it carries no
+/// `ref_id` or public `window_id` field.
+#[derive(Debug, Clone)]
+pub struct BackendWindow {
+    /// Backend-native window handle (the X11 backend stores the X11 window here).
+    pub native_id: u32,
+    /// Window title; may be empty when the backend cannot read it.
+    pub title: String,
+    /// Application name; may be empty when the backend cannot read it.
+    pub app_name: String,
+    /// Horizontal position from the backend's geometry query.
+    pub x: i32,
+    /// Vertical position from the backend's geometry query.
+    pub y: i32,
+    /// Width from the backend's geometry query.
+    pub width: u32,
+    /// Height from the backend's geometry query.
+    pub height: u32,
+    /// `true` when this window is the backend's active window.
+    pub focused: bool,
+    /// `true` when the backend reports the window as minimized.
+    pub minimized: bool,
+}
+
+/// Monitor geometry and metadata produced by a desktop backend.
+#[derive(Debug, Clone)]
+pub struct BackendMonitor {
+    /// Monitor name. The X11 backend resolves it from the RANDR monitor's name
+    /// atom, falls back to `monitorN` (1-based), and uses `screen` for its
+    /// synthetic root-geometry entry.
+    pub name: String,
+    /// Horizontal origin of the monitor area.
+    pub x: i32,
+    /// Vertical origin of the monitor area.
+    pub y: i32,
+    /// Width of the monitor area.
+    pub width: u32,
+    /// Height of the monitor area.
+    pub height: u32,
+    /// Physical width in millimetres; 0 in the X11 backend's synthetic entry.
+    pub width_mm: u32,
+    /// Physical height in millimetres; 0 in the X11 backend's synthetic entry.
+    pub height_mm: u32,
+    /// Whether the backend reports this monitor as the primary one.
+    pub primary: bool,
+    /// The RANDR `automatic` flag as reported by the X11 backend.
+    pub automatic: bool,
+}

 #[allow(dead_code)]
 pub trait DesktopBackend: Send {
-    /// Capture a screenshot and return a z-ordered window tree with @wN refs.
-    fn snapshot(&mut self, annotate: bool) -> Result<Snapshot>;
+    /// Collect z-ordered windows for read-only queries and targeting.
+    fn list_windows(&mut self) -> Result<Vec<BackendWindow>>;

-    /// Focus a window by its X11 window ID.
-    fn focus_window(&mut self, xcb_id: u32) -> Result<()>;
+    /// Get the currently focused window, if one is known.
+    fn active_window(&mut self) -> Result<Option<BackendWindow>>;
+
+    /// Collect monitor geometry and metadata.
+    fn list_monitors(&self) -> Result<Vec<BackendMonitor>>;
+
+    /// Capture the current desktop image without writing it to disk.
+    fn capture_screenshot(&mut self) -> Result<RgbaImage>;
+
+    /// Focus a window by its backend-native window handle.
+    fn focus_window(&mut self, native_id: u32) -> Result<()>;

    /// Move a window to absolute coordinates.
-    fn move_window(&mut self, xcb_id: u32, x: i32, y: i32) -> Result<()>;
+    fn move_window(&mut self, native_id: u32, x: i32, y: i32) -> Result<()>;

    /// Resize a window.
-    fn resize_window(&mut self, xcb_id: u32, w: u32, h: u32) -> Result<()>;
+    fn resize_window(&mut self, native_id: u32, w: u32, h: u32) -> Result<()>;

    /// Close a window gracefully.
-    fn close_window(&mut self, xcb_id: u32) -> Result<()>;
+    fn close_window(&mut self, native_id: u32) -> Result<()>;

    /// Click at absolute coordinates.
    fn click(&mut self, x: i32, y: i32) -> Result<()>;
@ -51,9 +86,9 @@ pub trait DesktopBackend: Send {
    /// Get the current mouse position.
    fn mouse_position(&self) -> Result<(i32, i32)>;

-    /// Take a screenshot and save to a path (no window tree).
-    fn screenshot(&mut self, path: &str, annotate: bool) -> Result<String>;
-
    /// Launch an application.
    fn launch(&self, command: &str, args: &[String]) -> Result<u32>;
+
+    /// Human-readable backend name for diagnostics and runtime queries.
+    fn backend_name(&self) -> &'static str;
 }
--- a/src/backend/x11.rs
+++ b/src/backend/x11.rs
@ -2,6 +2,7 @@ use anyhow::{Context, Result};
 use enigo::{Axis, Button, Coordinate, Direction, Enigo, Key, Keyboard, Mouse, Settings};
 use image::RgbaImage;
 use x11rb::connection::Connection;
+use x11rb::protocol::randr::ConnectionExt as RandrConnectionExt;
 use x11rb::protocol::xproto::{
    Atom, AtomEnum, ClientMessageData, ClientMessageEvent, ConfigureWindowAux,
    ConnectionExt as XprotoConnectionExt, EventMask, GetPropertyReply, ImageFormat, ImageOrder,
@ -9,8 +10,7 @@ use x11rb::protocol::xproto::{
 };
 use x11rb::rust_connection::RustConnection;

-use super::annotate::annotate_screenshot;
-use crate::core::types::{Snapshot, WindowInfo};
+use crate::backend::{BackendMonitor, BackendWindow};

 struct Atoms {
    client_list_stacking: Atom,
@ -71,10 +71,9 @@ impl X11Backend {
        Ok(windows)
    }

-    fn collect_window_infos(&self) -> Result<Vec<WindowInfo>> {
+    fn collect_window_infos(&self) -> Result<Vec<BackendWindow>> {
        let active_window = self.active_window()?;
        let mut window_infos = Vec::new();
-        let mut ref_counter = 1usize;

        for window in self.stacked_windows()? {
            let title = self.window_title(window).unwrap_or_default();
@ -89,9 +88,8 @@ impl X11Backend {
            };

            let minimized = self.window_is_minimized(window).unwrap_or(false);
-            window_infos.push(WindowInfo {
-                ref_id: format!("w{ref_counter}"),
-                xcb_id: window,
+            window_infos.push(BackendWindow {
+                native_id: window,
                title,
                app_name,
                x,
@ -101,12 +99,79 @@ impl X11Backend {
                focused: active_window == Some(window),
                minimized,
            });
-            ref_counter += 1;
        }

        Ok(window_infos)
    }

+    /// Describe the currently active window as a `BackendWindow`.
+    ///
+    /// Returns `Ok(None)` when no active window is known, or when the active
+    /// window has neither a title nor an application name. A geometry lookup
+    /// failure is propagated; a failed minimized check counts as "not
+    /// minimized".
+    fn active_window_info(&self) -> Result<Option<BackendWindow>> {
+        let native_id = match self.active_window()? {
+            Some(id) => id,
+            None => return Ok(None),
+        };
+
+        let title = self.window_title(native_id).unwrap_or_default();
+        let app_name = self.window_app_name(native_id).unwrap_or_default();
+        // A window with no title and no app name is reported as "no active window".
+        let is_anonymous = title.is_empty() && app_name.is_empty();
+        if is_anonymous {
+            return Ok(None);
+        }
+
+        let (x, y, width, height) = self.window_geometry(native_id)?;
+        let window = BackendWindow {
+            native_id,
+            title,
+            app_name,
+            x,
+            y,
+            width,
+            height,
+            // This is the active window by construction.
+            focused: true,
+            minimized: self.window_is_minimized(native_id).unwrap_or(false),
+        };
+        Ok(Some(window))
+    }
+
+    /// Query RANDR for the monitor list and convert each entry into a
+    /// `BackendMonitor`.
+    ///
+    /// A monitor whose name atom cannot be resolved is named `monitorN`
+    /// (1-based). When RANDR reports no monitors, a single synthetic `screen`
+    /// entry sized from the root geometry is returned instead.
+    fn collect_monitors(&self) -> Result<Vec<BackendMonitor>> {
+        let randr_monitors = self
+            .conn
+            .randr_get_monitors(self.root, true)?
+            .reply()
+            .context("Failed to query RANDR monitors")?
+            .monitors;
+
+        let mut found: Vec<BackendMonitor> = randr_monitors
+            .into_iter()
+            .enumerate()
+            .map(|(position, info)| BackendMonitor {
+                name: self
+                    .atom_name(info.name)
+                    .unwrap_or_else(|_| format!("monitor{}", position + 1)),
+                x: i32::from(info.x),
+                y: i32::from(info.y),
+                width: u32::from(info.width),
+                height: u32::from(info.height),
+                width_mm: info.width_in_millimeters,
+                height_mm: info.height_in_millimeters,
+                primary: info.primary,
+                automatic: info.automatic,
+            })
+            .collect();
+
+        // No RANDR monitors: describe the whole root window as one monitor.
+        if found.is_empty() {
+            let (width, height) = self.root_geometry()?;
+            found.push(BackendMonitor {
+                name: "screen".to_string(),
+                x: 0,
+                y: 0,
+                width,
+                height,
+                width_mm: 0,
+                height_mm: 0,
+                primary: true,
+                automatic: true,
+            });
+        }
+
+        Ok(found)
+    }
+
    fn capture_root_image(&self) -> Result<RgbaImage> {
        let (width, height) = self.root_geometry()?;
        let reply = self
@ -228,35 +293,50 @@ impl X11Backend {
            .reply()
            .with_context(|| format!("Failed to read property {property} from window {window}"))
    }
+
+    /// Resolve an X11 atom to its name, decoding the bytes lossily as UTF-8.
+    ///
+    /// Fails when the request cannot be sent or the reply cannot be read; the
+    /// reply error is annotated with the atom value.
+    fn atom_name(&self, atom: Atom) -> Result<String> {
+        let cookie = self.conn.get_atom_name(atom)?;
+        let reply = cookie
+            .reply()
+            .with_context(|| format!("Failed to read atom name for {atom}"))?;
+        Ok(String::from_utf8_lossy(&reply.name).to_string())
+    }
 }

 impl super::DesktopBackend for X11Backend {
-    fn snapshot(&mut self, annotate: bool) -> Result<Snapshot> {
-        let window_infos = self.collect_window_infos()?;
-        let mut image = self.capture_root_image()?;
-
-        // Annotate if requested - draw bounding boxes and @wN labels
-        if annotate {
-            annotate_screenshot(&mut image, &window_infos);
-        }
-
-        // Save screenshot
-        let timestamp = std::time::SystemTime::now()
-            .duration_since(std::time::UNIX_EPOCH)
-            .unwrap_or_default()
-            .as_millis();
-        let screenshot_path = format!("/tmp/deskctl-{timestamp}.png");
-        image
-            .save(&screenshot_path)
-            .context("Failed to save screenshot")?;
-
-        Ok(Snapshot {
-            screenshot: screenshot_path,
-            windows: window_infos,
-        })
+    fn list_windows(&mut self) -> Result<Vec<BackendWindow>> {
+        self.collect_window_infos()
    }

-    fn focus_window(&mut self, xcb_id: u32) -> Result<()> {
+    fn active_window(&mut self) -> Result<Option<BackendWindow>> {
+        self.active_window_info()
+    }
+
+    /// List monitors, preferring the RANDR query.
+    ///
+    /// If the RANDR query fails for any reason, the error is discarded and a
+    /// single synthetic `screen` monitor sized from the root geometry is
+    /// returned. Only a root-geometry failure is propagated.
+    fn list_monitors(&self) -> Result<Vec<BackendMonitor>> {
+        self.collect_monitors()
+            .or_else(|_| -> Result<Vec<BackendMonitor>> {
+                let (width, height) = self.root_geometry()?;
+                let whole_screen = BackendMonitor {
+                    name: "screen".to_string(),
+                    x: 0,
+                    y: 0,
+                    width,
+                    height,
+                    width_mm: 0,
+                    height_mm: 0,
+                    primary: true,
+                    automatic: true,
+                };
+                Ok(vec![whole_screen])
+            })
+    }
+
+    fn capture_screenshot(&mut self) -> Result<RgbaImage> {
+        self.capture_root_image()
+    }
+
+    fn focus_window(&mut self, native_id: u32) -> Result<()> {
        // Use _NET_ACTIVE_WINDOW client message (avoids focus-stealing prevention)
        let net_active = self
            .conn
@ -269,7 +349,7 @@ impl super::DesktopBackend for X11Backend {
            response_type: x11rb::protocol::xproto::CLIENT_MESSAGE_EVENT,
            format: 32,
            sequence: 0,
-            window: xcb_id,
+            window: native_id,
            type_: net_active,
            data: ClientMessageData::from([
                2u32, 0, 0, 0, 0, // source=2 (pager), timestamp=0, currently_active=0
@ -288,25 +368,25 @@ impl super::DesktopBackend for X11Backend {
        Ok(())
    }

-    fn move_window(&mut self, xcb_id: u32, x: i32, y: i32) -> Result<()> {
+    fn move_window(&mut self, native_id: u32, x: i32, y: i32) -> Result<()> {
        self.conn
-            .configure_window(xcb_id, &ConfigureWindowAux::new().x(x).y(y))?;
+            .configure_window(native_id, &ConfigureWindowAux::new().x(x).y(y))?;
        self.conn
            .flush()
            .context("Failed to flush X11 connection")?;
        Ok(())
    }

-    fn resize_window(&mut self, xcb_id: u32, w: u32, h: u32) -> Result<()> {
+    fn resize_window(&mut self, native_id: u32, w: u32, h: u32) -> Result<()> {
        self.conn
-            .configure_window(xcb_id, &ConfigureWindowAux::new().width(w).height(h))?;
+            .configure_window(native_id, &ConfigureWindowAux::new().width(w).height(h))?;
        self.conn
            .flush()
            .context("Failed to flush X11 connection")?;
        Ok(())
    }

-    fn close_window(&mut self, xcb_id: u32) -> Result<()> {
+    fn close_window(&mut self, native_id: u32) -> Result<()> {
        // Use _NET_CLOSE_WINDOW for graceful close (respects WM protocols)
        let net_close = self
            .conn
@ -319,7 +399,7 @@ impl super::DesktopBackend for X11Backend {
            response_type: x11rb::protocol::xproto::CLIENT_MESSAGE_EVENT,
            format: 32,
            sequence: 0,
-            window: xcb_id,
+            window: native_id,
            type_: net_close,
            data: ClientMessageData::from([
                0u32, 2, 0, 0, 0, // timestamp=0, source=2 (pager)
@ -463,18 +543,6 @@ impl super::DesktopBackend for X11Backend {
        Ok((reply.root_x as i32, reply.root_y as i32))
    }

-    fn screenshot(&mut self, path: &str, annotate: bool) -> Result<String> {
-        let mut image = self.capture_root_image()?;
-
-        if annotate {
-            let window_infos = self.collect_window_infos()?;
-            annotate_screenshot(&mut image, &window_infos);
-        }
-
-        image.save(path).context("Failed to save screenshot")?;
-        Ok(path.to_string())
-    }
-
    fn launch(&self, command: &str, args: &[String]) -> Result<u32> {
        let child = std::process::Command::new(command)
            .args(args)
@ -485,6 +553,10 @@ impl super::DesktopBackend for X11Backend {
            .with_context(|| format!("Failed to launch: {command}"))?;
        Ok(child.id())
    }
+
+    /// Returns the fixed identifier of this backend, `"x11"`.
+    fn backend_name(&self) -> &'static str {
+        "x11"
+    }
 }

 fn parse_key(name: &str) -> Result<Key> {
--- a/src/cli/connection.rs
+++ b/src/cli/connection.rs
@ -1,7 +1,7 @@
 use std::io::{BufRead, BufReader, Write};
 use std::os::unix::net::UnixStream;
 use std::os::unix::process::CommandExt;
-use std::path::PathBuf;
+use std::path::{Path, PathBuf};
 use std::process::{Command, Stdio};
 use std::thread;
 use std::time::Duration;
@ -9,33 +9,48 @@ use std::time::Duration;
 use anyhow::{bail, Context, Result};

 use crate::cli::GlobalOpts;
+use crate::core::doctor::{run as run_doctor_report, DoctorReport};
+use crate::core::paths::{pid_path_for_session, socket_dir, socket_path_for_session};
 use crate::core::protocol::{Request, Response};

-fn socket_dir() -> PathBuf {
-    if let Ok(dir) = std::env::var("DESKCTL_SOCKET_DIR") {
-        return PathBuf::from(dir);
-    }
-    if let Ok(runtime) = std::env::var("XDG_RUNTIME_DIR") {
-        return PathBuf::from(runtime).join("deskctl");
-    }
-    dirs::home_dir()
-        .unwrap_or_else(|| PathBuf::from("/tmp"))
-        .join(".deskctl")
-}
-
 fn socket_path(opts: &GlobalOpts) -> PathBuf {
    if let Some(ref path) = opts.socket {
        return path.clone();
    }
-    socket_dir().join(format!("{}.sock", opts.session))
+    socket_path_for_session(&opts.session)
 }

 fn pid_path(opts: &GlobalOpts) -> PathBuf {
-    socket_dir().join(format!("{}.pid", opts.session))
+    pid_path_for_session(&opts.session)
 }

-fn try_connect(opts: &GlobalOpts) -> Option<UnixStream> {
-    UnixStream::connect(socket_path(opts)).ok()
+/// Opens a Unix-domain stream to `path`, attaching the attempted path to any
+/// I/O error so the failure is self-describing.
+fn connect_socket(path: &Path) -> Result<UnixStream> {
+    match UnixStream::connect(path) {
+        Ok(stream) => Ok(stream),
+        Err(io_error) => {
+            Err(io_error).with_context(|| format!("Failed to connect to {}", path.display()))
+        }
+    }
+}
+
+/// Reports whether a failed connect attempt was refused or hit a missing
+/// path, the two error kinds this module treats as "no daemon behind the socket".
+fn is_stale_socket_error(error: &std::io::Error) -> bool {
+    use std::io::ErrorKind;
+
+    let kind = error.kind();
+    kind == ErrorKind::ConnectionRefused || kind == ErrorKind::NotFound
+}
+
+/// Deletes the socket file for `opts` when nothing accepts connections on it.
+///
+/// Returns `Ok(false)` when the path does not exist or a connection succeeds,
+/// and `Ok(true)` after removing a socket whose connect attempt failed with an
+/// error accepted by `is_stale_socket_error`. Any other connect failure, or a
+/// failure to remove the file, is returned as an error.
+fn cleanup_stale_socket(opts: &GlobalOpts) -> Result<bool> {
+    let path = socket_path(opts);
+    if !path.exists() {
+        return Ok(false);
+    }
+
+    match UnixStream::connect(&path) {
+        // A successful connect means something is listening; keep the socket.
+        Ok(_) => Ok(false),
+        Err(error) if is_stale_socket_error(&error) => {
+            std::fs::remove_file(&path)
+                .with_context(|| format!("Failed to remove stale socket {}", path.display()))?;
+            Ok(true)
+        }
+        // Unexpected failures are surfaced instead of deleting the file.
+        Err(error) => Err(error)
+            .with_context(|| format!("Failed to inspect daemon socket {}", path.display())),
+    }
 }

 fn spawn_daemon(opts: &GlobalOpts) -> Result<()> {
@ -51,9 +66,8 @@ fn spawn_daemon(opts: &GlobalOpts) -> Result<()> {
        .env("DESKCTL_PID_PATH", pid_path(opts))
        .stdin(Stdio::null())
        .stdout(Stdio::null())
-        .stderr(Stdio::piped());
+        .stderr(Stdio::null());

-    // Detach the daemon process on Unix
    unsafe {
        cmd.pre_exec(|| {
            libc::setsid();
@ -65,82 +79,136 @@ fn spawn_daemon(opts: &GlobalOpts) -> Result<()> {
    Ok(())
 }

+/// Chooses how long to wait for the daemon's reply to `request`.
+///
+/// `wait-window` and `wait-focus` wait for the request's `timeout_ms` value
+/// (10 000 ms when it is missing or not an unsigned integer) plus 5 000 ms.
+/// Every other action waits 30 seconds.
+fn request_read_timeout(request: &Request) -> Duration {
+    let is_wait_action = matches!(request.action.as_str(), "wait-window" | "wait-focus");
+    if !is_wait_action {
+        return Duration::from_secs(30);
+    }
+
+    let requested_ms = match request
+        .extra
+        .get("timeout_ms")
+        .and_then(|value| value.as_u64())
+    {
+        Some(ms) => ms,
+        None => 10_000,
+    };
+    // saturating_add keeps a huge caller-supplied timeout from overflowing.
+    Duration::from_millis(requested_ms.saturating_add(5_000))
+}
+
+/// Sends `request` as one NDJSON line over `stream` and parses the single
+/// NDJSON line the daemon sends back.
+///
+/// The read timeout comes from `request_read_timeout`; the write timeout is
+/// five seconds. Errors are returned when a timeout cannot be set, when
+/// writing or reading fails, when the daemon closes the connection before
+/// replying, or when the reply is not a valid `Response`.
+fn send_request_over_stream(mut stream: UnixStream, request: &Request) -> Result<Response> {
+    stream.set_read_timeout(Some(request_read_timeout(request)))?;
+    stream.set_write_timeout(Some(Duration::from_secs(5)))?;
+
+    let json = serde_json::to_string(request)?;
+    writeln!(stream, "{json}")?;
+    stream.flush()?;
+
+    let mut reader = BufReader::new(&stream);
+    let mut line = String::new();
+    let bytes_read = reader
+        .read_line(&mut line)
+        .context("Failed to read daemon response")?;
+    // read_line yields Ok(0) at EOF; report that directly instead of letting
+    // the empty string surface as a confusing JSON parse error.
+    if bytes_read == 0 {
+        bail!("Daemon closed the connection without sending a response");
+    }
+
+    serde_json::from_str(line.trim()).context("Failed to parse daemon response")
+}
+
+/// Health-checks the daemon for `opts` by sending a `ping` request.
+///
+/// Succeeds only when the socket accepts a connection and the reply reports
+/// success. Otherwise the daemon's error text is returned, or a generic
+/// message when the reply carries none.
+fn ping_daemon(opts: &GlobalOpts) -> Result<()> {
+    let stream = connect_socket(&socket_path(opts))?;
+    let reply = send_request_over_stream(stream, &Request::new("ping"))?;
+    if !reply.success {
+        let message = reply
+            .error
+            .unwrap_or_else(|| "Daemon health probe failed".to_string());
+        bail!("{}", message);
+    }
+    Ok(())
+}
+
 fn ensure_daemon(opts: &GlobalOpts) -> Result<UnixStream> {
-    // Try connecting first
-    if let Some(stream) = try_connect(opts) {
-        return Ok(stream);
+    if ping_daemon(opts).is_ok() {
+        return connect_socket(&socket_path(opts));
+    }
+
+    let removed_stale_socket = cleanup_stale_socket(opts)?;
+    if removed_stale_socket && ping_daemon(opts).is_ok() {
+        return connect_socket(&socket_path(opts));
    }

-    // Spawn daemon
    spawn_daemon(opts)?;

-    // Retry with backoff
    let max_retries = 20;
    let base_delay = Duration::from_millis(50);
-    for i in 0..max_retries {
-        thread::sleep(base_delay * (i + 1).min(4));
-        if let Some(stream) = try_connect(opts) {
-            return Ok(stream);
+    for attempt in 0..max_retries {
+        thread::sleep(base_delay * (attempt + 1).min(4));
+        if ping_daemon(opts).is_ok() {
+            return connect_socket(&socket_path(opts));
        }
    }

    bail!(
-        "Failed to connect to daemon after {} retries.\n\
-         Socket path: {}",
+        "Failed to start a healthy daemon after {} retries.\nSocket path: {}",
        max_retries,
        socket_path(opts).display()
    );
 }

 pub fn send_command(opts: &GlobalOpts, request: &Request) -> Result<Response> {
-    let mut stream = ensure_daemon(opts)?;
-    stream.set_read_timeout(Some(Duration::from_secs(30)))?;
-    stream.set_write_timeout(Some(Duration::from_secs(5)))?;
-
-    // Send NDJSON request
-    let json = serde_json::to_string(request)?;
-    writeln!(stream, "{json}")?;
-    stream.flush()?;
-
-    // Read NDJSON response
-    let mut reader = BufReader::new(&stream);
-    let mut line = String::new();
-    reader.read_line(&mut line)?;
-
-    let response: Response =
-        serde_json::from_str(line.trim()).context("Failed to parse daemon response")?;
-
-    Ok(response)
+    send_request_over_stream(ensure_daemon(opts)?, request)
 }

-pub fn start_daemon(opts: &GlobalOpts) -> Result<()> {
-    if try_connect(opts).is_some() {
-        println!("Daemon already running ({})", socket_path(opts).display());
-        return Ok(());
-    }
-    spawn_daemon(opts)?;
-    // Wait briefly and verify
-    thread::sleep(Duration::from_millis(200));
-    if try_connect(opts).is_some() {
-        println!("Daemon started ({})", socket_path(opts).display());
-    } else {
-        bail!("Daemon failed to start");
+pub fn run_doctor(opts: &GlobalOpts) -> Result<()> {
+    let report = run_doctor_report(&socket_path(opts));
+    print_doctor_report(&report, opts.json)?;
+    if !report.healthy {
+        std::process::exit(1);
    }
    Ok(())
 }

-pub fn stop_daemon(opts: &GlobalOpts) -> Result<()> {
-    match try_connect(opts) {
-        Some(mut stream) => {
-            let req = Request::new("shutdown");
-            let json = serde_json::to_string(&req)?;
-            writeln!(stream, "{json}")?;
-            stream.flush()?;
-            println!("Daemon stopped");
+pub fn start_daemon(opts: &GlobalOpts) -> Result<()> {
+    if ping_daemon(opts).is_ok() {
+        println!("Daemon already running ({})", socket_path(opts).display());
+        return Ok(());
+    }
+
+    if cleanup_stale_socket(opts)? {
+        println!("Removed stale socket: {}", socket_path(opts).display());
+    }
+
+    spawn_daemon(opts)?;
+
+    let max_retries = 20;
+    for attempt in 0..max_retries {
+        thread::sleep(Duration::from_millis(50 * (attempt + 1).min(4) as u64));
+        if ping_daemon(opts).is_ok() {
+            println!("Daemon started ({})", socket_path(opts).display());
+            return Ok(());
        }
-        None => {
-            // Try to clean up stale socket
-            let path = socket_path(opts);
+    }
+
+    bail!(
+        "Daemon failed to become healthy.\nSocket path: {}",
+        socket_path(opts).display()
+    );
+}
+
+pub fn stop_daemon(opts: &GlobalOpts) -> Result<()> {
+    let path = socket_path(opts);
+    match UnixStream::connect(&path) {
+        Ok(stream) => {
+            let response = send_request_over_stream(stream, &Request::new("shutdown"))?;
+            if response.success {
+                println!("Daemon stopped");
+            } else {
+                bail!(
+                    "{}",
+                    response
+                        .error
+                        .unwrap_or_else(|| "Failed to stop daemon".to_string())
+                );
+            }
+        }
+        Err(error) if is_stale_socket_error(&error) => {
            if path.exists() {
                std::fs::remove_file(&path)?;
                println!("Removed stale socket: {}", path.display());
@ -148,15 +216,78 @@ pub fn stop_daemon(opts: &GlobalOpts) -> Result<()> {
                println!("Daemon not running");
            }
        }
+        Err(error) => {
+            return Err(error)
+                .with_context(|| format!("Failed to inspect daemon socket {}", path.display()));
+        }
    }
    Ok(())
 }

 pub fn daemon_status(opts: &GlobalOpts) -> Result<()> {
-    if try_connect(opts).is_some() {
-        println!("Daemon running ({})", socket_path(opts).display());
-    } else {
-        println!("Daemon not running");
+    let path = socket_path(opts);
+    match ping_daemon(opts) {
+        Ok(()) => println!("Daemon running ({})", path.display()),
+        Err(_) if path.exists() => {
+            println!("Daemon socket exists but is unhealthy ({})", path.display())
+        }
+        Err(_) => println!("Daemon not running"),
    }
    Ok(())
 }
+
+/// Writes `report` to stdout.
+///
+/// With `json_output` the report is printed as pretty JSON. Otherwise a
+/// summary line is followed by one `[OK]`/`[FAIL]` line per check and, when a
+/// check carries one, an indented `fix:` line.
+fn print_doctor_report(report: &DoctorReport, json_output: bool) -> Result<()> {
+    if json_output {
+        let rendered = serde_json::to_string_pretty(report)?;
+        println!("{}", rendered);
+        return Ok(());
+    }
+
+    let verdict = if report.healthy {
+        "healthy"
+    } else {
+        "issues found"
+    };
+    println!("deskctl doctor: {}", verdict);
+
+    for check in report.checks.iter() {
+        let status = match check.ok {
+            true => "OK",
+            false => "FAIL",
+        };
+        println!("[{status}] {}: {}", check.name, check.details);
+        if let Some(fix) = check.fix.as_ref() {
+            println!("       fix: {fix}");
+        }
+    }
+    Ok(())
+}
+
+// Unit tests for the stale-socket cleanup helper.
+#[cfg(test)]
+mod tests {
+    use super::{cleanup_stale_socket, socket_path};
+    use crate::cli::GlobalOpts;
+    use std::time::{SystemTime, UNIX_EPOCH};
+
+    /// A socket file left on disk after its listener is dropped must be
+    /// reported as removed and must no longer exist afterwards.
+    #[test]
+    fn cleanup_stale_socket_removes_refused_socket_path() {
+        // The nanosecond timestamp gives each run its own scratch directory.
+        let temp = std::env::temp_dir().join(format!(
+            "deskctl-test-{}",
+            SystemTime::now()
+                .duration_since(UNIX_EPOCH)
+                .unwrap()
+                .as_nanos()
+        ));
+        std::fs::create_dir_all(&temp).unwrap();
+        let opts = GlobalOpts {
+            socket: Some(temp.join("stale.sock")),
+            session: "test".to_string(),
+            json: false,
+        };
+
+        // Bind then drop the listener; presumably the file stays on disk with
+        // nothing listening, which is the stale state under test.
+        let listener = std::os::unix::net::UnixListener::bind(socket_path(&opts)).unwrap();
+        drop(listener);
+
+        assert!(cleanup_stale_socket(&opts).unwrap());
+        assert!(!socket_path(&opts).exists());
+
+        // Best-effort cleanup; a failure here must not fail the test.
+        let _ = std::fs::remove_dir_all(&temp);
+    }
+}
--- a/src/cli/mod.rs
+++ b/src/cli/mod.rs
--- a/src/cli/upgrade.rs
+++ b/src/cli/upgrade.rs
@ -0,0 +1,465 @@
+use std::io::{self, IsTerminal, Write};
+use std::path::{Path, PathBuf};
+use std::process::Command;
+
+use anyhow::{Context, Result};
+use serde_json::json;
+
+use crate::cli::{GlobalOpts, UpgradeOpts};
+use crate::core::protocol::Response;
+
+/// Installation channels that `detect_install_method` can report for the
+/// running executable.
+#[derive(Clone, Copy, Debug, Eq, PartialEq)]
+enum InstallMethod {
+    Npm,
+    Cargo,
+    Nix,
+    Source,
+    Unknown,
+}
+
+impl InstallMethod {
+    /// Lower-case identifier used for this method in messages and JSON payloads.
+    fn as_str(self) -> &'static str {
+        match self {
+            InstallMethod::Unknown => "unknown",
+            InstallMethod::Source => "source",
+            InstallMethod::Nix => "nix",
+            InstallMethod::Cargo => "cargo",
+            InstallMethod::Npm => "npm",
+        }
+    }
+}
+
+/// The external command that upgrades an install made through `install_method`.
+#[derive(Debug)]
+struct UpgradePlan {
+    install_method: InstallMethod,
+    program: &'static str,
+    args: Vec<&'static str>,
+}
+
+impl UpgradePlan {
+    /// Renders the program and its arguments as one space-separated string.
+    fn command_line(&self) -> String {
+        let mut words: Vec<&str> = Vec::with_capacity(self.args.len() + 1);
+        words.push(self.program);
+        words.extend(self.args.iter().copied());
+        words.join(" ")
+    }
+}
+
+/// The version pair compared by `run_upgrade`.
+#[derive(Debug)]
+struct VersionInfo {
+    /// Version of the running binary (filled from `CARGO_PKG_VERSION`).
+    current: String,
+    /// Latest version reported by the install channel's registry query.
+    latest: String,
+}
+
+/// Runs the `upgrade` command and describes the outcome as a `Response`.
+///
+/// Steps, in order: detect the install method from the current executable
+/// path, resolve the current and latest versions, ask for confirmation unless
+/// `upgrade_opts.yes` is set, then run the channel's upgrade command.
+///
+/// Expected failures (unsupported install method, version lookup failure,
+/// missing confirmation, failed upgrade command) come back as `Ok` with an
+/// error `Response`. `Err` is returned only when the executable path cannot
+/// be determined or the confirmation prompt's I/O fails.
+pub fn run_upgrade(opts: &GlobalOpts, upgrade_opts: &UpgradeOpts) -> Result<Response> {
+    let current_exe = std::env::current_exe().context("Failed to determine executable path")?;
+    let install_method = detect_install_method(&current_exe);
+
+    // No plan means this install method has no automated upgrade path.
+    let Some(plan) = upgrade_plan(install_method) else {
+        return Ok(Response::err_with_data(
+            format!(
+                "deskctl upgrade is not supported for {} installs.",
+                install_method.as_str()
+            ),
+            json!({
+                "kind": "upgrade_unsupported",
+                "install_method": install_method.as_str(),
+                "current_exe": current_exe.display().to_string(),
+                "hint": upgrade_hint(install_method),
+            }),
+        ));
+    };
+
+    // Progress lines are printed only when JSON output is off.
+    if !opts.json {
+        println!("- Checking for updates...");
+    }
+
+    let versions = match resolve_versions(&plan) {
+        Ok(versions) => versions,
+        Err(response) => return Ok(response),
+    };
+
+    // Plain string equality: any difference counts as an available upgrade.
+    if versions.current == versions.latest {
+        return Ok(Response::ok(json!({
+            "action": "upgrade",
+            "status": "up_to_date",
+            "install_method": plan.install_method.as_str(),
+            "current_version": versions.current,
+            "latest_version": versions.latest,
+        })));
+    }
+
+    if !upgrade_opts.yes {
+        // Without --yes, a prompt is only possible on an interactive terminal
+        // in non-JSON mode; otherwise report that confirmation is required.
+        if opts.json || !io::stdin().is_terminal() {
+            return Ok(Response::err_with_data(
+                format!(
+                    "Upgrade confirmation required for {} -> {}.",
+                    versions.current, versions.latest
+                ),
+                json!({
+                    "kind": "upgrade_confirmation_required",
+                    "install_method": plan.install_method.as_str(),
+                    "current_version": versions.current,
+                    "latest_version": versions.latest,
+                    "command": plan.command_line(),
+                    "hint": "Re-run with --yes to upgrade non-interactively.",
+                }),
+            ));
+        }
+
+        if !confirm_upgrade(&versions)? {
+            return Ok(Response::ok(json!({
+                "action": "upgrade",
+                "status": "cancelled",
+                "install_method": plan.install_method.as_str(),
+                "current_version": versions.current,
+                "latest_version": versions.latest,
+            })));
+        }
+    }
+
+    if !opts.json {
+        println!(
+            "- Upgrading deskctl from {} -> {}...",
+            versions.current, versions.latest
+        );
+    }
+
+    // output() captures the child's stdout/stderr rather than inheriting them.
+    let output = match Command::new(plan.program).args(&plan.args).output() {
+        Ok(output) => output,
+        Err(error) => return Ok(upgrade_spawn_error_response(&plan, &versions, &error)),
+    };
+
+    if output.status.success() {
+        return Ok(Response::ok(json!({
+            "action": "upgrade",
+            "status": "upgraded",
+            "install_method": plan.install_method.as_str(),
+            "current_version": versions.current,
+            "latest_version": versions.latest,
+            "command": plan.command_line(),
+            "exit_code": output.status.code(),
+        })));
+    }
+
+    Ok(upgrade_command_failed_response(&plan, &versions, &output))
+}
+
+/// Pairs the compiled-in package version with the latest version published
+/// for the plan's install channel.
+///
+/// npm and cargo installs query their registries. Any other install method
+/// yields an `upgrade_failed` error `Response`.
+fn resolve_versions(plan: &UpgradePlan) -> std::result::Result<VersionInfo, Response> {
+    let method = plan.install_method;
+    let lookup = match method {
+        InstallMethod::Npm => query_npm_latest_version(),
+        InstallMethod::Cargo => query_cargo_latest_version(),
+        InstallMethod::Nix | InstallMethod::Source | InstallMethod::Unknown => {
+            Err(Response::err_with_data(
+                "Could not determine the latest published version.".to_string(),
+                json!({
+                    "kind": "upgrade_failed",
+                    "install_method": method.as_str(),
+                    "reason": "Could not determine the latest published version for this install method.",
+                    "command": plan.command_line(),
+                    "hint": upgrade_hint(method),
+                }),
+            ))
+        }
+    };
+
+    lookup.map(|latest| VersionInfo {
+        current: env!("CARGO_PKG_VERSION").to_string(),
+        latest,
+    })
+}
+
+/// Asks npm for the published `deskctl` version by running
+/// `npm view deskctl version --json`.
+///
+/// Returns the version string on success. Returns an `upgrade_failed` error
+/// `Response` when npm cannot be started, exits unsuccessfully, or prints
+/// something other than a single JSON string.
+fn query_npm_latest_version() -> std::result::Result<String, Response> {
+    let output = Command::new("npm")
+        .args(["view", "deskctl", "version", "--json"])
+        .output()
+        .map_err(|error| {
+            // The process could not be spawned at all.
+            Response::err_with_data(
+                "Failed to check the latest npm version.".to_string(),
+                json!({
+                    "kind": "upgrade_failed",
+                    "install_method": InstallMethod::Npm.as_str(),
+                    "reason": "Failed to run npm view deskctl version --json.",
+                    "io_error": error.to_string(),
+                    "command": "npm view deskctl version --json",
+                    "hint": upgrade_hint(InstallMethod::Npm),
+                }),
+            )
+        })?;
+
+    if !output.status.success() {
+        return Err(Response::err_with_data(
+            "Failed to check the latest npm version.".to_string(),
+            json!({
+                "kind": "upgrade_failed",
+                "install_method": InstallMethod::Npm.as_str(),
+                "reason": command_failure_reason(&output),
+                "command": "npm view deskctl version --json",
+                "hint": upgrade_hint(InstallMethod::Npm),
+            }),
+        ));
+    }
+
+    // stdout must deserialize as exactly one JSON string.
+    serde_json::from_slice::<String>(&output.stdout).map_err(|_| {
+        Response::err_with_data(
+            "Failed to parse the latest npm version.".to_string(),
+            json!({
+                "kind": "upgrade_failed",
+                "install_method": InstallMethod::Npm.as_str(),
+                "reason": "npm view returned an unexpected version payload.",
+                "command": "npm view deskctl version --json",
+                "hint": upgrade_hint(InstallMethod::Npm),
+            }),
+        )
+    })
+}
+
+/// Asks crates.io for the published `deskctl` version by running
+/// `cargo search deskctl --limit 1`.
+///
+/// Returns the version string on success. Returns an `upgrade_failed` error
+/// `Response` when cargo cannot be started, exits unsuccessfully, or the
+/// output has no entry for the crate named exactly `deskctl`.
+fn query_cargo_latest_version() -> std::result::Result<String, Response> {
+    let output = Command::new("cargo")
+        .args(["search", "deskctl", "--limit", "1"])
+        .output()
+        .map_err(|error| {
+            Response::err_with_data(
+                "Failed to check the latest crates.io version.".to_string(),
+                json!({
+                    "kind": "upgrade_failed",
+                    "install_method": InstallMethod::Cargo.as_str(),
+                    "reason": "Failed to run cargo search deskctl --limit 1.",
+                    "io_error": error.to_string(),
+                    "command": "cargo search deskctl --limit 1",
+                    "hint": upgrade_hint(InstallMethod::Cargo),
+                }),
+            )
+        })?;
+
+    if !output.status.success() {
+        return Err(Response::err_with_data(
+            "Failed to check the latest crates.io version.".to_string(),
+            json!({
+                "kind": "upgrade_failed",
+                "install_method": InstallMethod::Cargo.as_str(),
+                "reason": command_failure_reason(&output),
+                "command": "cargo search deskctl --limit 1",
+                "hint": upgrade_hint(InstallMethod::Cargo),
+            }),
+        ));
+    }
+
+    let stdout = String::from_utf8_lossy(&output.stdout);
+    let latest = parse_cargo_search_version(&stdout, "deskctl");
+
+    latest.ok_or_else(|| {
+        Response::err_with_data(
+            "Failed to determine the latest crates.io version.".to_string(),
+            json!({
+                "kind": "upgrade_failed",
+                "install_method": InstallMethod::Cargo.as_str(),
+                "reason": "cargo search did not return a published deskctl crate version.",
+                "command": "cargo search deskctl --limit 1",
+                "hint": upgrade_hint(InstallMethod::Cargo),
+            }),
+        )
+    })
+}
+
+/// Extracts the quoted version from the `cargo search` line for `crate_name`.
+///
+/// Lines look like `name = "1.2.3"    # description`. Only a line whose name
+/// equals `crate_name` is accepted, so a differently named top hit (for
+/// example `deskctl-foo`) is never mistaken for this crate's version.
+fn parse_cargo_search_version(stdout: &str, crate_name: &str) -> Option<String> {
+    stdout.lines().find_map(|line| {
+        let (name, rest) = line.split_once('=')?;
+        if name.trim() != crate_name {
+            return None;
+        }
+        rest.split('"')
+            .nth(1)
+            .filter(|value| !value.is_empty())
+            .map(str::to_string)
+    })
+}
+
+/// Prompts on stdout for confirmation and reads one line from stdin.
+///
+/// Returns `true` only when the trimmed answer is exactly `y`, `Y`, `yes`,
+/// `YES` or `Yes`. Anything else, including an empty line, declines.
+fn confirm_upgrade(versions: &VersionInfo) -> Result<bool> {
+    print!(
+        "Upgrade deskctl from {} -> {}? [y/N] ",
+        versions.current, versions.latest
+    );
+    // print! does not flush, so push the prompt out before blocking on stdin.
+    io::stdout().flush()?;
+
+    let mut answer = String::new();
+    io::stdin().read_line(&mut answer)?;
+
+    let accepted = ["y", "Y", "yes", "YES", "Yes"].contains(&answer.trim());
+    Ok(accepted)
+}
+
+/// Builds the error `Response` for an upgrade command that ran but exited
+/// unsuccessfully, including its exit code and first non-empty output line.
+fn upgrade_command_failed_response(
+    plan: &UpgradePlan,
+    versions: &VersionInfo,
+    output: &std::process::Output,
+) -> Response {
+    let command = plan.command_line();
+    let message = format!("Upgrade command failed: {}", command);
+    let details = json!({
+        "kind": "upgrade_failed",
+        "install_method": plan.install_method.as_str(),
+        "current_version": versions.current,
+        "latest_version": versions.latest,
+        "command": command,
+        "exit_code": output.status.code(),
+        "reason": command_failure_reason(output),
+        "hint": upgrade_hint(plan.install_method),
+    });
+    Response::err_with_data(message, details)
+}
+
+/// Builds the error `Response` for an upgrade command that could not be
+/// started at all, carrying the underlying I/O error text.
+fn upgrade_spawn_error_response(
+    plan: &UpgradePlan,
+    versions: &VersionInfo,
+    error: &std::io::Error,
+) -> Response {
+    let command = plan.command_line();
+    let message = format!("Failed to run {}", command);
+    let details = json!({
+        "kind": "upgrade_failed",
+        "install_method": plan.install_method.as_str(),
+        "current_version": versions.current,
+        "latest_version": versions.latest,
+        "command": command,
+        "io_error": error.to_string(),
+        "hint": upgrade_hint(plan.install_method),
+    });
+    Response::err_with_data(message, details)
+}
+
+/// Summarizes why a command failed in a single line.
+///
+/// Returns the first non-blank line of stderr, then of stdout, trimmed. When
+/// both are blank it falls back to a message naming the exit code, or to a
+/// generic message when no exit code is available.
+fn command_failure_reason(output: &std::process::Output) -> String {
+    let stderr = String::from_utf8_lossy(&output.stderr);
+    let stdout = String::from_utf8_lossy(&output.stdout);
+
+    for line in stderr.lines().chain(stdout.lines()) {
+        let trimmed = line.trim();
+        if !trimmed.is_empty() {
+            return trimmed.to_string();
+        }
+    }
+
+    match output.status.code() {
+        Some(code) => format!("Command exited with status {code}."),
+        None => "Command exited unsuccessfully.".to_string(),
+    }
+}
+
+/// Maps an install method to the command that upgrades it.
+///
+/// npm and cargo installs get a plan. Nix, source and unknown installs return
+/// `None` because no automated upgrade command is defined for them.
+fn upgrade_plan(install_method: InstallMethod) -> Option<UpgradePlan> {
+    let (program, args): (&'static str, Vec<&'static str>) = match install_method {
+        InstallMethod::Npm => ("npm", vec!["install", "-g", "deskctl@latest"]),
+        InstallMethod::Cargo => ("cargo", vec!["install", "deskctl", "--locked"]),
+        InstallMethod::Nix | InstallMethod::Source | InstallMethod::Unknown => return None,
+    };
+
+    Some(UpgradePlan {
+        install_method,
+        program,
+        args,
+    })
+}
+
+/// Returns the remediation hint shown to the user for each install method.
+fn upgrade_hint(install_method: InstallMethod) -> &'static str {
+    use InstallMethod::{Cargo, Nix, Npm, Source, Unknown};
+
+    match install_method {
+        Npm => "Retry with --yes or run npm install -g deskctl@latest directly.",
+        Cargo => "Retry with --yes or run cargo install deskctl --locked directly.",
+        Nix => "Use nix profile upgrade or update the flake reference you installed from.",
+        Source => "Rebuild from source or reinstall deskctl through npm, cargo, or nix.",
+        Unknown => "Reinstall deskctl through a supported channel such as npm, cargo, or nix.",
+    }
+}
+
+/// Classifies how deskctl was installed from the path of its executable.
+///
+/// The checks run in a fixed order (npm, nix, cargo, source tree) and the
+/// first match wins. A path matching none of them is `Unknown`.
+fn detect_install_method(current_exe: &Path) -> InstallMethod {
+    if looks_like_npm_install(current_exe) {
+        InstallMethod::Npm
+    } else if looks_like_nix_install(current_exe) {
+        InstallMethod::Nix
+    } else if looks_like_cargo_install(current_exe) {
+        InstallMethod::Cargo
+    } else if looks_like_source_tree(current_exe) {
+        InstallMethod::Source
+    } else {
+        InstallMethod::Unknown
+    }
+}
+
+/// True when the normalized path contains both `/node_modules/deskctl/` and
+/// `/vendor/`.
+fn looks_like_npm_install(path: &Path) -> bool {
+    let exe = normalize(path);
+    ["/node_modules/deskctl/", "/vendor/"]
+        .iter()
+        .all(|marker| exe.contains(*marker))
+}
+
+/// True when the normalized path begins with `/nix/store/`.
+fn looks_like_nix_install(path: &Path) -> bool {
+    let exe = normalize(path);
+    exe.strip_prefix("/nix/store/").is_some()
+}
+
+/// True when `path` is exactly `<cargo home>/bin/deskctl`.
+///
+/// The cargo home is `$CARGO_HOME` when set, otherwise `$HOME/.cargo`. `HOME`
+/// is consulted only as that fallback, so an explicit `CARGO_HOME` is honored
+/// in environments where `HOME` is missing. With neither variable set the
+/// result is `false`.
+fn looks_like_cargo_install(path: &Path) -> bool {
+    let cargo_home = match std::env::var_os("CARGO_HOME") {
+        Some(dir) => PathBuf::from(dir),
+        None => match std::env::var_os("HOME") {
+            Some(home) => PathBuf::from(home).join(".cargo"),
+            None => return false,
+        },
+    };
+    path == cargo_home.join("bin").join("deskctl")
+}
+
+/// True when the normalized path contains a cargo debug or release build
+/// location for the `deskctl` binary.
+fn looks_like_source_tree(path: &Path) -> bool {
+    let exe = normalize(path);
+    ["/target/debug/deskctl", "/target/release/deskctl"]
+        .iter()
+        .any(|marker| exe.contains(*marker))
+}
+
+/// Renders `path` as a lossy UTF-8 string with every backslash replaced by a
+/// forward slash, so substring checks can use one separator.
+fn normalize(path: &Path) -> String {
+    path.to_string_lossy()
+        .chars()
+        .map(|ch| if ch == '\\' { '/' } else { ch })
+        .collect()
+}
+
+// Unit tests for install-method detection, upgrade planning and failure
+// summaries.
+#[cfg(test)]
+mod tests {
+    use std::os::unix::process::ExitStatusExt;
+    use std::path::Path;
+
+    use super::{command_failure_reason, detect_install_method, upgrade_plan, InstallMethod};
+
+    /// A binary under `node_modules/deskctl/vendor/` is classified as npm.
+    #[test]
+    fn detects_npm_install_path() {
+        let method = detect_install_method(Path::new(
+            "/usr/local/lib/node_modules/deskctl/vendor/deskctl-linux-x86_64",
+        ));
+        assert_eq!(method, InstallMethod::Npm);
+    }
+
+    /// A binary under `/nix/store/` is classified as nix.
+    #[test]
+    fn detects_nix_install_path() {
+        let method = detect_install_method(Path::new("/nix/store/abc123-deskctl/bin/deskctl"));
+        assert_eq!(method, InstallMethod::Nix);
+    }
+
+    /// A binary under `target/debug/` is classified as a source build.
+    #[test]
+    fn detects_source_tree_path() {
+        let method =
+            detect_install_method(Path::new("/Users/example/src/deskctl/target/debug/deskctl"));
+        assert_eq!(method, InstallMethod::Source);
+    }
+
+    /// The npm plan renders as a global install of the `latest` tag.
+    #[test]
+    fn npm_upgrade_plan_uses_global_install() {
+        let plan = upgrade_plan(InstallMethod::Npm).expect("npm installs should support upgrade");
+        assert_eq!(plan.command_line(), "npm install -g deskctl@latest");
+    }
+
+    /// Nix installs have no automated upgrade command.
+    #[test]
+    fn nix_install_has_no_upgrade_plan() {
+        assert!(upgrade_plan(InstallMethod::Nix).is_none());
+    }
+
+    /// The first non-empty stderr line is used as the failure reason.
+    #[test]
+    fn failure_reason_prefers_stderr() {
+        let output = std::process::Output {
+            // Raw wait status: exit code 1 lives in the high byte.
+            status: std::process::ExitStatus::from_raw(1 << 8),
+            stdout: b"".to_vec(),
+            stderr: b"boom\n".to_vec(),
+        };
+
+        assert_eq!(command_failure_reason(&output), "boom");
+    }
+}
--- a/src/core/doctor.rs
+++ b/src/core/doctor.rs
@ -0,0 +1,211 @@
+use std::io::{BufRead, BufReader, Write};
+use std::os::unix::net::UnixStream;
+use std::path::Path;
+use std::time::Duration;
+
+use anyhow::Result;
+use serde::Serialize;
+
+use crate::backend::{x11::X11Backend, DesktopBackend};
+use crate::core::protocol::{Request, Response};
+use crate::core::session::detect_session;
+
+/// Result of a full `doctor` run; serializable for JSON output.
+#[derive(Debug, Serialize)]
+pub struct DoctorReport {
+    /// True only when every entry in `checks` passed.
+    pub healthy: bool,
+    /// Individual check results, in the order they were executed.
+    pub checks: Vec<DoctorCheck>,
+}
+
+/// Outcome of a single diagnostic check.
+#[derive(Debug, Serialize)]
+pub struct DoctorCheck {
+    /// Short identifier of the check, e.g. `display` or `daemon-socket`.
+    pub name: String,
+    /// Whether the check passed.
+    pub ok: bool,
+    /// Human-readable result or error text.
+    pub details: String,
+    /// Suggested remediation; omitted from serialized output when `None`.
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub fix: Option<String>,
+}
+
+/// Runs every diagnostic check and collects the results into a report.
+///
+/// Checks, in order: `display`, `session`, `backend`, `window-enumeration`,
+/// `screenshot`, `socket-dir`, `daemon-socket`. When the X11 backend cannot
+/// be created, the two checks that need it are recorded as failures instead
+/// of being run. The report is healthy only if every check passed.
+pub fn run(socket_path: &Path) -> DoctorReport {
+    let mut checks = Vec::new();
+
+    // DISPLAY must be present and non-empty.
+    let display = std::env::var("DISPLAY").ok();
+    checks.push(match display {
+        Some(ref value) if !value.is_empty() => check_ok("display", format!("DISPLAY={value}")),
+        _ => check_fail(
+            "display",
+            "DISPLAY is not set".to_string(),
+            "Export DISPLAY to point at the active X11 server.".to_string(),
+        ),
+    });
+
+    checks.push(match detect_session() {
+        Ok(_) => check_ok("session", "X11 session detected".to_string()),
+        Err(error) => check_fail(
+            "session",
+            error.to_string(),
+            "Run deskctl inside an X11 session. Wayland is not supported in this phase."
+                .to_string(),
+        ),
+    });
+
+    // Keep the backend (if any) so the dependent checks below can reuse it.
+    let mut backend = match X11Backend::new() {
+        Ok(backend) => {
+            checks.push(check_ok(
+                "backend",
+                "Connected to the X11 backend successfully".to_string(),
+            ));
+            Some(backend)
+        }
+        Err(error) => {
+            checks.push(check_fail(
+                "backend",
+                error.to_string(),
+                "Ensure the X server is reachable and the current session can access it."
+                    .to_string(),
+            ));
+            None
+        }
+    };
+
+    if let Some(backend) = backend.as_mut() {
+        checks.push(match backend.list_windows() {
+            Ok(windows) => check_ok(
+                "window-enumeration",
+                format!("Enumerated {} visible windows", windows.len()),
+            ),
+            Err(error) => check_fail(
+                "window-enumeration",
+                error.to_string(),
+                "Verify the desktop session exposes EWMH window metadata and the X11 connection is healthy."
+                    .to_string(),
+            ),
+        });
+
+        checks.push(match backend.capture_screenshot() {
+            Ok(image) => check_ok(
+                "screenshot",
+                format!(
+                    "Captured {}x{} desktop image",
+                    image.width(),
+                    image.height()
+                ),
+            ),
+            Err(error) => check_fail(
+                "screenshot",
+                error.to_string(),
+                "Verify the X11 session permits desktop capture on the active display.".to_string(),
+            ),
+        });
+    } else {
+        // No backend: record the dependent checks as failed rather than
+        // omitting them, so the report always lists the same checks.
+        checks.push(check_fail(
+            "window-enumeration",
+            "Skipped because backend initialization failed".to_string(),
+            "Fix the X11 backend error before retrying.".to_string(),
+        ));
+        checks.push(check_fail(
+            "screenshot",
+            "Skipped because backend initialization failed".to_string(),
+            "Fix the X11 backend error before retrying.".to_string(),
+        ));
+    }
+
+    checks.push(check_socket_dir(socket_path));
+    checks.push(check_daemon_socket(socket_path));
+
+    let healthy = checks.iter().all(|check| check.ok);
+    DoctorReport { healthy, checks }
+}
+
+/// Checks that the directory that should hold the socket can be created.
+///
+/// Note that this calls `create_dir_all`, so a passing check may create the
+/// directory as a side effect. A socket path with no parent is a failure.
+fn check_socket_dir(socket_path: &Path) -> DoctorCheck {
+    let socket_dir = match socket_path.parent() {
+        Some(dir) => dir,
+        None => {
+            return check_fail(
+                "socket-dir",
+                format!(
+                    "Socket path {} has no parent directory",
+                    socket_path.display()
+                ),
+                "Use a socket path inside a writable directory.".to_string(),
+            );
+        }
+    };
+
+    if let Err(error) = std::fs::create_dir_all(socket_dir) {
+        return check_fail(
+            "socket-dir",
+            error.to_string(),
+            format!("Ensure {} exists and is writable.", socket_dir.display()),
+        );
+    }
+
+    check_ok(
+        "socket-dir",
+        format!("Socket directory is ready at {}", socket_dir.display()),
+    )
+}
+
+/// Checks the daemon socket: a missing socket passes, an existing one must
+/// answer a ping successfully.
+fn check_daemon_socket(socket_path: &Path) -> DoctorCheck {
+    let shown = socket_path.display();
+
+    if !socket_path.exists() {
+        return check_ok(
+            "daemon-socket",
+            format!("No stale socket found at {}", shown),
+        );
+    }
+
+    if let Err(error) = ping_socket(socket_path) {
+        return check_fail(
+            "daemon-socket",
+            error.to_string(),
+            format!(
+                "Remove the stale socket at {} or run `deskctl daemon stop`.",
+                shown
+            ),
+        );
+    }
+
+    check_ok("daemon-socket", format!("Daemon is healthy at {}", shown))
+}
+
+/// Sends a `ping` request to the daemon at `socket_path` and verifies the reply.
+///
+/// Uses one-second read and write timeouts. Errors are returned when the
+/// connection fails, when the daemon closes the connection without replying,
+/// when the reply is not a valid `Response`, or when the reply reports failure.
+fn ping_socket(socket_path: &Path) -> Result<()> {
+    let mut stream = UnixStream::connect(socket_path)?;
+    stream.set_read_timeout(Some(Duration::from_secs(1)))?;
+    stream.set_write_timeout(Some(Duration::from_secs(1)))?;
+
+    let request = Request::new("ping");
+    let json = serde_json::to_string(&request)?;
+    writeln!(stream, "{json}")?;
+    stream.flush()?;
+
+    let mut reader = BufReader::new(&stream);
+    let mut line = String::new();
+    let bytes_read = reader.read_line(&mut line)?;
+    // read_line yields Ok(0) at EOF; say so instead of reporting the empty
+    // string as a JSON parse error.
+    if bytes_read == 0 {
+        anyhow::bail!("Daemon closed the connection without sending a response");
+    }
+    let response: Response = serde_json::from_str(line.trim())?;
+
+    if response.success {
+        Ok(())
+    } else {
+        anyhow::bail!(
+            "{}",
+            response
+                .error
+                .unwrap_or_else(|| "Daemon health probe failed".to_string())
+        )
+    }
+}
+
+/// Builds a passing check result with no suggested fix.
+fn check_ok(name: &str, details: String) -> DoctorCheck {
+    let name = String::from(name);
+    DoctorCheck {
+        fix: None,
+        ok: true,
+        name,
+        details,
+    }
+}
+
+/// Builds a failing check result that carries a suggested fix.
+fn check_fail(name: &str, details: String, fix: String) -> DoctorCheck {
+    let name = String::from(name);
+    DoctorCheck {
+        fix: Some(fix),
+        ok: false,
+        name,
+        details,
+    }
+}
--- a/src/core/mod.rs
+++ b/src/core/mod.rs
@ -1,3 +1,5 @@
+pub mod doctor;
+pub mod paths;
 pub mod protocol;
 pub mod refs;
 pub mod session;
--- a/src/core/paths.rs
+++ b/src/core/paths.rs
@ -0,0 +1,29 @@
+use std::path::PathBuf;
+
+/// Returns the directory that holds deskctl's per-session socket and pid files.
+///
+/// Resolution order:
+/// 1. `DESKCTL_SOCKET_DIR`, used verbatim;
+/// 2. `XDG_RUNTIME_DIR` with `deskctl` appended;
+/// 3. `.deskctl` under the home directory, or under `/tmp` when no home
+///    directory can be determined.
+///
+/// Variables are read with `var_os`, so values that are not valid UTF-8 are
+/// still honoured. An empty value is treated the same as an unset variable.
+pub fn socket_dir() -> PathBuf {
+    // An empty value would produce a relative path resolved against the current
+    // working directory, which is never what an override is meant to express.
+    let env_dir = |key: &str| std::env::var_os(key).filter(|value| !value.is_empty());
+
+    if let Some(dir) = env_dir("DESKCTL_SOCKET_DIR") {
+        return PathBuf::from(dir);
+    }
+    if let Some(runtime) = env_dir("XDG_RUNTIME_DIR") {
+        return PathBuf::from(runtime).join("deskctl");
+    }
+    dirs::home_dir()
+        .unwrap_or_else(|| PathBuf::from("/tmp"))
+        .join(".deskctl")
+}
+
+/// Returns `<socket_dir>/<session>.sock`, the socket path for `session`.
+pub fn socket_path_for_session(session: &str) -> PathBuf {
+    let mut path = socket_dir();
+    path.push(format!("{session}.sock"));
+    path
+}
+
+/// Returns `<socket_dir>/<session>.pid`, the pid-file path for `session`.
+pub fn pid_path_for_session(session: &str) -> PathBuf {
+    let mut path = socket_dir();
+    path.push(format!("{session}.pid"));
+    path
+}
+
+/// Returns the socket path given by `DESKCTL_SOCKET_PATH`, or `None` when unset.
+///
+/// The variable is read with `var_os`, so a path that is not valid UTF-8 is
+/// returned as-is instead of being silently treated as unset.
+pub fn socket_path_from_env() -> Option<PathBuf> {
+    std::env::var_os("DESKCTL_SOCKET_PATH").map(PathBuf::from)
+}
+
+/// Returns the pid-file path given by `DESKCTL_PID_PATH`, or `None` when unset.
+///
+/// The variable is read with `var_os`, so a path that is not valid UTF-8 is
+/// returned as-is instead of being silently treated as unset.
+pub fn pid_path_from_env() -> Option<PathBuf> {
+    std::env::var_os("DESKCTL_PID_PATH").map(PathBuf::from)
+}
--- a/src/core/protocol.rs
+++ b/src/core/protocol.rs
@ -58,4 +58,12 @@ impl Response {
            error: Some(msg.into()),
        }
    }
+
+    /// Builds a failed response that carries both an error message and a data payload.
+    ///
+    /// `success` is `false`, `data` wraps the supplied value and `error` holds
+    /// `msg` converted into a `String`.
+    pub fn err_with_data(msg: impl Into<String>, data: Value) -> Self {
+        let data = Some(data);
+        let error = Some(msg.into());
+        Self {
+            success: false,
+            data,
+            error,
+        }
+    }
 }
--- a/src/core/refs.rs
+++ b/src/core/refs.rs
@ -1,10 +1,15 @@
 use serde::{Deserialize, Serialize};
-use std::collections::HashMap;
+use std::collections::{HashMap, HashSet};
+
+use crate::backend::BackendWindow;
+use crate::core::types::WindowInfo;

 #[derive(Debug, Clone, Serialize, Deserialize)]
 #[allow(dead_code)]
 pub struct RefEntry {
-    pub xcb_id: u32,
+    pub ref_id: String,
+    pub window_id: String,
+    pub backend_window_id: u32,
    pub app_class: String,
    pub title: String,
    pub pid: u32,
@ -19,58 +24,462 @@ pub struct RefEntry {
 #[derive(Debug, Default)]
 #[allow(dead_code)]
 pub struct RefMap {
-    map: HashMap<String, RefEntry>,
+    refs: HashMap<String, RefEntry>,
+    window_id_to_ref: HashMap<String, String>,
+    backend_id_to_window_id: HashMap<u32, String>,
    next_ref: usize,
+    next_window: usize,
+}
+
+/// A window selector after classification by `SelectorQuery::parse`.
+#[derive(Debug, Clone, PartialEq, Eq)]
+pub enum SelectorQuery {
+    /// A ref id, written as `@<ref>` or `ref=<ref>`.
+    Ref(String),
+    /// A window id, written as `id=<window id>`.
+    WindowId(String),
+    /// A window title, written as `title=<title>`.
+    Title(String),
+    /// A window class, written as `class=<class>`.
+    Class(String),
+    /// The literal selector `focused`.
+    Focused,
+    /// Any selector that matches none of the explicit forms; holds the whole input.
+    Fuzzy(String),
+}
+
+/// Outcome of resolving a selector against a `RefMap`.
+///
+/// In the non-match variants `selector` is the original selector text and
+/// `mode` names the lookup that was attempted (`"ref"`, `"id"`, `"focused"`,
+/// `"title"`, `"class"` or `"fuzzy"`).
+#[derive(Debug, Clone)]
+pub enum ResolveResult {
+    /// Exactly one window matched; holds a clone of its entry.
+    Match(RefEntry),
+    /// No window matched.
+    NotFound {
+        selector: String,
+        mode: &'static str,
+    },
+    /// More than one window matched; `candidates` lists all of them.
+    Ambiguous {
+        selector: String,
+        mode: &'static str,
+        candidates: Vec<WindowInfo>,
+    },
+    /// The selector itself was rejected (e.g. an empty `title=` or `class=`
+    /// value); `message` explains why.
+    Invalid {
+        selector: String,
+        mode: &'static str,
+        message: String,
+    },
 }

 #[allow(dead_code)]
 impl RefMap {
    pub fn new() -> Self {
        Self {
-            map: HashMap::new(),
+            refs: HashMap::new(),
+            window_id_to_ref: HashMap::new(),
+            backend_id_to_window_id: HashMap::new(),
            next_ref: 1,
+            next_window: 1,
        }
    }

    pub fn clear(&mut self) {
-        self.map.clear();
+        self.refs.clear();
+        self.window_id_to_ref.clear();
        self.next_ref = 1;
    }

-    pub fn insert(&mut self, entry: RefEntry) -> String {
-        let ref_id = format!("w{}", self.next_ref);
-        self.next_ref += 1;
-        self.map.insert(ref_id.clone(), entry);
-        ref_id
-    }
+    pub fn rebuild(&mut self, windows: &[BackendWindow]) -> Vec<WindowInfo> {
+        self.clear();

-    /// Resolve a selector to a RefEntry.
-    /// Accepts: "@w1", "w1", "ref=w1", or a substring match on app_class/title.
-    pub fn resolve(&self, selector: &str) -> Option<&RefEntry> {
-        let normalized = selector
-            .strip_prefix('@')
-            .or_else(|| selector.strip_prefix("ref="))
-            .unwrap_or(selector);
+        let active_backend_ids = windows
+            .iter()
+            .map(|window| window.native_id)
+            .collect::<HashSet<_>>();
+        self.backend_id_to_window_id
+            .retain(|backend_id, _| active_backend_ids.contains(backend_id));

-        // Try direct ref lookup
-        if let Some(entry) = self.map.get(normalized) {
-            return Some(entry);
+        let mut public_windows = Vec::with_capacity(windows.len());
+        for window in windows {
+            let ref_id = format!("w{}", self.next_ref);
+            self.next_ref += 1;
+
+            let window_id = self.window_id_for_backend(window.native_id);
+            let entry = RefEntry {
+                ref_id: ref_id.clone(),
+                window_id: window_id.clone(),
+                backend_window_id: window.native_id,
+                app_class: window.app_name.clone(),
+                title: window.title.clone(),
+                pid: 0,
+                x: window.x,
+                y: window.y,
+                width: window.width,
+                height: window.height,
+                focused: window.focused,
+                minimized: window.minimized,
+            };
+
+            self.window_id_to_ref
+                .insert(window_id.clone(), ref_id.clone());
+            self.refs.insert(ref_id.clone(), entry);
+            public_windows.push(WindowInfo {
+                ref_id,
+                window_id,
+                title: window.title.clone(),
+                app_name: window.app_name.clone(),
+                x: window.x,
+                y: window.y,
+                width: window.width,
+                height: window.height,
+                focused: window.focused,
+                minimized: window.minimized,
+            });
        }

-        // Try substring match on app_class or title (case-insensitive)
-        let lower = selector.to_lowercase();
-        self.map.values().find(|e| {
-            e.app_class.to_lowercase().contains(&lower) || e.title.to_lowercase().contains(&lower)
-        })
+        public_windows
+    }
+
+    /// Returns the `win<N>` id associated with `backend_window_id`.
+    ///
+    /// A backend id that is already known keeps its previously assigned id;
+    /// otherwise the next `win<N>` id is allocated, recorded and returned.
+    fn window_id_for_backend(&mut self, backend_window_id: u32) -> String {
+        match self.backend_id_to_window_id.get(&backend_window_id) {
+            Some(known) => known.clone(),
+            None => {
+                let fresh = format!("win{}", self.next_window);
+                self.next_window += 1;
+                self.backend_id_to_window_id
+                    .insert(backend_window_id, fresh.clone());
+                fresh
+            }
+        }
+    }
+
+    /// Parses `selector` and resolves it against the current ref table.
+    pub fn resolve(&self, selector: &str) -> ResolveResult {
+        let query = SelectorQuery::parse(selector);
+        self.resolve_query(query, selector)
     }

    /// Resolve a selector to the center coordinates of the window.
-    pub fn resolve_to_center(&self, selector: &str) -> Option<(i32, i32)> {
+    pub fn resolve_to_center(&self, selector: &str) -> ResolveResult {
        self.resolve(selector)
-            .map(|e| (e.x + e.width as i32 / 2, e.y + e.height as i32 / 2))
    }

    pub fn entries(&self) -> impl Iterator<Item = (&String, &RefEntry)> {
-        self.map.iter()
+        self.refs.iter()
+    }
+
+    /// Resolves an already-parsed `query` against the current ref table.
+    ///
+    /// `selector` is the original selector text and is only echoed back in
+    /// non-match results. `Ref` and `WindowId` are direct map lookups;
+    /// `Focused`, `Title`, `Class` and `Fuzzy` collect every matching entry
+    /// and defer to `resolve_candidates`. Empty `title=` / `class=` values
+    /// are rejected as `Invalid`.
+    fn resolve_query(&self, query: SelectorQuery, selector: &str) -> ResolveResult {
+        match query {
+            SelectorQuery::Ref(ref_id) => self
+                .refs
+                .get(&ref_id)
+                .cloned()
+                .map(ResolveResult::Match)
+                .unwrap_or_else(|| ResolveResult::NotFound {
+                    selector: selector.to_string(),
+                    mode: "ref",
+                }),
+            // Window ids are mapped to their ref id first, then to the entry.
+            SelectorQuery::WindowId(window_id) => self
+                .window_id_to_ref
+                .get(&window_id)
+                .and_then(|ref_id| self.refs.get(ref_id))
+                .cloned()
+                .map(ResolveResult::Match)
+                .unwrap_or_else(|| ResolveResult::NotFound {
+                    selector: selector.to_string(),
+                    mode: "id",
+                }),
+            SelectorQuery::Focused => self.resolve_candidates(
+                selector,
+                "focused",
+                self.refs
+                    .values()
+                    .filter(|entry| entry.focused)
+                    .cloned()
+                    .collect(),
+            ),
+            SelectorQuery::Title(title) => {
+                if title.is_empty() {
+                    return ResolveResult::Invalid {
+                        selector: selector.to_string(),
+                        mode: "title",
+                        message: "title selectors must not be empty".to_string(),
+                    };
+                }
+                // Whole-title match; only ASCII letters are compared case-insensitively.
+                self.resolve_candidates(
+                    selector,
+                    "title",
+                    self.refs
+                        .values()
+                        .filter(|entry| entry.title.eq_ignore_ascii_case(&title))
+                        .cloned()
+                        .collect(),
+                )
+            }
+            SelectorQuery::Class(app_class) => {
+                if app_class.is_empty() {
+                    return ResolveResult::Invalid {
+                        selector: selector.to_string(),
+                        mode: "class",
+                        message: "class selectors must not be empty".to_string(),
+                    };
+                }
+                // Whole-class match; only ASCII letters are compared case-insensitively.
+                self.resolve_candidates(
+                    selector,
+                    "class",
+                    self.refs
+                        .values()
+                        .filter(|entry| entry.app_class.eq_ignore_ascii_case(&app_class))
+                        .cloned()
+                        .collect(),
+                )
+            }
+            SelectorQuery::Fuzzy(value) => {
+                // A bare ref id wins before anything else is tried.
+                if let Some(entry) = self.refs.get(&value).cloned() {
+                    return ResolveResult::Match(entry);
+                }
+
+                // Next, a bare window id.
+                if let Some(entry) = self
+                    .window_id_to_ref
+                    .get(&value)
+                    .and_then(|ref_id| self.refs.get(ref_id))
+                    .cloned()
+                {
+                    return ResolveResult::Match(entry);
+                }
+
+                // Finally, a lowercase substring match on class or title.
+                let lower = value.to_lowercase();
+                self.resolve_candidates(
+                    selector,
+                    "fuzzy",
+                    self.refs
+                        .values()
+                        .filter(|entry| {
+                            entry.app_class.to_lowercase().contains(&lower)
+                                || entry.title.to_lowercase().contains(&lower)
+                        })
+                        .cloned()
+                        .collect(),
+                )
+            }
+        }
+    }
+
+    /// Turns a list of matching entries into a `ResolveResult`.
+    ///
+    /// Zero candidates yield `NotFound`, exactly one yields `Match`, and more
+    /// than one yields `Ambiguous` with every candidate converted to a
+    /// `WindowInfo`. `selector` and `mode` are copied into the non-match results.
+    ///
+    /// Candidates are ordered by the numeric part of their `w<N>` ref id so
+    /// that `w2` is listed before `w10`; ref ids that do not follow that
+    /// pattern sort last, ordered by their text.
+    fn resolve_candidates(
+        &self,
+        selector: &str,
+        mode: &'static str,
+        mut candidates: Vec<RefEntry>,
+    ) -> ResolveResult {
+        // A plain string comparison would put "w10" ahead of "w2".
+        candidates.sort_by_cached_key(|entry| {
+            let ordinal = entry
+                .ref_id
+                .strip_prefix('w')
+                .and_then(|digits| digits.parse::<usize>().ok())
+                .unwrap_or(usize::MAX);
+            (ordinal, entry.ref_id.clone())
+        });
+        match candidates.len() {
+            0 => ResolveResult::NotFound {
+                selector: selector.to_string(),
+                mode,
+            },
+            1 => ResolveResult::Match(candidates.remove(0)),
+            _ => ResolveResult::Ambiguous {
+                selector: selector.to_string(),
+                mode,
+                candidates: candidates
+                    .into_iter()
+                    .map(|entry| entry.to_window_info())
+                    .collect(),
+            },
+        }
+    }
+}
+
+impl SelectorQuery {
+    /// Classifies a raw selector string.
+    ///
+    /// Prefixes are tried in this order: `@`, `ref=`, `id=`, `title=`,
+    /// `class=`; the text after the first matching prefix becomes the payload.
+    /// The exact string `focused` selects the focused window, and anything
+    /// else becomes a fuzzy selector carrying the whole input.
+    pub fn parse(selector: &str) -> Self {
+        let prefixed: [(&str, fn(String) -> Self); 5] = [
+            ("@", Self::Ref),
+            ("ref=", Self::Ref),
+            ("id=", Self::WindowId),
+            ("title=", Self::Title),
+            ("class=", Self::Class),
+        ];
+        for (prefix, build) in prefixed {
+            if let Some(value) = selector.strip_prefix(prefix) {
+                return build(value.to_string());
+            }
+        }
+
+        match selector {
+            "focused" => Self::Focused,
+            other => Self::Fuzzy(other.to_string()),
+        }
+    }
+
+    /// Returns `false` for explicit ref selectors and `true` for every other mode.
+    pub fn needs_live_refresh(&self) -> bool {
+        match self {
+            Self::Ref(_) => false,
+            _ => true,
+        }
+    }
+}
+
+impl RefEntry {
+    /// Returns the window's center as `(x, y)`: the origin plus half the
+    /// width and height (integer division).
+    pub fn center(&self) -> (i32, i32) {
+        let half_width = self.width as i32 / 2;
+        let half_height = self.height as i32 / 2;
+        (self.x + half_width, self.y + half_height)
+    }
+
+    /// Builds a `WindowInfo` from this entry; `app_class` is exposed as `app_name`.
+    pub fn to_window_info(&self) -> WindowInfo {
+        let Self {
+            ref_id,
+            window_id,
+            title,
+            app_class,
+            x,
+            y,
+            width,
+            height,
+            focused,
+            minimized,
+            ..
+        } = self;
+
+        WindowInfo {
+            ref_id: ref_id.clone(),
+            window_id: window_id.clone(),
+            title: title.clone(),
+            app_name: app_class.clone(),
+            x: *x,
+            y: *y,
+            width: *width,
+            height: *height,
+            focused: *focused,
+            minimized: *minimized,
+        }
+    }
+}
+
+impl ResolveResult {
+    /// Returns the matched entry for `Match`, and `None` for every other variant.
+    pub fn matched_entry(&self) -> Option<&RefEntry> {
+        if let Self::Match(entry) = self {
+            Some(entry)
+        } else {
+            None
+        }
+    }
+}
+
+// Unit tests for selector parsing and `RefMap` resolution.
+#[cfg(test)]
+mod tests {
+    use super::{RefMap, ResolveResult, SelectorQuery};
+    use crate::backend::BackendWindow;
+
+    /// Builds a 300x200 "TestApp" window at (10, 20); it is focused only when
+    /// `native_id` is 1.
+    fn sample_window(native_id: u32, title: &str) -> BackendWindow {
+        BackendWindow {
+            native_id,
+            title: title.to_string(),
+            app_name: "TestApp".to_string(),
+            x: 10,
+            y: 20,
+            width: 300,
+            height: 200,
+            focused: native_id == 1,
+            minimized: false,
+        }
+    }
+
+    // Rebuilding with the same native id keeps the window id, while ref ids
+    // restart at `w1`.
+    #[test]
+    fn rebuild_assigns_stable_window_ids_for_same_native_window() {
+        let mut refs = RefMap::new();
+        let first = refs.rebuild(&[sample_window(1, "First")]);
+        let second = refs.rebuild(&[sample_window(1, "First Updated")]);
+
+        assert_eq!(first[0].window_id, second[0].window_id);
+        assert_eq!(second[0].ref_id, "w1");
+    }
+
+    // The same window is reachable via `@ref`, a bare window id and `id=<window id>`.
+    #[test]
+    fn resolve_accepts_ref_and_window_id() {
+        let mut refs = RefMap::new();
+        let public = refs.rebuild(&[sample_window(42, "Editor")]);
+        let window_id = public[0].window_id.clone();
+
+        match refs.resolve("@w1") {
+            ResolveResult::Match(entry) => assert_eq!(entry.window_id, window_id),
+            other => panic!("unexpected resolve result: {other:?}"),
+        }
+        match refs.resolve(&window_id) {
+            ResolveResult::Match(entry) => assert_eq!(entry.backend_window_id, 42),
+            other => panic!("unexpected resolve result: {other:?}"),
+        }
+        match refs.resolve(&format!("id={window_id}")) {
+            ResolveResult::Match(entry) => assert_eq!(entry.title, "Editor"),
+            other => panic!("unexpected resolve result: {other:?}"),
+        }
+    }
+
+    // Center of a 300x200 window at (10, 20) is (160, 120).
+    #[test]
+    fn resolve_to_center_uses_window_geometry() {
+        let mut refs = RefMap::new();
+        refs.rebuild(&[sample_window(7, "Browser")]);
+
+        match refs.resolve_to_center("w1") {
+            ResolveResult::Match(entry) => assert_eq!(entry.center(), (160, 120)),
+            other => panic!("unexpected resolve result: {other:?}"),
+        }
+    }
+
+    // Each explicit selector form parses to its dedicated variant.
+    #[test]
+    fn selector_query_parses_explicit_modes() {
+        assert_eq!(
+            SelectorQuery::parse("@w1"),
+            SelectorQuery::Ref("w1".to_string())
+        );
+        assert_eq!(
+            SelectorQuery::parse("ref=w2"),
+            SelectorQuery::Ref("w2".to_string())
+        );
+        assert_eq!(
+            SelectorQuery::parse("id=win4"),
+            SelectorQuery::WindowId("win4".to_string())
+        );
+        assert_eq!(
+            SelectorQuery::parse("title=Chromium"),
+            SelectorQuery::Title("Chromium".to_string())
+        );
+        assert_eq!(
+            SelectorQuery::parse("class=Navigator"),
+            SelectorQuery::Class("Navigator".to_string())
+        );
+        assert_eq!(SelectorQuery::parse("focused"), SelectorQuery::Focused);
+    }
+
+    // `focused`, `title=` and `class=` each pick out a single window; the
+    // class lookup is given in a different letter case than the stored name.
+    #[test]
+    fn resolve_supports_exact_title_class_and_focused_modes() {
+        let mut refs = RefMap::new();
+        refs.rebuild(&[
+            sample_window(1, "Browser"),
+            BackendWindow {
+                native_id: 2,
+                title: "Editor".to_string(),
+                app_name: "Code".to_string(),
+                x: 0,
+                y: 0,
+                width: 10,
+                height: 10,
+                focused: false,
+                minimized: false,
+            },
+        ]);
+
+        match refs.resolve("focused") {
+            ResolveResult::Match(entry) => assert_eq!(entry.title, "Browser"),
+            other => panic!("unexpected resolve result: {other:?}"),
+        }
+        match refs.resolve("title=Editor") {
+            ResolveResult::Match(entry) => assert_eq!(entry.app_class, "Code"),
+            other => panic!("unexpected resolve result: {other:?}"),
+        }
+        match refs.resolve("class=code") {
+            ResolveResult::Match(entry) => assert_eq!(entry.title, "Editor"),
+            other => panic!("unexpected resolve result: {other:?}"),
+        }
+    }
+
+    // A fuzzy selector matching two windows reports both instead of picking one.
+    #[test]
+    fn fuzzy_resolution_fails_with_candidates_when_ambiguous() {
+        let mut refs = RefMap::new();
+        refs.rebuild(&[
+            sample_window(1, "Chromium"),
+            BackendWindow {
+                native_id: 2,
+                title: "Chromium Settings".to_string(),
+                app_name: "Chromium".to_string(),
+                x: 0,
+                y: 0,
+                width: 10,
+                height: 10,
+                focused: false,
+                minimized: false,
+            },
+        ]);
+
+        match refs.resolve("chromium") {
+            ResolveResult::Ambiguous {
+                mode, candidates, ..
+            } => {
+                assert_eq!(mode, "fuzzy");
+                assert_eq!(candidates.len(), 2);
+            }
+            other => panic!("unexpected resolve result: {other:?}"),
+        }
     }
 }
--- a/src/core/session.rs
+++ b/src/core/session.rs
@ -15,14 +15,14 @@ pub fn detect_session() -> Result<SessionType> {
                bail!(
                    "No X11 session detected.\n\
                     XDG_SESSION_TYPE is not set and DISPLAY is not set.\n\
-                     deskctl requires an X11 session. Wayland support coming in v0.2."
+                     deskctl requires an X11 session."
                );
            }
        }
        "wayland" => {
            bail!(
                "Wayland session detected (XDG_SESSION_TYPE=wayland).\n\
-                 deskctl currently supports X11 only. Wayland/Hyprland support coming in v0.2."
+                 deskctl currently supports X11 only."
            );
        }
        other => {
--- a/src/core/types.rs
+++ b/src/core/types.rs
@ -8,10 +8,10 @@ pub struct Snapshot {
 }

 #[allow(dead_code)]
-#[derive(Debug, Serialize, Deserialize)]
+#[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct WindowInfo {
    pub ref_id: String,
-    pub xcb_id: u32,
+    pub window_id: String,
    pub title: String,
    pub app_name: String,
    pub x: i32,
@ -22,6 +22,47 @@ pub struct WindowInfo {
    pub minimized: bool,
 }

+/// Serializable description of a single monitor.
+///
+/// NOTE(review): the code that fills this struct is not visible here; the
+/// field notes below are inferred from the field names — confirm against the
+/// backend that produces them.
+#[allow(dead_code)]
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct MonitorInfo {
+    pub name: String,
+    // Presumably the monitor's origin and size in pixels — TODO confirm.
+    pub x: i32,
+    pub y: i32,
+    pub width: u32,
+    pub height: u32,
+    // Presumably the physical size in millimetres — TODO confirm.
+    pub width_mm: u32,
+    pub height_mm: u32,
+    pub primary: bool,
+    pub automatic: bool,
+}
+
+/// Serializable width/height pair; used as the `screen` field of `SystemInfo`.
+#[allow(dead_code)]
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct ScreenSize {
+    pub width: u32,
+    pub height: u32,
+}
+
+/// Serializable pair of a version string and a backend name.
+///
+/// NOTE(review): presumably the payload of the `get-version` action — confirm
+/// against the handler.
+#[allow(dead_code)]
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct VersionInfo {
+    pub version: String,
+    pub backend: String,
+}
+
+/// Serializable summary of the running environment: backend, session details,
+/// socket path, overall screen size and the list of monitors.
+///
+/// NOTE(review): presumably the payload of the `get-systeminfo` action; the
+/// code that fills it is not visible here — confirm against the handler.
+#[allow(dead_code)]
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct SystemInfo {
+    pub backend: String,
+    // Optional values; presumably taken from the DISPLAY and XDG_SESSION_TYPE
+    // environment variables — TODO confirm.
+    pub display: Option<String>,
+    pub session_type: Option<String>,
+    pub session: String,
+    pub socket_path: String,
+    pub screen: ScreenSize,
+    // Presumably equal to `monitors.len()` — TODO confirm.
+    pub monitor_count: usize,
+    pub monitors: Vec<MonitorInfo>,
+}
+
 impl std::fmt::Display for WindowInfo {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let state = if self.focused {
@ -47,9 +88,21 @@ impl std::fmt::Display for WindowInfo {

 #[allow(dead_code)]
 fn truncate(s: &str, max: usize) -> String {
-    if s.len() <= max {
+    if s.chars().count() <= max {
        s.to_string()
    } else {
-        format!("{}...", &s[..max - 3])
+        let truncated: String = s.chars().take(max.saturating_sub(3)).collect();
+        format!("{truncated}...")
+    }
+}
+
+// Unit tests for `truncate`.
+#[cfg(test)]
+mod tests {
+    use super::truncate;
+
+    #[test]
+    fn truncate_is_char_safe() {
+        // "fire" + U+00E9 + "fox": 8 characters, 9 bytes.
+        let input = format!("fire{}fox", '\u{00E9}');
+        assert_eq!(truncate(&input, 7), "fire...");
+
+        // Fits when measured in characters even though it is longer in bytes.
+        assert_eq!(truncate(&input, 8), input);
+
+        // Five two-byte characters: byte offset `max - 3 = 1` lies inside the
+        // first character, so a byte-indexed cut would panic here.
+        let accented = "\u{00E9}".repeat(5);
+        assert_eq!(truncate(&accented, 4), "\u{00E9}...");
     }
 }
--- a/src/daemon/handler.rs
+++ b/src/daemon/handler.rs
@ -1,13 +1,18 @@
 use std::sync::Arc;
+
+use anyhow::{Context, Result};
 use tokio::sync::Mutex;
+use tokio::time::{sleep, Duration, Instant};

 use super::state::DaemonState;
-use crate::backend::DesktopBackend;
+use crate::backend::annotate::annotate_screenshot;
 use crate::core::protocol::{Request, Response};
-use crate::core::refs::RefEntry;
+use crate::core::refs::{ResolveResult, SelectorQuery};
+use crate::core::types::{MonitorInfo, ScreenSize, Snapshot, SystemInfo, VersionInfo, WindowInfo};

 pub async fn handle_request(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    match request.action.as_str() {
+        "ping" => Response::ok(serde_json::json!({"message": "pong"})),
        "snapshot" => handle_snapshot(request, state).await,
        "click" => handle_click(request, state).await,
        "dblclick" => handle_dblclick(request, state).await,
@ -24,6 +29,12 @@ pub async fn handle_request(request: &Request, state: &Arc<Mutex<DaemonState>>)
        "list-windows" => handle_list_windows(state).await,
        "get-screen-size" => handle_get_screen_size(state).await,
        "get-mouse-position" => handle_get_mouse_position(state).await,
+        "get-active-window" => handle_get_active_window(state).await,
+        "get-monitors" => handle_get_monitors(state).await,
+        "get-version" => handle_get_version(state).await,
+        "get-systeminfo" => handle_get_systeminfo(state).await,
+        "wait-window" => handle_wait(request, state, WaitKind::Window).await,
+        "wait-focus" => handle_wait(request, state, WaitKind::Focus).await,
        "screenshot" => handle_screenshot(request, state).await,
        "launch" => handle_launch(request, state).await,
        action => Response::err(format!("Unknown action: {action}")),
@ -38,152 +49,154 @@ async fn handle_snapshot(request: &Request, state: &Arc<Mutex<DaemonState>>) ->
        .unwrap_or(false);

    let mut state = state.lock().await;
-
-    match state.backend.snapshot(annotate) {
-        Ok(snapshot) => {
-            // Update ref map
-            state.ref_map.clear();
-            for win in &snapshot.windows {
-                state.ref_map.insert(RefEntry {
-                    xcb_id: win.xcb_id,
-                    app_class: win.app_name.clone(),
-                    title: win.title.clone(),
-                    pid: 0, // xcap doesn't expose PID directly in snapshot
-                    x: win.x,
-                    y: win.y,
-                    width: win.width,
-                    height: win.height,
-                    focused: win.focused,
-                    minimized: win.minimized,
-                });
-            }
-
-            Response::ok(serde_json::to_value(&snapshot).unwrap_or_default())
-        }
-        Err(e) => Response::err(format!("Snapshot failed: {e}")),
+    match capture_snapshot(&mut state, annotate, None) {
+        Ok(snapshot) => Response::ok(serde_json::to_value(&snapshot).unwrap_or_default()),
+        Err(error) => Response::err(format!("Snapshot failed: {error}")),
    }
 }

 async fn handle_click(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    let selector = match request.extra.get("selector").and_then(|v| v.as_str()) {
-        Some(s) => s.to_string(),
+        Some(selector) => selector.to_string(),
        None => return Response::err("Missing 'selector' field"),
    };

    let mut state = state.lock().await;
+    let selector_query = SelectorQuery::parse(&selector);

-    // Try to parse as coordinates "x,y"
    if let Some((x, y)) = parse_coords(&selector) {
        return match state.backend.click(x, y) {
            Ok(()) => Response::ok(serde_json::json!({"clicked": {"x": x, "y": y}})),
-            Err(e) => Response::err(format!("Click failed: {e}")),
+            Err(error) => Response::err(format!("Click failed: {error}")),
        };
    }

-    // Resolve as window ref
+    if selector_query.needs_live_refresh() {
+        if let Err(error) = refresh_windows(&mut state) {
+            return Response::err(format!("Click failed: {error}"));
+        }
+    }
+
    match state.ref_map.resolve_to_center(&selector) {
-        Some((x, y)) => match state.backend.click(x, y) {
-            Ok(()) => {
-                Response::ok(serde_json::json!({"clicked": {"x": x, "y": y, "ref": selector}}))
+        ResolveResult::Match(entry) => {
+            let (x, y) = entry.center();
+            match state.backend.click(x, y) {
+                Ok(()) => Response::ok(serde_json::json!({
+                    "clicked": {"x": x, "y": y},
+                    "selector": selector,
+                    "ref_id": entry.ref_id,
+                    "window_id": entry.window_id,
+                    "title": entry.title,
+                })),
+                Err(error) => Response::err(format!("Click failed: {error}")),
            }
-            Err(e) => Response::err(format!("Click failed: {e}")),
-        },
-        None => Response::err(format!("Could not resolve selector: {selector}")),
+        }
+        outcome => selector_failure_response(outcome),
    }
 }

 async fn handle_dblclick(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    let selector = match request.extra.get("selector").and_then(|v| v.as_str()) {
-        Some(s) => s.to_string(),
+        Some(selector) => selector.to_string(),
        None => return Response::err("Missing 'selector' field"),
    };

    let mut state = state.lock().await;
+    let selector_query = SelectorQuery::parse(&selector);

    if let Some((x, y)) = parse_coords(&selector) {
        return match state.backend.dblclick(x, y) {
            Ok(()) => Response::ok(serde_json::json!({"double_clicked": {"x": x, "y": y}})),
-            Err(e) => Response::err(format!("Double-click failed: {e}")),
+            Err(error) => Response::err(format!("Double-click failed: {error}")),
        };
    }

+    if selector_query.needs_live_refresh() {
+        if let Err(error) = refresh_windows(&mut state) {
+            return Response::err(format!("Double-click failed: {error}"));
+        }
+    }
+
    match state.ref_map.resolve_to_center(&selector) {
-        Some((x, y)) => match state.backend.dblclick(x, y) {
-            Ok(()) => Response::ok(
-                serde_json::json!({"double_clicked": {"x": x, "y": y, "ref": selector}}),
-            ),
-            Err(e) => Response::err(format!("Double-click failed: {e}")),
-        },
-        None => Response::err(format!("Could not resolve selector: {selector}")),
+        ResolveResult::Match(entry) => {
+            let (x, y) = entry.center();
+            match state.backend.dblclick(x, y) {
+                Ok(()) => Response::ok(serde_json::json!({
+                    "double_clicked": {"x": x, "y": y},
+                    "selector": selector,
+                    "ref_id": entry.ref_id,
+                    "window_id": entry.window_id,
+                    "title": entry.title,
+                })),
+                Err(error) => Response::err(format!("Double-click failed: {error}")),
+            }
+        }
+        outcome => selector_failure_response(outcome),
    }
 }

 async fn handle_type(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    let text = match request.extra.get("text").and_then(|v| v.as_str()) {
-        Some(t) => t.to_string(),
+        Some(text) => text.to_string(),
        None => return Response::err("Missing 'text' field"),
    };

    let mut state = state.lock().await;
-
    match state.backend.type_text(&text) {
        Ok(()) => Response::ok(serde_json::json!({"typed": text})),
-        Err(e) => Response::err(format!("Type failed: {e}")),
+        Err(error) => Response::err(format!("Type failed: {error}")),
    }
 }

 async fn handle_press(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    let key = match request.extra.get("key").and_then(|v| v.as_str()) {
-        Some(k) => k.to_string(),
+        Some(key) => key.to_string(),
        None => return Response::err("Missing 'key' field"),
    };

    let mut state = state.lock().await;
-
    match state.backend.press_key(&key) {
        Ok(()) => Response::ok(serde_json::json!({"pressed": key})),
-        Err(e) => Response::err(format!("Key press failed: {e}")),
+        Err(error) => Response::err(format!("Key press failed: {error}")),
    }
 }

 async fn handle_hotkey(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    let keys: Vec<String> = match request.extra.get("keys").and_then(|v| v.as_array()) {
-        Some(arr) => arr
+        Some(keys) => keys
            .iter()
-            .filter_map(|v| v.as_str().map(|s| s.to_string()))
+            .filter_map(|value| value.as_str().map(|s| s.to_string()))
            .collect(),
        None => return Response::err("Missing 'keys' field"),
    };

    let mut state = state.lock().await;
-
    match state.backend.hotkey(&keys) {
        Ok(()) => Response::ok(serde_json::json!({"hotkey": keys})),
-        Err(e) => Response::err(format!("Hotkey failed: {e}")),
+        Err(error) => Response::err(format!("Hotkey failed: {error}")),
    }
 }

 async fn handle_mouse_move(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    let x = match request.extra.get("x").and_then(|v| v.as_i64()) {
-        Some(v) => v as i32,
+        Some(value) => value as i32,
        None => return Response::err("Missing 'x' field"),
    };
    let y = match request.extra.get("y").and_then(|v| v.as_i64()) {
-        Some(v) => v as i32,
+        Some(value) => value as i32,
        None => return Response::err("Missing 'y' field"),
    };

    let mut state = state.lock().await;
-
    match state.backend.mouse_move(x, y) {
        Ok(()) => Response::ok(serde_json::json!({"moved": {"x": x, "y": y}})),
-        Err(e) => Response::err(format!("Mouse move failed: {e}")),
+        Err(error) => Response::err(format!("Mouse move failed: {error}")),
    }
 }

 async fn handle_mouse_scroll(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    let amount = match request.extra.get("amount").and_then(|v| v.as_i64()) {
-        Some(v) => v as i32,
+        Some(value) => value as i32,
        None => return Response::err("Missing 'amount' field"),
    };
    let axis = request
@ -194,33 +207,31 @@ async fn handle_mouse_scroll(request: &Request, state: &Arc<Mutex<DaemonState>>)
        .to_string();

    let mut state = state.lock().await;
-
    match state.backend.scroll(amount, &axis) {
        Ok(()) => Response::ok(serde_json::json!({"scrolled": {"amount": amount, "axis": axis}})),
-        Err(e) => Response::err(format!("Scroll failed: {e}")),
+        Err(error) => Response::err(format!("Scroll failed: {error}")),
    }
 }

 async fn handle_mouse_drag(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    let x1 = match request.extra.get("x1").and_then(|v| v.as_i64()) {
-        Some(v) => v as i32,
+        Some(value) => value as i32,
        None => return Response::err("Missing 'x1' field"),
    };
    let y1 = match request.extra.get("y1").and_then(|v| v.as_i64()) {
-        Some(v) => v as i32,
+        Some(value) => value as i32,
        None => return Response::err("Missing 'y1' field"),
    };
    let x2 = match request.extra.get("x2").and_then(|v| v.as_i64()) {
-        Some(v) => v as i32,
+        Some(value) => value as i32,
        None => return Response::err("Missing 'x2' field"),
    };
    let y2 = match request.extra.get("y2").and_then(|v| v.as_i64()) {
-        Some(v) => v as i32,
+        Some(value) => value as i32,
        None => return Response::err("Missing 'y2' field"),
    };

    let mut state = state.lock().await;
-
    match state.backend.drag(x1, y1, x2, y2) {
        Ok(()) => Response::ok(serde_json::json!({
            "dragged": {
@ -228,7 +239,7 @@ async fn handle_mouse_drag(request: &Request, state: &Arc<Mutex<DaemonState>>) -
                "to": {"x": x2, "y": y2}
            }
        })),
-        Err(e) => Response::err(format!("Drag failed: {e}")),
+        Err(error) => Response::err(format!("Drag failed: {error}")),
    }
 }

@ -238,20 +249,25 @@ async fn handle_window_action(
    action: &str,
 ) -> Response {
    let selector = match request.extra.get("selector").and_then(|v| v.as_str()) {
-        Some(s) => s.to_string(),
+        Some(selector) => selector.to_string(),
        None => return Response::err("Missing 'selector' field"),
    };

    let mut state = state.lock().await;
-
+    let selector_query = SelectorQuery::parse(&selector);
+    if selector_query.needs_live_refresh() {
+        if let Err(error) = refresh_windows(&mut state) {
+            return Response::err(format!("{action} failed: {error}"));
+        }
+    }
    let entry = match state.ref_map.resolve(&selector) {
-        Some(e) => e.clone(),
-        None => return Response::err(format!("Could not resolve window: {selector}")),
+        ResolveResult::Match(entry) => entry,
+        outcome => return selector_failure_response(outcome),
    };

    let result = match action {
-        "focus" => state.backend.focus_window(entry.xcb_id),
-        "close" => state.backend.close_window(entry.xcb_id),
+        "focus" => state.backend.focus_window(entry.backend_window_id),
+        "close" => state.backend.close_window(entry.backend_window_id),
        _ => unreachable!(),
    };

@ -259,96 +275,107 @@ async fn handle_window_action(
        Ok(()) => Response::ok(serde_json::json!({
            "action": action,
            "window": entry.title,
-            "xcb_id": entry.xcb_id,
+            "title": entry.title,
+            "ref_id": entry.ref_id,
+            "window_id": entry.window_id,
+            "selector": selector,
        })),
-        Err(e) => Response::err(format!("{action} failed: {e}")),
+        Err(error) => Response::err(format!("{action} failed: {error}")),
    }
 }

+/// Moves the window matched by `selector` to the requested `x`/`y` position.
+///
+/// `selector` is required. `x` and `y` default to 0 when absent or not an
+/// integer. The window list is refreshed first when the parsed selector reports
+/// that it needs live data; unresolved selectors are reported through
+/// `selector_failure_response`.
 async fn handle_move_window(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    let selector = match request.extra.get("selector").and_then(|v| v.as_str()) {
-        Some(s) => s.to_string(),
+        Some(selector) => selector.to_string(),
        None => return Response::err("Missing 'selector' field"),
    };
    let x = request.extra.get("x").and_then(|v| v.as_i64()).unwrap_or(0) as i32;
    let y = request.extra.get("y").and_then(|v| v.as_i64()).unwrap_or(0) as i32;

    let mut state = state.lock().await;
+    let selector_query = SelectorQuery::parse(&selector);
+    if selector_query.needs_live_refresh() {
+        if let Err(error) = refresh_windows(&mut state) {
+            return Response::err(format!("Move failed: {error}"));
+        }
+    }
    let entry = match state.ref_map.resolve(&selector) {
-        Some(e) => e.clone(),
-        None => return Response::err(format!("Could not resolve window: {selector}")),
+        ResolveResult::Match(entry) => entry,
+        outcome => return selector_failure_response(outcome),
    };

-    match state.backend.move_window(entry.xcb_id, x, y) {
+    match state.backend.move_window(entry.backend_window_id, x, y) {
        Ok(()) => Response::ok(serde_json::json!({
-            "moved": entry.title, "x": x, "y": y
+            "moved": entry.title,
+            "title": entry.title,
+            "ref_id": entry.ref_id,
+            "window_id": entry.window_id,
+            "selector": selector,
+            "x": x,
+            "y": y,
        })),
-        Err(e) => Response::err(format!("Move failed: {e}")),
+        Err(error) => Response::err(format!("Move failed: {error}")),
    }
 }

+/// Resizes the window matched by `selector`.
+///
+/// `selector` is required. The size is read from the `w` and `h` request
+/// fields; a missing or non-`u64` value falls back to 800 (width) or 600
+/// (height). The window list is refreshed first when the parsed selector
+/// reports that it needs live data.
 async fn handle_resize_window(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    let selector = match request.extra.get("selector").and_then(|v| v.as_str()) {
-        Some(s) => s.to_string(),
+        Some(selector) => selector.to_string(),
        None => return Response::err("Missing 'selector' field"),
    };
-    let w = request
+    let width = request
        .extra
        .get("w")
        .and_then(|v| v.as_u64())
        .unwrap_or(800) as u32;
-    let h = request
+    let height = request
        .extra
        .get("h")
        .and_then(|v| v.as_u64())
        .unwrap_or(600) as u32;

    let mut state = state.lock().await;
+    let selector_query = SelectorQuery::parse(&selector);
+    if selector_query.needs_live_refresh() {
+        if let Err(error) = refresh_windows(&mut state) {
+            return Response::err(format!("Resize failed: {error}"));
+        }
+    }
    let entry = match state.ref_map.resolve(&selector) {
-        Some(e) => e.clone(),
-        None => return Response::err(format!("Could not resolve window: {selector}")),
+        ResolveResult::Match(entry) => entry,
+        outcome => return selector_failure_response(outcome),
    };

-    match state.backend.resize_window(entry.xcb_id, w, h) {
+    match state
+        .backend
+        .resize_window(entry.backend_window_id, width, height)
+    {
        Ok(()) => Response::ok(serde_json::json!({
-            "resized": entry.title, "width": w, "height": h
+            "resized": entry.title,
+            "title": entry.title,
+            "ref_id": entry.ref_id,
+            "window_id": entry.window_id,
+            "selector": selector,
+            "width": width,
+            "height": height,
        })),
-        Err(e) => Response::err(format!("Resize failed: {e}")),
+        Err(error) => Response::err(format!("Resize failed: {error}")),
    }
 }

+/// Refreshes the window list via `refresh_windows` and returns it under the
+/// `windows` key; a refresh error is reported as "List windows failed: ...".
 async fn handle_list_windows(state: &Arc<Mutex<DaemonState>>) -> Response {
    let mut state = state.lock().await;
-    // Re-run snapshot without screenshot, just to get current window list
-    match state.backend.snapshot(false) {
-        Ok(snapshot) => {
-            // Update ref map with fresh data
-            state.ref_map.clear();
-            for win in &snapshot.windows {
-                state.ref_map.insert(RefEntry {
-                    xcb_id: win.xcb_id,
-                    app_class: win.app_name.clone(),
-                    title: win.title.clone(),
-                    pid: 0,
-                    x: win.x,
-                    y: win.y,
-                    width: win.width,
-                    height: win.height,
-                    focused: win.focused,
-                    minimized: win.minimized,
-                });
-            }
-            Response::ok(serde_json::json!({"windows": snapshot.windows}))
-        }
-        Err(e) => Response::err(format!("List windows failed: {e}")),
+    match refresh_windows(&mut state) {
+        Ok(windows) => Response::ok(serde_json::json!({"windows": windows})),
+        Err(error) => Response::err(format!("List windows failed: {error}")),
    }
 }

+/// Returns the backend's screen size as `{"width", "height"}`.
 async fn handle_get_screen_size(state: &Arc<Mutex<DaemonState>>) -> Response {
    let state = state.lock().await;
    match state.backend.screen_size() {
-        Ok((w, h)) => Response::ok(serde_json::json!({"width": w, "height": h})),
-        Err(e) => Response::err(format!("Failed: {e}")),
+        Ok((width, height)) => Response::ok(serde_json::json!({"width": width, "height": height})),
+        Err(error) => Response::err(format!("Failed: {error}")),
    }
 }

@ -356,10 +383,189 @@ async fn handle_get_mouse_position(state: &Arc<Mutex<DaemonState>>) -> Response
    let state = state.lock().await;
    match state.backend.mouse_position() {
        Ok((x, y)) => Response::ok(serde_json::json!({"x": x, "y": y})),
-        Err(e) => Response::err(format!("Failed: {e}")),
+        Err(error) => Response::err(format!("Failed: {error}")),
    }
 }

+/// Reports the currently active window.
+///
+/// The backend is asked for its active window first, then the window list is
+/// refreshed. If the backend's window matches a reference-map entry (compared
+/// on `backend_window_id`), that entry is returned; otherwise the first
+/// refreshed window flagged `focused` is used. When neither yields a window, a
+/// `not_found` error with mode `focused` is returned.
+async fn handle_get_active_window(state: &Arc<Mutex<DaemonState>>) -> Response {
+    let mut state = state.lock().await;
+
+    let backend_active = match state.backend.active_window() {
+        Ok(window) => window,
+        Err(error) => return Response::err(format!("Failed: {error}")),
+    };
+    let windows = match refresh_windows(&mut state) {
+        Ok(windows) => windows,
+        Err(error) => return Response::err(format!("Failed: {error}")),
+    };
+
+    // Fallback used whenever the backend's window cannot be mapped to an entry.
+    let first_focused = || windows.iter().find(|window| window.focused).cloned();
+
+    let active_window = backend_active
+        .and_then(|active| {
+            state.ref_map.entries().find_map(|(_, entry)| {
+                if entry.backend_window_id == active.native_id {
+                    Some(entry.to_window_info())
+                } else {
+                    None
+                }
+            })
+        })
+        .or_else(first_focused);
+
+    match active_window {
+        Some(window) => Response::ok(serde_json::json!({"window": window})),
+        None => Response::err_with_data(
+            "No focused window is available",
+            serde_json::json!({"kind": "not_found", "mode": "focused"}),
+        ),
+    }
+}
+
+/// Lists the backend's monitors, returning them with a `count` field.
+async fn handle_get_monitors(state: &Arc<Mutex<DaemonState>>) -> Response {
+    let state = state.lock().await;
+
+    let monitors: Vec<MonitorInfo> = match state.backend.list_monitors() {
+        Ok(found) => found.into_iter().map(Into::into).collect(),
+        Err(error) => return Response::err(format!("Failed: {error}")),
+    };
+
+    Response::ok(serde_json::json!({
+        "count": monitors.len(),
+        "monitors": monitors,
+    }))
+}
+
+/// Returns the crate version (from `CARGO_PKG_VERSION`) and the backend name.
+///
+/// If serialization of the payload fails, the default JSON value is sent.
+async fn handle_get_version(state: &Arc<Mutex<DaemonState>>) -> Response {
+    let backend = {
+        let state = state.lock().await;
+        state.backend.backend_name().to_string()
+    };
+    let version = env!("CARGO_PKG_VERSION").to_string();
+
+    let payload = serde_json::to_value(VersionInfo { version, backend }).unwrap_or_default();
+    Response::ok(payload)
+}
+
+/// Collects backend, session, display and monitor details into a `SystemInfo`.
+///
+/// `DISPLAY` and `XDG_SESSION_TYPE` are reported only when set and non-empty.
+/// A failure to query the screen size or the monitor list aborts the request.
+async fn handle_get_systeminfo(state: &Arc<Mutex<DaemonState>>) -> Response {
+    // Treats an unset variable and an empty one the same way.
+    let non_empty_env = |name: &str| std::env::var(name).ok().filter(|value| !value.is_empty());
+
+    let state = state.lock().await;
+    let (width, height) = match state.backend.screen_size() {
+        Ok(size) => size,
+        Err(error) => return Response::err(format!("Failed: {error}")),
+    };
+    let monitors: Vec<_> = match state.backend.list_monitors() {
+        Ok(found) => found.into_iter().map(Into::into).collect(),
+        Err(error) => return Response::err(format!("Failed: {error}")),
+    };
+    let monitor_count = monitors.len();
+
+    let info = SystemInfo {
+        backend: state.backend.backend_name().to_string(),
+        display: non_empty_env("DISPLAY"),
+        session_type: non_empty_env("XDG_SESSION_TYPE"),
+        session: state.session.clone(),
+        socket_path: state.socket_path.display().to_string(),
+        screen: ScreenSize { width, height },
+        monitor_count,
+        monitors,
+    };
+
+    Response::ok(serde_json::to_value(info).unwrap_or_default())
+}
+
+/// Polls the window list until `selector` satisfies `wait_kind` or time runs out.
+///
+/// Request fields:
+/// - `selector` (required string): the window selector to resolve on each poll.
+/// - `timeout_ms` (optional, default 10 000): overall time budget.
+/// - `poll_ms` (optional, default 250): pause between polls. Values below 1 ms
+///   are raised to 1 ms so the loop cannot spin on the state lock.
+///
+/// Every iteration refreshes the window list under the state lock, releases the
+/// lock, and then sleeps. The sleep is clamped to the time remaining so the call
+/// does not overrun `timeout_ms` by a whole poll interval. On timeout the last
+/// retryable observation is included in the error payload.
+async fn handle_wait(
+    request: &Request,
+    state: &Arc<Mutex<DaemonState>>,
+    wait_kind: WaitKind,
+) -> Response {
+    let selector = match request.extra.get("selector").and_then(|v| v.as_str()) {
+        Some(selector) => selector.to_string(),
+        None => return Response::err("Missing 'selector' field"),
+    };
+    let timeout_ms = request
+        .extra
+        .get("timeout_ms")
+        .and_then(|v| v.as_u64())
+        .unwrap_or(10_000);
+    let poll_ms = request
+        .extra
+        .get("poll_ms")
+        .and_then(|v| v.as_u64())
+        .unwrap_or(250);
+
+    let start = Instant::now();
+    let timeout = Duration::from_millis(timeout_ms);
+    // A zero interval would busy-loop on the lock and the backend.
+    let poll_interval = Duration::from_millis(poll_ms.max(1));
+
+    loop {
+        // Hold the lock only for the refresh + observation, never across the sleep.
+        let outcome = {
+            let mut state = state.lock().await;
+            if let Err(error) = refresh_windows(&mut state) {
+                return Response::err(format!("Wait failed: {error}"));
+            }
+            observe_wait(&state, &selector, wait_kind)
+        };
+
+        let last_observation = match outcome {
+            WaitObservation::Satisfied(window) => {
+                let elapsed_ms = start.elapsed().as_millis() as u64;
+                return Response::ok(serde_json::json!({
+                    "wait": wait_kind.as_str(),
+                    "selector": selector,
+                    "elapsed_ms": elapsed_ms,
+                    "window": window,
+                }));
+            }
+            WaitObservation::Retry { observation } => observation,
+            WaitObservation::Failure(response) => return response,
+        };
+
+        let elapsed = start.elapsed();
+        if elapsed >= timeout {
+            return Response::err_with_data(
+                format!(
+                    "Timed out waiting for {} to match selector: {}",
+                    wait_kind.as_str(),
+                    selector
+                ),
+                serde_json::json!({
+                    "kind": "timeout",
+                    "wait": wait_kind.as_str(),
+                    "selector": selector,
+                    "timeout_ms": timeout_ms,
+                    "poll_ms": poll_ms,
+                    "last_observation": last_observation,
+                }),
+            );
+        }
+
+        // Never sleep past the deadline: one final poll happens right at it.
+        let remaining = timeout.saturating_sub(elapsed);
+        sleep(poll_interval.min(remaining)).await;
+    }
+}
+
+/// Condition a wait request polls for.
+#[derive(Clone, Copy)]
+enum WaitKind {
+    /// Satisfied as soon as the selector resolves to a window.
+    Window,
+    /// Satisfied once the resolved window is also focused.
+    Focus,
+}
+
+impl WaitKind {
+    /// Name used for this kind in response payloads and messages.
+    fn as_str(self) -> &'static str {
+        match self {
+            WaitKind::Focus => "focus",
+            WaitKind::Window => "window",
+        }
+    }
+}
+
+/// Result of a single poll performed while waiting on a selector.
+enum WaitObservation {
+    /// The wait condition holds; carries the matching window.
+    Satisfied(WindowInfo),
+    /// Not satisfied yet; `observation` describes what was seen on this poll.
+    Retry { observation: serde_json::Value },
+    /// Polling cannot succeed; carries the response to return immediately.
+    Failure(Response),
+}
+
 async fn handle_screenshot(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    let annotate = request
        .extra
@ -370,50 +576,214 @@ async fn handle_screenshot(request: &Request, state: &Arc<Mutex<DaemonState>>) -
        .extra
        .get("path")
        .and_then(|v| v.as_str())
-        .map(|s| s.to_string())
-        .unwrap_or_else(|| {
-            let ts = std::time::SystemTime::now()
-                .duration_since(std::time::UNIX_EPOCH)
-                .unwrap_or_default()
-                .as_millis();
-            format!("/tmp/deskctl-{ts}.png")
-        });
+        .map(|value| value.to_string())
+        .unwrap_or_else(temp_screenshot_path);
+
    let mut state = state.lock().await;
-    match state.backend.screenshot(&path, annotate) {
-        Ok(saved) => Response::ok(serde_json::json!({"screenshot": saved})),
-        Err(e) => Response::err(format!("Screenshot failed: {e}")),
+    let windows = if annotate {
+        match refresh_windows(&mut state) {
+            Ok(windows) => Some(windows),
+            Err(error) => return Response::err(format!("Screenshot failed: {error}")),
+        }
+    } else {
+        None
+    };
+
+    match capture_and_save_screenshot(&mut state, &path, annotate, windows.as_deref()) {
+        Ok(saved) => {
+            if let Some(windows) = windows {
+                Response::ok(serde_json::json!({"screenshot": saved, "windows": windows}))
+            } else {
+                Response::ok(serde_json::json!({"screenshot": saved}))
+            }
+        }
+        Err(error) => Response::err(format!("Screenshot failed: {error}")),
    }
 }

+/// Launches `command` through the backend and returns the spawned PID.
+///
+/// `command` is required. `args` is an optional array; non-string elements are
+/// dropped and a missing or non-array value is treated as no arguments.
 async fn handle_launch(request: &Request, state: &Arc<Mutex<DaemonState>>) -> Response {
    let command = match request.extra.get("command").and_then(|v| v.as_str()) {
-        Some(c) => c.to_string(),
+        Some(command) => command.to_string(),
        None => return Response::err("Missing 'command' field"),
    };
    let args: Vec<String> = request
        .extra
        .get("args")
        .and_then(|v| v.as_array())
-        .map(|arr| {
-            arr.iter()
-                .filter_map(|v| v.as_str().map(String::from))
+        .map(|args| {
+            args.iter()
+                .filter_map(|value| value.as_str().map(String::from))
                .collect()
        })
        .unwrap_or_default();
+
    let state = state.lock().await;
    match state.backend.launch(&command, &args) {
        Ok(pid) => Response::ok(serde_json::json!({"pid": pid, "command": command})),
-        Err(e) => Response::err(format!("Launch failed: {e}")),
+        Err(error) => Response::err(format!("Launch failed: {error}")),
    }
 }

-fn parse_coords(s: &str) -> Option<(i32, i32)> {
-    let parts: Vec<&str> = s.split(',').collect();
-    if parts.len() == 2 {
-        let x = parts[0].trim().parse().ok()?;
-        let y = parts[1].trim().parse().ok()?;
-        Some((x, y))
-    } else {
-        None
+/// Queries the backend for its current windows and rebuilds the reference map
+/// from them, returning whatever `RefMap::rebuild` produces.
+fn refresh_windows(state: &mut DaemonState) -> Result<Vec<WindowInfo>> {
+    let live_windows = state.backend.list_windows()?;
+    let rebuilt = state.ref_map.rebuild(&live_windows);
+    Ok(rebuilt)
+}
+
+/// Converts a non-matching `ResolveResult` into a structured error response.
+///
+/// Each variant maps to a message plus a JSON payload whose `kind` is
+/// `selector_not_found`, `selector_ambiguous` or `selector_invalid`.
+/// Must not be called with `ResolveResult::Match`; that arm is unreachable.
+fn selector_failure_response(result: ResolveResult) -> Response {
+    let (message, data) = match result {
+        ResolveResult::NotFound { selector, mode } => (
+            format!("Could not resolve selector: {selector}"),
+            serde_json::json!({
+                "kind": "selector_not_found",
+                "selector": selector,
+                "mode": mode,
+            }),
+        ),
+        ResolveResult::Ambiguous {
+            selector,
+            mode,
+            candidates,
+        } => (
+            format!("Selector is ambiguous: {selector}"),
+            serde_json::json!({
+                "kind": "selector_ambiguous",
+                "selector": selector,
+                "mode": mode,
+                "candidates": candidates,
+            }),
+        ),
+        ResolveResult::Invalid {
+            selector,
+            mode,
+            message,
+        } => (
+            format!("Invalid selector '{selector}': {message}"),
+            serde_json::json!({
+                "kind": "selector_invalid",
+                "selector": selector,
+                "mode": mode,
+                "message": message,
+            }),
+        ),
+        ResolveResult::Match(_) => unreachable!(),
+    };
+
+    Response::err_with_data(message, data)
+}
+
+/// Resolves `selector` once and classifies the result for a wait loop.
+///
+/// - A match satisfies `WaitKind::Window` immediately, and `WaitKind::Focus`
+///   only when the window is focused (otherwise a `window_not_focused` retry).
+/// - A selector that is not found is retryable.
+/// - Ambiguous or invalid selectors are terminal failures, reported with the
+///   same payload that `selector_failure_response` builds.
+fn observe_wait(state: &DaemonState, selector: &str, wait_kind: WaitKind) -> WaitObservation {
+    match state.ref_map.resolve(selector) {
+        ResolveResult::Match(entry) => {
+            let window = entry.to_window_info();
+            let satisfied = match wait_kind {
+                WaitKind::Window => true,
+                WaitKind::Focus => window.focused,
+            };
+            if satisfied {
+                WaitObservation::Satisfied(window)
+            } else {
+                WaitObservation::Retry {
+                    observation: serde_json::json!({
+                        "kind": "window_not_focused",
+                        "window": window,
+                    }),
+                }
+            }
+        }
+        ResolveResult::NotFound { selector, mode } => WaitObservation::Retry {
+            observation: serde_json::json!({
+                "kind": "selector_not_found",
+                "selector": selector,
+                "mode": mode,
+            }),
+        },
+        // Only `Ambiguous` and `Invalid` reach this arm.
+        failure => WaitObservation::Failure(selector_failure_response(failure)),
+    }
+}
+
+/// Refreshes the window list, captures a screenshot and bundles both.
+///
+/// The screenshot is written to `path`, or to a generated temporary path when
+/// `path` is `None`. The refreshed windows are passed along for annotation.
+fn capture_snapshot(
+    state: &mut DaemonState,
+    annotate: bool,
+    path: Option<String>,
+) -> Result<Snapshot> {
+    let windows = refresh_windows(state)?;
+    let target = match path {
+        Some(requested) => requested,
+        None => temp_screenshot_path(),
+    };
+    let screenshot =
+        capture_and_save_screenshot(state, &target, annotate, Some(windows.as_slice()))?;
+
+    Ok(Snapshot {
+        screenshot,
+        windows,
+    })
+}
+
+/// Captures a screenshot from the backend, optionally annotates it, and saves
+/// it to `path`, returning that path as a `String`.
+///
+/// When `annotate` is true, `windows` must be `Some`; otherwise an error is
+/// returned before anything is written.
+fn capture_and_save_screenshot(
+    state: &mut DaemonState,
+    path: &str,
+    annotate: bool,
+    windows: Option<&[WindowInfo]>,
+) -> Result<String> {
+    let mut frame = state.backend.capture_screenshot()?;
+
+    if annotate {
+        let overlay_windows =
+            windows.context("Annotated screenshots require current window data")?;
+        annotate_screenshot(&mut frame, overlay_windows);
+    }
+
+    frame
+        .save(path)
+        .with_context(|| format!("Failed to save screenshot to {path}"))?;
+
+    Ok(path.to_string())
+}
+
+/// Builds a `/tmp/deskctl-<millis>.png` path from the current Unix time.
+///
+/// If the clock reads earlier than the Unix epoch, the timestamp is 0.
+fn temp_screenshot_path() -> String {
+    use std::time::{SystemTime, UNIX_EPOCH};
+
+    let since_epoch = SystemTime::now()
+        .duration_since(UNIX_EPOCH)
+        .unwrap_or_default();
+    format!("/tmp/deskctl-{}.png", since_epoch.as_millis())
+}
+
+/// Parses an `"x,y"` string into a pair of `i32` coordinates.
+///
+/// Whitespace around each number is ignored. Returns `None` unless the input
+/// has exactly one comma separating two valid integers.
+fn parse_coords(value: &str) -> Option<(i32, i32)> {
+    // With more than one comma the remainder still contains a comma and fails
+    // to parse, so inputs such as "1,2,3" are rejected.
+    let (x_text, y_text) = value.split_once(',')?;
+    let x = x_text.trim().parse::<i32>().ok()?;
+    let y = y_text.trim().parse::<i32>().ok()?;
+    Some((x, y))
+}
+
+/// Field-by-field conversion from the backend's monitor description.
+impl From<crate::backend::BackendMonitor> for MonitorInfo {
+    fn from(monitor: crate::backend::BackendMonitor) -> Self {
+        MonitorInfo {
+            name: monitor.name,
+            x: monitor.x,
+            y: monitor.y,
+            width: monitor.width,
+            height: monitor.height,
+            width_mm: monitor.width_mm,
+            height_mm: monitor.height_mm,
+            primary: monitor.primary,
+            automatic: monitor.automatic,
+        }
    }
 }
--- a/src/daemon/mod.rs
+++ b/src/daemon/mod.rs
@ -1,7 +1,7 @@
 mod handler;
 mod state;

-use std::path::PathBuf;
+use std::path::{Path, PathBuf};
 use std::sync::Arc;

 use anyhow::{Context, Result};
@ -9,9 +9,33 @@ use tokio::io::{AsyncBufReadExt, AsyncWriteExt, BufReader};
 use tokio::net::UnixListener;
 use tokio::sync::Mutex;

+use crate::core::paths::{pid_path_from_env, socket_path_from_env};
 use crate::core::session;
 use state::DaemonState;

+/// Removes the daemon's socket file (and PID file, if any) when dropped.
+struct RuntimePathsGuard {
+    socket_path: PathBuf,
+    pid_path: Option<PathBuf>,
+}
+
+impl RuntimePathsGuard {
+    /// Takes ownership of the paths to clean up on drop.
+    fn new(socket_path: PathBuf, pid_path: Option<PathBuf>) -> Self {
+        RuntimePathsGuard {
+            socket_path,
+            pid_path,
+        }
+    }
+}
+
+impl Drop for RuntimePathsGuard {
+    fn drop(&mut self) {
+        // Socket first, then the optional PID file.
+        remove_runtime_path(&self.socket_path);
+        if let Some(pid_path) = self.pid_path.as_deref() {
+            remove_runtime_path(pid_path);
+        }
+    }
+}
+
 pub fn run() -> Result<()> {
    // Validate session before starting
    session::detect_session()?;
@ -24,31 +48,29 @@ pub fn run() -> Result<()> {
 }

 async fn async_run() -> Result<()> {
-    let socket_path = std::env::var("DESKCTL_SOCKET_PATH")
-        .map(PathBuf::from)
-        .context("DESKCTL_SOCKET_PATH not set")?;
-
-    let pid_path = std::env::var("DESKCTL_PID_PATH").map(PathBuf::from).ok();
+    let socket_path = socket_path_from_env().context("DESKCTL_SOCKET_PATH not set")?;
+    let pid_path = pid_path_from_env();

    // Clean up stale socket
    if socket_path.exists() {
        std::fs::remove_file(&socket_path)?;
    }

-    // Write PID file
-    if let Some(ref pid_path) = pid_path {
-        std::fs::write(pid_path, std::process::id().to_string())?;
-    }
-
-    let listener = UnixListener::bind(&socket_path)
-        .context(format!("Failed to bind socket: {}", socket_path.display()))?;
-
    let session = std::env::var("DESKCTL_SESSION").unwrap_or_else(|_| "default".to_string());
    let state = Arc::new(Mutex::new(
        DaemonState::new(session, socket_path.clone())
            .context("Failed to initialize daemon state")?,
    ));

+    let listener = UnixListener::bind(&socket_path)
+        .context(format!("Failed to bind socket: {}", socket_path.display()))?;
+    let _runtime_paths = RuntimePathsGuard::new(socket_path.clone(), pid_path.clone());
+
+    // Write PID file only after the daemon is ready to serve requests.
+    if let Some(ref pid_path) = pid_path {
+        std::fs::write(pid_path, std::process::id().to_string())?;
+    }
+
    let shutdown = Arc::new(tokio::sync::Notify::new());
    let shutdown_clone = shutdown.clone();

@ -77,14 +99,6 @@ async fn async_run() -> Result<()> {
        }
    }

-    // Cleanup
-    if socket_path.exists() {
-        let _ = std::fs::remove_file(&socket_path);
-    }
-    if let Some(ref pid_path) = pid_path {
-        let _ = std::fs::remove_file(pid_path);
-    }
-
    Ok(())
 }

@ -125,3 +139,11 @@ async fn handle_connection(

    Ok(())
 }
+
+/// Deletes `path`, ignoring a file that is already gone.
+///
+/// Any other failure is reported on stderr rather than propagated.
+fn remove_runtime_path(path: &Path) {
+    match std::fs::remove_file(path) {
+        Ok(()) => {}
+        Err(error) if error.kind() == std::io::ErrorKind::NotFound => {}
+        Err(error) => {
+            eprintln!("Failed to remove runtime path {}: {error}", path.display());
+        }
+    }
+}
--- a/src/daemon/state.rs
+++ b/src/daemon/state.rs
@ -1,6 +1,6 @@
 use std::path::PathBuf;

-use crate::backend::x11::X11Backend;
+use crate::backend::{x11::X11Backend, DesktopBackend};
 use crate::core::refs::RefMap;

 #[allow(dead_code)]
@ -8,12 +8,12 @@ pub struct DaemonState {
    pub session: String,
    pub socket_path: PathBuf,
    pub ref_map: RefMap,
-    pub backend: X11Backend,
+    pub backend: Box<dyn DesktopBackend>,
 }

 impl DaemonState {
    pub fn new(session: String, socket_path: PathBuf) -> anyhow::Result<Self> {
-        let backend = X11Backend::new()?;
+        let backend: Box<dyn DesktopBackend> = Box::new(X11Backend::new()?);
        Ok(Self {
            session,
            socket_path,
--- a/src/lib.rs
+++ b/src/lib.rs
@ -0,0 +1,11 @@
+pub mod backend;
+pub mod cli;
+pub mod core;
+pub mod daemon;
+
+/// Library entry point: runs the daemon when `DESKCTL_DAEMON` is readable from
+/// the environment, otherwise runs the CLI.
+pub fn run() -> anyhow::Result<()> {
+    match std::env::var("DESKCTL_DAEMON") {
+        Ok(_) => daemon::run(),
+        Err(_) => cli::run(),
+    }
+}
--- a/src/main.rs
+++ b/src/main.rs
@ -1,11 +1,3 @@
-mod backend;
-mod cli;
-mod core;
-mod daemon;
-
+// Binary entry point; all dispatch logic lives in the library's `run`.
 fn main() -> anyhow::Result<()> {
-    if std::env::var("DESKCTL_DAEMON").is_ok() {
-        return daemon::run();
-    }
-    cli::run()
+    deskctl::run()
 }
--- a/tests/support/mod.rs
+++ b/tests/support/mod.rs
@ -0,0 +1,281 @@
+#![cfg(target_os = "linux")]
+
+use std::os::unix::net::UnixListener;
+use std::path::{Path, PathBuf};
+use std::process::{Command, Output};
+use std::sync::{Mutex, OnceLock};
+use std::thread;
+use std::time::{SystemTime, UNIX_EPOCH};
+
+use anyhow::{anyhow, bail, Context, Result};
+use deskctl::cli::{connection, GlobalOpts};
+use x11rb::connection::Connection;
+use x11rb::protocol::xproto::{
+    AtomEnum, ConnectionExt as XprotoConnectionExt, CreateWindowAux, EventMask, PropMode,
+    WindowClass,
+};
+use x11rb::rust_connection::RustConnection;
+use x11rb::wrapper::ConnectionExt as X11WrapperConnectionExt;
+
+/// Returns the process-wide mutex shared by tests that touch the process
+/// environment. The mutex is created lazily on first use.
+pub fn env_lock() -> &'static Mutex<()> {
+    static ENV_MUTEX: OnceLock<Mutex<()>> = OnceLock::new();
+    ENV_MUTEX.get_or_init(Mutex::default)
+}
+
+/// Locks the shared environment mutex and returns its guard.
+///
+/// A poisoned mutex (an earlier holder panicked) is not treated as an error:
+/// the guard is recovered so later tests can still run.
+pub fn env_lock_guard() -> std::sync::MutexGuard<'static, ()> {
+    env_lock()
+        .lock()
+        .unwrap_or_else(|poisoned| poisoned.into_inner())
+}
+
+/// Guard that puts `XDG_SESSION_TYPE` back the way it was when dropped.
+pub struct SessionEnvGuard {
+    /// Value of `XDG_SESSION_TYPE` captured by `prepare` before overriding it;
+    /// `None` if the variable was unset or not valid Unicode.
+    old_session_type: Option<String>,
+}
+
+impl SessionEnvGuard {
+    /// Sets `XDG_SESSION_TYPE=x11` and returns a guard remembering the
+    /// previous value.
+    ///
+    /// Returns `None`, leaving the environment untouched, when `DISPLAY` is
+    /// unset, not valid Unicode, or empty.
+    pub fn prepare() -> Option<Self> {
+        match std::env::var("DISPLAY") {
+            Ok(display) if !display.is_empty() => {}
+            _ => return None,
+        }
+
+        let old_session_type = std::env::var("XDG_SESSION_TYPE").ok();
+        std::env::set_var("XDG_SESSION_TYPE", "x11");
+        Some(Self { old_session_type })
+    }
+}
+
+impl Drop for SessionEnvGuard {
+    /// Restores `XDG_SESSION_TYPE` to the captured value, or removes the
+    /// variable when no previous value was captured.
+    fn drop(&mut self) {
+        if let Some(previous) = self.old_session_type.as_deref() {
+            std::env::set_var("XDG_SESSION_TYPE", previous);
+        } else {
+            std::env::remove_var("XDG_SESSION_TYPE");
+        }
+    }
+}
+
+/// An X11 window created for a test; its `Drop` impl destroys the window.
+pub struct FixtureWindow {
+    /// Connection the window was created on.
+    conn: RustConnection,
+    /// X11 resource id generated for the window.
+    window: u32,
+}
+
+impl FixtureWindow {
+    /// Creates and maps a 320x180 window with a white background at (10, 10)
+    /// under the root of the default screen.
+    ///
+    /// `WM_NAME` is set to `title`; `WM_CLASS` is set to `app_class` twice,
+    /// each copy NUL-terminated. After flushing, the call sleeps 150 ms before
+    /// returning — presumably to let the server / window manager process the
+    /// map request (TODO confirm).
+    pub fn create(title: &str, app_class: &str) -> Result<Self> {
+        let (conn, screen_num) = connect_to_test_display()?;
+        let screen = &conn.setup().roots[screen_num];
+        let window = conn.generate_id()?;
+
+        let attributes = CreateWindowAux::new()
+            .background_pixel(screen.white_pixel)
+            .event_mask(EventMask::EXPOSURE);
+        conn.create_window(
+            x11rb::COPY_DEPTH_FROM_PARENT,
+            window,
+            screen.root,
+            10,
+            10,
+            320,
+            180,
+            0,
+            WindowClass::INPUT_OUTPUT,
+            0,
+            &attributes,
+        )?;
+
+        // Both string properties are written the same way; only the atom and
+        // the payload differ.
+        let wm_class = format!("{app_class}\0{app_class}\0");
+        let properties = [
+            (AtomEnum::WM_NAME, title.as_bytes()),
+            (AtomEnum::WM_CLASS, wm_class.as_bytes()),
+        ];
+        for (property, value) in properties {
+            conn.change_property8(
+                PropMode::REPLACE,
+                window,
+                property,
+                AtomEnum::STRING,
+                value,
+            )?;
+        }
+
+        conn.map_window(window)?;
+        conn.flush()?;
+
+        thread::sleep(std::time::Duration::from_millis(150));
+        Ok(Self { conn, window })
+    }
+}
+
+/// Connects to the default X display, retrying up to ten times.
+///
+/// After the k-th failed attempt (k = 1..=9) the thread sleeps `100 * k` ms;
+/// there is no sleep after the final attempt. The last connection error is
+/// returned with added context if every attempt fails.
+fn connect_to_test_display() -> Result<(RustConnection, usize)> {
+    const MAX_ATTEMPTS: u64 = 10;
+    let mut last_error = None;
+
+    for attempt in 1..=MAX_ATTEMPTS {
+        let error = match x11rb::connect(None) {
+            Ok(connection) => return Ok(connection),
+            Err(error) => error,
+        };
+        last_error = Some(anyhow!(error));
+
+        if attempt < MAX_ATTEMPTS {
+            thread::sleep(std::time::Duration::from_millis(100 * attempt));
+        }
+    }
+
+    Err(last_error.expect("x11 connection attempts should capture an error"))
+        .context("Failed to connect to the integration test display")
+}
+
+impl Drop for FixtureWindow {
+    /// Best-effort teardown: requests destruction of the window and flushes
+    /// the connection, ignoring any error from either call.
+    fn drop(&mut self) {
+        let Self { conn, window } = self;
+        let _ = conn.destroy_window(*window);
+        let _ = conn.flush();
+    }
+}
+
+/// A deskctl session for one test, rooted in its own temporary directory.
+pub struct TestSession {
+    /// Options addressing this session: explicit socket path and session name.
+    pub opts: GlobalOpts,
+    /// Directory that holds the session's socket and pid file.
+    root: PathBuf,
+}
+
+impl TestSession {
+    /// Creates a fresh session directory under the system temp dir.
+    ///
+    /// The session name is `{label}-{nanos}`, where `nanos` is the current
+    /// time since the Unix epoch; the directory is `deskctl-{label}-{nanos}`.
+    pub fn new(label: &str) -> Result<Self> {
+        let suffix = SystemTime::now()
+            .duration_since(UNIX_EPOCH)
+            .context("System clock is before the Unix epoch")?
+            .as_nanos();
+        let session = format!("{label}-{suffix}");
+
+        let root = std::env::temp_dir().join(format!("deskctl-{session}"));
+        std::fs::create_dir_all(&root)
+            .with_context(|| format!("Failed to create {}", root.display()))?;
+
+        let opts = GlobalOpts {
+            socket: Some(root.join("deskctl.sock")),
+            session,
+            json: false,
+        };
+        Ok(Self { opts, root })
+    }
+
+    /// Path of the session's Unix socket (always set by `new`).
+    pub fn socket_path(&self) -> &Path {
+        match self.opts.socket.as_deref() {
+            Some(path) => path,
+            None => panic!("TestSession always has an explicit socket path"),
+        }
+    }
+
+    /// Path of the pid file inside the session directory.
+    pub fn pid_path(&self) -> PathBuf {
+        self.root.join("deskctl.pid")
+    }
+
+    /// Binds a listener at the socket path and drops it immediately, so a
+    /// socket file with nothing listening on it is left behind.
+    pub fn create_stale_socket(&self) -> Result<()> {
+        let path = self.socket_path();
+        UnixListener::bind(path)
+            .map(drop)
+            .with_context(|| format!("Failed to bind {}", path.display()))
+    }
+
+    /// Runs `deskctl daemon start` for this session and fails with the
+    /// captured stdout/stderr if the command exits unsuccessfully.
+    pub fn start_daemon_cli(&self) -> Result<()> {
+        let output = self.run_cli(["daemon", "start"])?;
+        if !output.status.success() {
+            bail!(
+                "deskctl daemon start failed\nstdout:\n{}\nstderr:\n{}",
+                String::from_utf8_lossy(&output.stdout),
+                String::from_utf8_lossy(&output.stderr)
+            );
+        }
+
+        Ok(())
+    }
+
+    /// Runs the deskctl binary with `--socket` / `--session` for this session
+    /// followed by `args`, and returns its captured output.
+    ///
+    /// A non-zero exit status is not an error here; only failing to run the
+    /// process is.
+    pub fn run_cli<I, S>(&self, args: I) -> Result<Output>
+    where
+        I: IntoIterator<Item = S>,
+        S: AsRef<str>,
+    {
+        let binary = env!("CARGO_BIN_EXE_deskctl");
+        let socket = self.socket_path();
+
+        let mut command = Command::new(binary);
+        command.arg("--socket").arg(socket);
+        command.arg("--session").arg(&self.opts.session);
+        args.into_iter().for_each(|arg| {
+            command.arg(arg.as_ref());
+        });
+
+        command
+            .output()
+            .with_context(|| format!("Failed to run {} against {}", binary, socket.display()))
+    }
+
+    /// Runs the deskctl binary with the `DESKCTL_*` daemon variables set for
+    /// this session, plus the extra `env` pairs, and returns its captured
+    /// output.
+    pub fn run_daemon<I, K, V>(&self, env: I) -> Result<Output>
+    where
+        I: IntoIterator<Item = (K, V)>,
+        K: AsRef<std::ffi::OsStr>,
+        V: AsRef<std::ffi::OsStr>,
+    {
+        let binary = env!("CARGO_BIN_EXE_deskctl");
+
+        let mut command = Command::new(binary);
+        command.env("DESKCTL_DAEMON", "1");
+        command.env("DESKCTL_SOCKET_PATH", self.socket_path());
+        command.env("DESKCTL_PID_PATH", self.pid_path());
+        command.env("DESKCTL_SESSION", &self.opts.session);
+        // Caller-supplied pairs are applied last, after the defaults above.
+        command.envs(env);
+
+        command.output().with_context(|| {
+            format!(
+                "Failed to run daemon {} against {}",
+                binary,
+                self.socket_path().display()
+            )
+        })
+    }
+}
+
+impl Drop for TestSession {
+    /// Best-effort teardown: asks the daemon to stop, removes the socket and
+    /// pid files if they exist, then deletes the session directory. Every
+    /// error is ignored.
+    fn drop(&mut self) {
+        let _ = connection::stop_daemon(&self.opts);
+
+        for path in [self.socket_path().to_path_buf(), self.pid_path()] {
+            if path.exists() {
+                let _ = std::fs::remove_file(&path);
+            }
+        }
+
+        let _ = std::fs::remove_dir_all(&self.root);
+    }
+}
+
+/// Counts entries directly inside `/tmp` whose names start with `deskctl-`
+/// and end with `.png`.
+///
+/// Returns 0 when `/tmp` cannot be read; unreadable entries and names that
+/// are not valid UTF-8 are skipped.
+pub fn deskctl_tmp_screenshot_count() -> usize {
+    let Ok(entries) = std::fs::read_dir("/tmp") else {
+        return 0;
+    };
+
+    let mut count = 0;
+    for entry in entries.flatten() {
+        let file_name = entry.file_name();
+        if let Some(name) = file_name.to_str() {
+            if name.starts_with("deskctl-") && name.ends_with(".png") {
+                count += 1;
+            }
+        }
+    }
+    count
+}
+
+/// Parses the stdout of a deskctl command as JSON, requiring that the command
+/// exited successfully.
+///
+/// On a non-zero exit status the error carries the captured stdout and
+/// stderr.
+pub fn successful_json_response(output: Output) -> Result<serde_json::Value> {
+    if output.status.success() {
+        return serde_json::from_slice(&output.stdout)
+            .context("Failed to parse JSON output from deskctl");
+    }
+
+    bail!(
+        "deskctl command failed\nstdout:\n{}\nstderr:\n{}",
+        String::from_utf8_lossy(&output.stdout),
+        String::from_utf8_lossy(&output.stderr)
+    );
+}
+
+/// Parses the stdout of a deskctl command as JSON without checking the exit
+/// status, so structured error responses from failing commands can be
+/// inspected.
+///
+/// If stdout is not valid JSON, the error includes the captured stdout and
+/// stderr (as `successful_json_response` does for failed commands) so a
+/// command that died before emitting JSON can still be diagnosed.
+pub fn json_response(output: &Output) -> Result<serde_json::Value> {
+    serde_json::from_slice(&output.stdout).with_context(|| {
+        format!(
+            "Failed to parse JSON output from deskctl\nstdout:\n{}\nstderr:\n{}",
+            String::from_utf8_lossy(&output.stdout),
+            String::from_utf8_lossy(&output.stderr)
+        )
+    })
+}
--- a/tests/x11_runtime.rs
+++ b/tests/x11_runtime.rs
@ -0,0 +1,260 @@
+#![cfg(target_os = "linux")]
+
+mod support;
+
+use anyhow::Result;
+use deskctl::cli::connection::send_command;
+use deskctl::core::doctor;
+use deskctl::core::protocol::Request;
+
+use self::support::{
+    deskctl_tmp_screenshot_count, env_lock_guard, json_response, successful_json_response,
+    FixtureWindow, SessionEnvGuard, TestSession,
+};
+
+/// With a display available, `doctor::run` must report passing `display`,
+/// `backend`, `window-enumeration` and `screenshot` checks.
+#[test]
+fn doctor_reports_healthy_x11_environment() -> Result<()> {
+    let _guard = env_lock_guard();
+    let Some(_env) = SessionEnvGuard::prepare() else {
+        eprintln!("Skipping X11 integration test because DISPLAY is not set");
+        return Ok(());
+    };
+
+    let _window = FixtureWindow::create("deskctl doctor test", "DeskctlDoctor")?;
+    let session = TestSession::new("doctor")?;
+    let report = doctor::run(session.socket_path());
+
+    // True when the report contains a check with this name that passed.
+    let check_passed = |name: &str| {
+        report
+            .checks
+            .iter()
+            .any(|check| check.name == name && check.ok)
+    };
+
+    assert!(check_passed("display"));
+    assert!(check_passed("backend"));
+    assert!(check_passed("window-enumeration"));
+    assert!(check_passed("screenshot"));
+
+    Ok(())
+}
+
+/// `list-windows` must list the fixture window and must not change the number
+/// of `deskctl-*.png` files in `/tmp`.
+#[test]
+fn list_windows_is_side_effect_free() -> Result<()> {
+    let _guard = env_lock_guard();
+    let Some(_env) = SessionEnvGuard::prepare() else {
+        eprintln!("Skipping X11 integration test because DISPLAY is not set");
+        return Ok(());
+    };
+
+    let _window = FixtureWindow::create("deskctl list-windows test", "DeskctlList")?;
+    let session = TestSession::new("list-windows")?;
+    session.start_daemon_cli()?;
+
+    let before = deskctl_tmp_screenshot_count();
+    let response = send_command(&session.opts, &Request::new("list-windows"))?;
+    assert!(response.success);
+
+    let windows = match response.data.as_ref().and_then(|data| data.get("windows")) {
+        Some(serde_json::Value::Array(items)) => items.clone(),
+        _ => panic!("list-windows response must include a windows array"),
+    };
+    let fixture_listed = windows.iter().any(|window| {
+        window.get("title").and_then(|value| value.as_str()) == Some("deskctl list-windows test")
+    });
+    assert!(fixture_listed);
+
+    let after = deskctl_tmp_screenshot_count();
+    assert_eq!(
+        before, after,
+        "list-windows should not create screenshot artifacts"
+    );
+
+    Ok(())
+}
+
+/// `daemon start` must succeed when a socket file with no listener already
+/// exists at the socket path, and the daemon must then answer `list-windows`.
+#[test]
+fn daemon_start_recovers_from_stale_socket() -> Result<()> {
+    let _guard = env_lock_guard();
+    let Some(_env) = SessionEnvGuard::prepare() else {
+        eprintln!("Skipping X11 integration test because DISPLAY is not set");
+        return Ok(());
+    };
+
+    let _window = FixtureWindow::create("deskctl daemon recovery test", "DeskctlDaemon")?;
+    let session = TestSession::new("daemon-recovery")?;
+    session.create_stale_socket()?;
+
+    session.start_daemon_cli()?;
+    let output = session.run_cli(["--json", "list-windows"])?;
+    let response =
+        successful_json_response(output).expect("list-windows should return valid JSON");
+
+    let windows = response
+        .pointer("/data/windows")
+        .and_then(|value| value.as_array())
+        .expect("CLI JSON response must include windows");
+    let fixture_listed = windows.iter().any(|window| {
+        window.get("title").and_then(|value| value.as_str())
+            == Some("deskctl daemon recovery test")
+    });
+    assert!(fixture_listed);
+
+    Ok(())
+}
+
+/// Starting the daemon with `DISPLAY=:99999` must fail with the
+/// initialization error on stderr and leave no socket or pid file behind.
+#[test]
+fn daemon_init_failure_cleans_runtime_state() -> Result<()> {
+    let _guard = env_lock_guard();
+    let session = TestSession::new("daemon-init-failure")?;
+
+    let env_overrides = [("XDG_SESSION_TYPE", "x11"), ("DISPLAY", ":99999")];
+    let output = session.run_daemon(env_overrides)?;
+    assert!(!output.status.success(), "daemon startup should fail");
+
+    let stderr = String::from_utf8_lossy(&output.stderr);
+    assert!(
+        stderr.contains("Failed to initialize daemon state"),
+        "unexpected stderr: {stderr}"
+    );
+
+    let socket_left_behind = session.socket_path().exists();
+    assert!(
+        !socket_left_behind,
+        "failed startup should remove the socket path"
+    );
+    let pid_left_behind = session.pid_path().exists();
+    assert!(
+        !pid_left_behind,
+        "failed startup should remove the pid path"
+    );
+
+    Ok(())
+}
+
+/// `wait window` with a selector matching the fixture must succeed and return
+/// the matched window together with `"wait": "window"`.
+#[test]
+fn wait_window_returns_matched_window_payload() -> Result<()> {
+    let _guard = env_lock_guard();
+    let Some(_env) = SessionEnvGuard::prepare() else {
+        eprintln!("Skipping X11 integration test because DISPLAY is not set");
+        return Ok(());
+    };
+
+    let title = "deskctl wait window test";
+    let _window = FixtureWindow::create(title, "DeskctlWait")?;
+    let session = TestSession::new("wait-window-success")?;
+
+    let selector = format!("title={title}");
+    let output = session.run_cli([
+        "--json",
+        "wait",
+        "window",
+        "--selector",
+        &selector,
+        "--timeout",
+        "1",
+        "--poll-ms",
+        "50",
+    ])?;
+    let response = successful_json_response(output)?;
+
+    let window = response
+        .pointer("/data/window")
+        .expect("wait window should return a matched window");
+    let matched_title = window.get("title").and_then(|value| value.as_str());
+    assert_eq!(matched_title, Some(title));
+
+    let wait_kind = response
+        .pointer("/data/wait")
+        .and_then(|value| value.as_str());
+    assert_eq!(wait_kind, Some("window"));
+
+    Ok(())
+}
+
+/// Focusing by a fuzzy selector that matches two fixture windows must fail
+/// with a `selector_ambiguous` payload listing at least two candidates.
+#[test]
+fn ambiguous_fuzzy_selector_returns_candidates() -> Result<()> {
+    let _guard = env_lock_guard();
+    let Some(_env) = SessionEnvGuard::prepare() else {
+        eprintln!("Skipping X11 integration test because DISPLAY is not set");
+        return Ok(());
+    };
+
+    let _window_one = FixtureWindow::create("deskctl ambiguity alpha", "DeskctlAmbiguous")?;
+    let _window_two = FixtureWindow::create("deskctl ambiguity beta", "DeskctlAmbiguous")?;
+    let session = TestSession::new("selector-ambiguity")?;
+    let output = session.run_cli(["--json", "focus", "ambiguity"])?;
+    let response = json_response(&output)?;
+
+    assert!(!output.status.success());
+
+    let success = response.get("success").and_then(|value| value.as_bool());
+    assert_eq!(success, Some(false));
+
+    let kind = response
+        .pointer("/data/kind")
+        .and_then(|value| value.as_str());
+    assert_eq!(kind, Some("selector_ambiguous"));
+
+    let candidate_count = response
+        .pointer("/data/candidates")
+        .and_then(|value| value.as_array())
+        .map(|candidates| candidates.len());
+    assert!(matches!(candidate_count, Some(count) if count >= 2));
+
+    Ok(())
+}
+
+/// `wait focus` on a selector that matches nothing must fail with a `timeout`
+/// payload whose last observation is `selector_not_found`.
+#[test]
+fn wait_focus_timeout_is_structured() -> Result<()> {
+    let _guard = env_lock_guard();
+    let Some(_env) = SessionEnvGuard::prepare() else {
+        eprintln!("Skipping X11 integration test because DISPLAY is not set");
+        return Ok(());
+    };
+
+    let session = TestSession::new("wait-focus-timeout")?;
+    let args = [
+        "--json",
+        "wait",
+        "focus",
+        "--selector",
+        "title=missing-window-for-wait-focus",
+        "--timeout",
+        "1",
+        "--poll-ms",
+        "50",
+    ];
+    let output = session.run_cli(args)?;
+    let response = json_response(&output)?;
+
+    assert!(!output.status.success());
+
+    let kind = response
+        .pointer("/data/kind")
+        .and_then(|value| value.as_str());
+    assert_eq!(kind, Some("timeout"));
+
+    let last_observation_kind = response
+        .pointer("/data/last_observation/kind")
+        .and_then(|value| value.as_str());
+    assert_eq!(last_observation_kind, Some("selector_not_found"));
+
+    Ok(())
+}
Author	SHA1	Message	Date
Harivansh Rathi	32c6d337f1	ci: use self-hosted netty runners for validation jobs Some checks failed CI / Changes (push) Has been cancelled Details CI / Validate (push) Has been cancelled Details CI / Integration (Xvfb) (push) Has been cancelled Details CI / Distribution Validate (push) Has been cancelled Details CI / Update Manifests (push) Has been cancelled Details CI / Build Release Asset (push) Has been cancelled Details CI / Release (push) Has been cancelled Details CI / Publish npm (push) Has been cancelled Details CI / Publish crates.io (push) Has been cancelled Details	2026-04-05 11:46:45 -04:00
Harivansh Rathi	13119eecf7	update crates.io link Some checks failed CI / Changes (push) Has been cancelled Details CI / Validate (push) Has been cancelled Details CI / Integration (Xvfb) (push) Has been cancelled Details CI / Distribution Validate (push) Has been cancelled Details CI / Update Manifests (push) Has been cancelled Details CI / Build Release Asset (push) Has been cancelled Details CI / Release (push) Has been cancelled Details CI / Publish npm (push) Has been cancelled Details CI / Publish crates.io (push) Has been cancelled Details	2026-04-02 14:53:56 -04:00
github-actions[bot]	2b7de5fcef	release: v0.1.14 [skip ci]	2026-03-27 23:46:33 +00:00
Harivansh Rathi	2b3d422c7b	crates.io	2026-03-27 19:40:24 -04:00
Harivansh Rathi	19669fb4c1	demo	2026-03-27 19:25:26 -04:00
Hari	2107449d9b	Update README with asset link and description change Added a link to GitHub assets and removed 'Linux' from description.	2026-03-27 18:17:51 -04:00
github-actions[bot]	85e1916635	release: v0.1.13 [skip ci]	2026-03-27 14:10:07 +00:00
Harivansh Rathi	9bfada8b4b	fix helper	2026-03-27 10:04:10 -04:00
Harivansh Rathi	3ca6c90eaf	fix termination bug	2026-03-27 00:20:37 -04:00
github-actions[bot]	3a8d9f90c1	release: v0.1.12 [skip ci]	2026-03-26 19:31:47 +00:00
Hari	ff26c57035	replace firefox with chrome (#14 )	2026-03-26 15:25:40 -04:00
github-actions[bot]	580ea79c27	release: v0.1.11 [skip ci]	2026-03-26 18:47:09 +00:00
Harivansh Rathi	a58912284b	reorder pipeline	2026-03-26 14:40:45 -04:00
github-actions[bot]	8d690a62b4	release: v0.1.10 [skip ci]	2026-03-26 18:28:13 +00:00
Harivansh Rathi	07a478b0ee	couple CI with publish	2026-03-26 14:21:41 -04:00
github-actions[bot]	e61c5bc33f	release: v0.1.9 [skip ci]	2026-03-26 16:03:29 +00:00
Hari	a64b46b479	deskctl upgrade (#13 ) * deskctl upgrade * interactive update as well as --yes flag	2026-03-26 11:53:15 -04:00
Hari	2b02513d6e	Improve docs structure and navigation (#12 ) * Improve docs structure and navigation Co-authored-by: Codex <noreply@openai.com> * rm * handwrite docs --------- Co-authored-by: Codex <noreply@openai.com>	2026-03-26 11:27:35 -04:00
github-actions[bot]	844f2f2bc6	release: v0.1.8 [skip ci]	2026-03-26 13:37:41 +00:00
Harivansh Rathi	6c6f33040f	update readme	2026-03-26 09:35:46 -04:00
Harivansh Rathi	848ef97e87	edit readme	2026-03-26 09:34:10 -04:00
Harivansh Rathi	bf603671f9	rm:	2026-03-26 09:28:18 -04:00
Harivansh Rathi	3bfec9eecc	edit docs	2026-03-26 09:27:43 -04:00
Harivansh Rathi	c907e800af	change client bin name	2026-03-26 09:21:58 -04:00
Harivansh Rathi	2a8b51b4f5	docs: tighten skill install docs and bundle Co-authored-by: Codex <noreply@openai.com>	2026-03-26 09:21:43 -04:00
Harivansh Rathi	eedb5de2d4	refresh contributor cache [skip ci]	2026-03-26 09:13:10 -04:00
Harivansh Rathi	47047e9064	migrate update manifest job to publish workflow	2026-03-26 09:11:13 -04:00
Harivansh Rathi	deaffff45a	major/minor/patch	2026-03-26 09:07:56 -04:00
Harivansh Rathi	1d72c7b852	fix: add registry-url to setup-node for npm auth [skip ci]	2026-03-26 09:01:12 -04:00
Harivansh Rathi	86c36a3b50	release: v0.1.7 [skip ci]	2026-03-26 08:53:50 -04:00
Hari	eac3a61ceb	rename (#11 ) * align docs and contract * clean * rename from deskctl-cli to deskctl * runtime	2026-03-26 08:51:15 -04:00
Harivansh Rathi	88f9ff85a3	clean	2026-03-26 08:37:52 -04:00
Harivansh Rathi	14c8956321	align docs and contract	2026-03-26 08:37:52 -04:00
Harivansh Rathi	c37589ccf4	skill validated with workflows	2026-03-26 00:33:27 -04:00
Harivansh Rathi	3dbd9ce52d	init with runtime contract	2026-03-26 00:33:27 -04:00
github-actions[bot]	1092e503be	release: v0.1.6 [skip ci]	2026-03-26 03:25:14 +00:00
Hari	714e34ba19	nix (#7 ) npm cargo	2026-03-25 23:18:28 -04:00
github-actions[bot]	425a71095a	release: v0.1.5 [skip ci]	2026-03-26 02:04:56 +00:00
Hari	543d41c3a2	runtime contract enforcement (#6 )	2026-03-25 22:00:16 -04:00
github-actions[bot]	61f4738311	release: v0.1.4 [skip ci]	2026-03-26 01:16:24 +00:00
Hari	a4cf9e32dd	grouped runtime reads and waits selector modes (#5 ) - grouped runtime reads and waits selector modes - Fix wait command client timeouts and test failures	2026-03-25 21:11:30 -04:00
github-actions[bot]	cc8f8e548a	release: v0.1.3 [skip ci]	2026-03-25 23:47:58 +00:00
Harivansh Rathi	11ea267feb	gate the validation CI behind changes	2026-03-25 19:45:19 -04:00
Harivansh Rathi	08d8402afc	fix ci tag mismatch	2026-03-25 19:41:11 -04:00
Harivansh Rathi	ae5eb21563	licence	2026-03-25 19:34:36 -04:00
Harivansh Rathi	8944e82c1f	rm	2026-03-25 19:32:09 -04:00
Harivansh Rathi	ec9bc1f137	rm ai stuff from git	2026-03-25 19:30:22 -04:00
Hari	3819a85c47	tests and tooling (#4 ) * init openspec * clean out src, move mod into lib, remove trash * create tests * pre-commit hook * add tests to CI * update website * README, CONTRIBUTING and Makefile * openspec * archive task * fix ci order * fix integration test * fix validation tests	2026-03-25 19:29:59 -04:00
Harivansh Rathi	7dfab68304	mv skills into own dir	2026-03-25 18:36:21 -04:00
github-actions[bot]	bcf5f43fad	release: v0.1.1 [skip ci]	2026-03-25 22:34:39 +00:00
Hari	6dce22eaef	stabilize (#3 ) * specs * Stabilize deskctl runtime foundation Co-authored-by: Codex <noreply@openai.com> * opsx archive --------- Co-authored-by: Codex <noreply@openai.com>	2026-03-25 18:31:08 -04:00
Hari	d487a60209	openspec init (#2 )	2026-03-25 17:31:55 -04:00
Harivansh Rathi	a6ea5cc9e8	changes (detect paths + calculate version) \| build [cargo, docker] (parallel matrix) \| update-manifests (bump Cargo.toml, commit, tag) \| release (GitHub release + checksums)	2026-03-25 16:54:11 -04:00
Harivansh Rathi	4bd14c0da3	ci	2026-03-25 16:44:58 -04:00
Harivansh Rathi	6845f6b7e4	Acknowledgements	2026-03-25 16:31:15 -04:00
Harivansh Rathi	f241dcc1c2	gitignore	2026-03-25 16:25:14 -04:00
Harivansh Rathi	07124001eb	favicon	2026-03-25 16:24:27 -04:00
Harivansh Rathi	9a178e0b3a	font	2026-03-25 16:04:04 -04:00
Harivansh Rathi	e3c96878b1	scaffold docs	2026-03-25 16:04:04 -04:00
Harivansh Rathi	600fd6503b	base	2026-03-25 16:04:04 -04:00
Harivansh Rathi	26ec452878	public	2026-03-25 16:04:04 -04:00
Harivansh Rathi	50c9594780	site init (barrett)	2026-03-25 16:04:04 -04:00
Harivansh Rathi	f05f441dee	gitignore and comment	2026-03-25 15:16:42 -04:00
Harivansh Rathi	2b65c83245	temp rm uva	2026-03-25 13:40:34 -04:00