Voice Transcription
Recording lifecycle, device management, and transcription behavior for voice-driven prompts.
Voice transcription is available anywhere the desktop app exposes dictation controls, including the plan terminal and prompt editors. The feature records audio locally and sends a single recording to the transcription service when you stop, then inserts text into the active input field without blocking manual typing.
Voice transcription pipeline
Audio capture, provider transcription, and text insertion flow.
The useVoiceTranscription React hook manages the complete recording lifecycle. It initializes MediaRecorder to capture audio in WebM format with the Opus codec, monitors audio levels, and handles device switching.
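As a sketch of that initialization (the helper name and structure are illustrative; only getUserMedia and the MediaRecorder APIs are standard):

```typescript
// Minimal sketch of recorder setup as described above; not the hook's
// actual source. Names other than the web APIs are illustrative.
async function startRecording(deviceId?: string): Promise<MediaRecorder> {
  // Request the microphone, optionally pinning a specific input device.
  const stream = await navigator.mediaDevices.getUserMedia({
    audio: deviceId ? { deviceId: { exact: deviceId } } : true,
  });

  // Prefer WebM with the Opus codec, matching the format described above.
  const mimeType = MediaRecorder.isTypeSupported("audio/webm;codecs=opus")
    ? "audio/webm;codecs=opus"
    : "audio/webm";

  const chunks: Blob[] = [];
  const recorder = new MediaRecorder(stream, { mimeType });
  recorder.ondataavailable = (e) => {
    if (e.data.size > 0) chunks.push(e.data);
  };
  recorder.onstop = () => {
    // The hook sends this single blob to the transcription service.
    const recording = new Blob(chunks, { type: mimeType });
    void recording; // hand off to the upload path
  };
  recorder.start();
  return recorder;
}
```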
The desktop app invokes transcribe_audio_command to send audio data to the server endpoint /api/audio/transcriptions. The command validates minimum size (1KB), duration, temperature (0.0-1.0), and prompt length (max 1000 characters); the server enforces max file size (100MB).
Audio files must be between 1KB and 100MB. Supported formats: WAV, MP3, M4A, OGG, WebM, FLAC, AAC, and MP4. The transcription model must be specified explicitly and must be in the server allowlist (OpenAI models by default on hosted).
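The enforcement lives in the Tauri command and the server, but the documented limits can be mirrored client-side. The sketch below restates them in TypeScript; the function and field names are illustrative, not the command's actual interface:

```typescript
// Client-side mirror of the documented limits: 1KB minimum, 100MB maximum,
// temperature 0.0-1.0, prompt up to 1000 characters. The command also
// validates duration, whose bounds aren't documented here.
const MIN_BYTES = 1024; // 1KB minimum (validated by the Tauri command)
const MAX_BYTES = 100 * 1024 * 1024; // 100MB maximum (enforced server-side)
const MAX_PROMPT_CHARS = 1000;

function validateTranscriptionRequest(opts: {
  audioBytes: Uint8Array;
  temperature?: number;
  prompt?: string;
}): string | null {
  if (opts.audioBytes.length < MIN_BYTES) return "recording too small";
  if (opts.audioBytes.length > MAX_BYTES) return "recording too large";
  if (
    opts.temperature !== undefined &&
    (opts.temperature < 0 || opts.temperature > 1)
  ) {
    return "temperature must be between 0.0 and 1.0";
  }
  if (opts.prompt && opts.prompt.length > MAX_PROMPT_CHARS) {
    return "prompt exceeds 1000 characters";
  }
  return null; // request is within the documented limits
}
```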
Recording workflow
The recording hook keeps a state machine with idle, recording, processing, and error states, sketched after the list below. It records audio into a single blob, enforces a ten-minute cap, and sends the recording on stop.
Recording states
- idle: No recording in progress, microphone permissions may or may not be granted
- recording: Capturing audio via MediaRecorder with live level monitoring
- processing: Uploading the recording to the transcription endpoint and awaiting a response
- error: Recording failed due to permission denial, device disconnection, or transcription API error
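A minimal sketch of that state machine; the states match the list above, while the transition table is an assumption about how the hook likely moves between them:

```typescript
// Illustrative shape of the recording state machine; the hook's actual
// types and transitions may differ.
type RecordingState = "idle" | "recording" | "processing" | "error";

const TEN_MINUTES_MS = 10 * 60 * 1000; // documented recording cap

// Assumed legal transitions between the documented states.
const transitions: Record<RecordingState, RecordingState[]> = {
  idle: ["recording"],
  recording: ["processing", "error", "idle"],
  processing: ["idle", "error"],
  error: ["idle"],
};

function canTransition(from: RecordingState, to: RecordingState): boolean {
  return transitions[from].includes(to);
}
```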
Server-side processing
The server exposes /api/audio/transcriptions, which accepts multipart form data. It routes requests to OpenAI or Google based on the model's provider configuration, validates user credits, and calculates billing from the audio duration. A request sketch follows the parameter list below.
Request parameters
- file: Audio file data (required) - WAV, MP3, M4A, OGG, WebM, FLAC, AAC, or MP4
- model: Transcription model ID (required) - from server allowlist (e.g., openai/gpt-4o-transcribe)
- durationMs: Recording duration in milliseconds (required for billing calculation)
- language: ISO 639-1 language code (optional) - improves accuracy for specific languages
- prompt: Context hint for transcription (optional, max 1000 characters) - helps with domain-specific vocabulary
- temperature: Sampling temperature 0.0-1.0 (optional, default 0.0) - lower values produce more deterministic output
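For illustration, a direct request to the endpoint using these parameters might look like the following. In the desktop app the call actually goes through the Tauri command layer; the form field names simply restate the parameter list above, and anything else (helper name, sample values) is an assumption:

```typescript
// Hypothetical direct call to /api/audio/transcriptions with the
// documented multipart parameters.
async function transcribe(audio: Blob, durationMs: number, token: string) {
  const form = new FormData();
  form.append("file", audio, "recording.webm"); // required audio file
  form.append("model", "openai/gpt-4o-transcribe"); // must be on the allowlist
  form.append("durationMs", String(durationMs)); // required for billing
  form.append("language", "en"); // optional ISO 639-1 hint
  form.append("prompt", "Sprint planning, Kubernetes, PostgreSQL"); // optional, max 1000 chars
  form.append("temperature", "0.0"); // optional, default 0.0

  const res = await fetch("/api/audio/transcriptions", {
    method: "POST",
    headers: { Authorization: `Bearer ${token}` },
    body: form,
  });
  if (!res.ok) throw new Error(`transcription failed: ${res.status}`);
  return res.json(); // transcribed text payload
}
```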
Project-aware settings
When a recording session starts, the hook looks up the active project's transcription configuration so recordings follow the project's preferences.
Project transcription preferences are stored in SQLite key_value_store under project_task_settings and include the preferred model, language code, prompt, and temperature. Hosted uses managed providers; self-hosting can adjust the allowlist.
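A plausible TypeScript shape for those stored preferences; the field names are assumptions, with the documented constraints noted inline:

```typescript
// Assumed shape of per-project transcription preferences stored under
// project_task_settings in the SQLite key_value_store.
interface ProjectTranscriptionSettings {
  model: string;        // e.g. "openai/gpt-4o-transcribe", from the allowlist
  language?: string;    // ISO 639-1 code, e.g. "en"
  prompt?: string;      // domain vocabulary hint, max 1000 characters
  temperature?: number; // 0.0-1.0, defaults to 0.0
}
```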
Device management
The feature requests microphone permission, enumerates available audio inputs, and lets users choose the active device before recording. Changes take effect on the next recording.
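Enumerating inputs uses standard web APIs; note that device labels typically come back empty until microphone permission has been granted:

```typescript
// List available microphones after securing permission, so that
// human-readable labels are populated for the device picker.
async function listMicrophones(): Promise<MediaDeviceInfo[]> {
  await navigator.mediaDevices.getUserMedia({ audio: true }); // triggers the permission prompt
  const devices = await navigator.mediaDevices.enumerateDevices();
  return devices.filter((d) => d.kind === "audioinput");
}
```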
Real-time audio level monitoring displays visual feedback during recording. The system warns when audio is silent so you can catch muted microphones before sending the recording.
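One way to compute a live level and flag silence is an AnalyserNode over the recording stream; the RMS metric below is a common approach, not necessarily the app's exact implementation:

```typescript
// Derive a live audio level from the stream using the Web Audio API.
// A sustained level near zero suggests a muted microphone.
function monitorLevel(stream: MediaStream, onLevel: (rms: number) => void) {
  const ctx = new AudioContext();
  const source = ctx.createMediaStreamSource(stream);
  const analyser = ctx.createAnalyser();
  analyser.fftSize = 2048;
  source.connect(analyser);

  const buf = new Float32Array(analyser.fftSize);
  const tick = () => {
    analyser.getFloatTimeDomainData(buf);
    // Root-mean-square amplitude as a simple level metric.
    const rms = Math.sqrt(buf.reduce((s, x) => s + x * x, 0) / buf.length);
    onLevel(rms);
    requestAnimationFrame(tick);
  };
  tick();
}
```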
Data flow
Audio data flows from the browser through the Tauri command layer to the server, which proxies requests to the appropriate transcription provider. A sketch of the stop handler follows the steps below.
Processing steps
- Browser MediaRecorder captures audio in a single recording (WebM by default)
- useVoiceTranscription tracks duration and recording state
- On stop, the audio blob is converted to bytes and sent via transcribe_audio_command
- Tauri command validates size, duration, temperature, and prompt length
- Request sent to server /api/audio/transcriptions endpoint with auth token
- Server routes to the configured provider and returns transcribed text
- Transcribed text returned to desktop and inserted via callback
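A sketch tying the steps above together, assuming Tauri v2's invoke API; the argument names passed to transcribe_audio_command are hypothetical:

```typescript
import { invoke } from "@tauri-apps/api/core"; // Tauri v2 import path

// Stop handler sketch: blob -> bytes -> Tauri command -> insertion callback.
// The command name comes from this page; its argument shape is assumed.
async function onRecordingStopped(
  recording: Blob,
  durationMs: number,
  insertText: (text: string) => void,
) {
  const bytes = new Uint8Array(await recording.arrayBuffer());
  const text = await invoke<string>("transcribe_audio_command", {
    audio: Array.from(bytes), // serialized for the command layer
    durationMs,
  });
  insertText(text); // inserted into the active input via callback
}
```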
Multi-destination routing
Transcribed text is routed based on the active UI context and inserted into the appropriate input; a routing sketch follows this list.
- Task description editors: Cursor insertion with optional follow-up text_improvement
- Terminal dictation buffer: Command text inserted into PTY input
- Prompt editors: Direct insertion into active text inputs
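A minimal sketch of that routing; the context names and insertion helpers are hypothetical, standing in for the app's real destinations:

```typescript
// Illustrative dispatch of transcribed text by UI context.
type DictationContext = "task-editor" | "terminal" | "prompt-editor";

function routeTranscription(
  context: DictationContext,
  text: string,
  deps: {
    insertAtCursor: (t: string) => void;  // task description editors
    writeToPty: (t: string) => void;      // terminal dictation buffer
    insertIntoInput: (t: string) => void; // prompt editors
  },
) {
  switch (context) {
    case "task-editor":
      deps.insertAtCursor(text); // may be followed by text_improvement
      break;
    case "terminal":
      deps.writeToPty(text);
      break;
    case "prompt-editor":
      deps.insertIntoInput(text);
      break;
  }
}
```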
Key implementation files
- desktop/src/hooks/use-voice-recording/use-voice-transcription.ts
- desktop/src/actions/voice-transcription/transcribe.ts
- desktop/src-tauri/src/commands/audio_commands.rs
- server/src/handlers/proxy/specialized/transcription.rs
- server/src/clients/openai/transcription.rs
- server/src/clients/google_client.rs
Usage examples
Common voice transcription workflows:
- Sprint planning: Dictate tasks, then run text_improvement and task_refinement
- Terminal commands: Dictation transcribed and typed directly into PTY for execution
- Bug reports: Verbal description captured, refined with text_improvement, then stored in task history
- Walkthrough notes: Narrate a screen recording and attach the video analysis summary to the task
Continue exploring
Learn how transcribed text can be refined and how meeting recordings are processed into actionable tasks.