Inferara · 0xGeorgii · Mar 2, 2026 · Mar 2, 2026 · Mar 6, 2026 · Mar 6, 2026
diff --git a/Cargo.toml b/Cargo.toml
@@ -33,6 +33,7 @@ inference-type-checker = { path = "./core/type-checker", version = "0.0.1" }
 inference-cli = { path = "./core/cli", version = "0.0.1" }
 inference-wasm-to-v-translator = { path = "./core/wasm-to-v", version = "0.0.1" }
 inference-wasm-codegen = { path = "./core/wasm-codegen", version = "0.0.1" }
+inference-analysis = { path = "./core/analysis", version = "0.0.1" }
 
 # IDE support crates
 inference-base-db = { path = "./ide/base-db", version = "0.0.1" }

diff --git a/core/analysis/Cargo.toml b/core/analysis/Cargo.toml
@@ -0,0 +1,15 @@
+[package]
+name = "inference-analysis"
+version = { workspace = true }
+edition = { workspace = true }
+license = { workspace = true }
+homepage = { workspace = true }
+repository = { workspace = true }
+description = "Static analysis pass for the Inference compiler"
+keywords = ["compiler", "analysis", "control-flow", "verification"]
+categories = ["compilers"]
+
+[dependencies]
+inference-ast.workspace = true
+inference-type-checker.workspace = true
+thiserror.workspace = true
diff --git a/core/analysis/README.md b/core/analysis/README.md
@@ -0,0 +1,41 @@
+# inference-analysis
+
+Static analysis rules for the Inference compiler. Runs after type checking, before code generation.
+
+## Architecture
+
+Each analysis check is an independent struct implementing the `Rule` trait. Rules receive the
+fully-typed `TypedContext` and return a list of `AnalysisError` values. The `analyze()` entry
+point runs all rules sequentially and collects every error before returning.
+
+A shared `walk_function_bodies()` walker handles AST traversal with `loop_depth` and
+`nondet_depth` counters so individual rules focus on detection logic only.
+
+The `rule!` macro reduces boilerplate for rule definitions:
+
+```rust
+rule! {
+    /// Break must appear inside a loop body.
+    #[id = "A001"]
+    #[name = "Break outside loop"]
+    pub struct BreakOutsideLoop;
+    fn check(ctx: &TypedContext) -> Vec<AnalysisError> {
+        // implementation using walk_function_bodies
+    }
+}
+```
+
+## How to add a new rule
+
+1. Create `src/rules/new_rule.rs` using the `rule!` macro (see existing rules for examples).
+2. Add `pub mod new_rule;` to `src/rules/mod.rs`.
+3. Add `Box::new(NewRule)` to the vec in `all_rules()`.
+
+## Rules
+
+| ID | Rule | Diagnostic Message |
+|----|------|--------------------|
+| A001 | `break` must be inside a loop body | `break statement is only valid inside a loop body` |
+| A002 | `break` must not be inside a non-deterministic block (`forall`, `exists`, `assume`, `unique`) | `break statement is not allowed inside a non-deterministic block` |
+| A003 | `return` must not appear inside a loop body | `return inside a loop is not allowed; use break to exit the loop, then return after it` |
+| A004 | Infinite `loop { }` must contain a reachable `break` | `infinite loop must contain a break statement` |
diff --git a/core/analysis/src/errors.rs b/core/analysis/src/errors.rs
@@ -0,0 +1,237 @@
+//! Analysis Error Types
+//!
+//! This module defines the error types produced by the analysis pass, providing
+//! detailed context and location information for all control flow violations.
+//!
+//! ## Error Design
+//!
+//! All analysis errors:
+//! - Include precise source location (line and column)
+//! - Provide actionable error messages with guidance
+//! - Use descriptive error messages via `thiserror`
+//! - Are collected and reported together (error recovery)
+//!
+//! ## Error Categories
+//!
+//! **Loop Control Flow Errors**:
+//! - [`AnalysisError::BreakOutsideLoop`] - `break` used outside a loop body
+//! - [`AnalysisError::BreakInsideNonDetBlock`] - `break` used inside a non-deterministic block
+//! - [`AnalysisError::ReturnInsideLoop`] - `return` used inside a loop body
+//! - [`AnalysisError::InfiniteLoopWithoutBreak`] - Infinite loop missing a `break` statement
+
+use std::fmt::{self, Display, Formatter};
+
+use inference_ast::nodes::Location;
+use thiserror::Error;
+
+/// Severity level for analysis findings.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum Severity {
+    Info,
+    Warning,
+    Error,
+}
+
+/// Represents a control flow analysis error with source location.
+#[derive(Debug, Clone, Error)]
+pub enum AnalysisError {
+    #[error(
+        "{location}: break statement is only valid inside a loop body"
+    )]
+    BreakOutsideLoop { location: Location },
+
+    #[error(
+        "{location}: break statement is not allowed inside a non-deterministic block; non-deterministic blocks must explore all execution paths, and break would exit the enclosing loop"
+    )]
+    BreakInsideNonDetBlock { location: Location },
+
+    #[error(
+        "{location}: return inside a loop is not allowed; use break to exit the loop, then return after it"
+    )]
+    ReturnInsideLoop { location: Location },
+
+    #[error("{location}: infinite loop must contain a reachable break statement; a loop without a condition requires break to terminate")]
+    InfiniteLoopWithoutBreak { location: Location },
+
+    #[error("{location}: return statement is not allowed inside a non-deterministic block; non-deterministic blocks must explore all execution paths, and return would exit the enclosing function")]
+    ReturnInsideNonDetBlock { location: Location },
+}
+
+impl AnalysisError {
+    /// Returns the source location associated with this error.
+    #[must_use = "returns the source location without modifying the error"]
+    pub fn location(&self) -> &Location {
+        match self {
+            AnalysisError::BreakOutsideLoop { location }
+            | AnalysisError::BreakInsideNonDetBlock { location }
+            | AnalysisError::ReturnInsideLoop { location }
+            | AnalysisError::InfiniteLoopWithoutBreak { location }
+            | AnalysisError::ReturnInsideNonDetBlock { location } => location,
+        }
+    }
+}
+
+/// Wrapper for multiple analysis errors, following the `TypeCheckErrors` pattern.
+///
+/// Collects all analysis errors found during a single pass, allowing the user
+/// to see all issues at once rather than fixing one error at a time.
+#[derive(Debug, Clone)]
+pub struct AnalysisErrors {
+    errors: Vec<AnalysisError>,
+}
+
+impl AnalysisErrors {
+    pub(crate) fn new(errors: Vec<AnalysisError>) -> Self {
+        Self { errors }
+    }
+
+    /// Returns the list of analysis errors.
+    #[must_use]
+    pub fn errors(&self) -> &[AnalysisError] {
+        &self.errors
+    }
+}
+
+impl Display for AnalysisErrors {
+    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
+        let messages: Vec<String> = self.errors.iter().map(ToString::to_string).collect();
+        write!(f, "{}", messages.join("; "))
+    }
+}
+
+impl std::error::Error for AnalysisErrors {}
+
+/// Holds non-fatal analysis findings (warnings and informational messages).
+///
+/// Returned from `analyze()` when no hard errors are found, allowing the
+/// compilation pipeline to continue while still reporting lesser findings.
+#[derive(Debug, Clone)]
+pub struct AnalysisResult {
+    pub warnings: Vec<AnalysisError>,
+    pub infos: Vec<AnalysisError>,
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    fn test_location() -> Location {
+        Location {
+            offset_start: 4,
+            offset_end: 9,
+            start_line: 1,
+            start_column: 5,
+            end_line: 1,
+            end_column: 10,
+        }
+    }
+
+    #[test]
+    fn display_break_outside_loop() {
+        let err = AnalysisError::BreakOutsideLoop {
+            location: test_location(),
+        };
+        assert_eq!(
+            err.to_string(),
+            "1:5: break statement is only valid inside a loop body"
+        );
+    }
+
+    #[test]
+    fn display_break_inside_nondet_block() {
+        let err = AnalysisError::BreakInsideNonDetBlock {
+            location: test_location(),
+        };
+        assert_eq!(
+            err.to_string(),
+            "1:5: break statement is not allowed inside a non-deterministic block; non-deterministic blocks must explore all execution paths, and break would exit the enclosing loop"
+        );
+    }
+
+    #[test]
+    fn display_return_inside_loop() {
+        let err = AnalysisError::ReturnInsideLoop {
+            location: test_location(),
+        };
+        assert_eq!(
+            err.to_string(),
+            "1:5: return inside a loop is not allowed; use break to exit the loop, then return after it"
+        );
+    }
+
+    #[test]
+    fn display_infinite_loop_without_break() {
+        let err = AnalysisError::InfiniteLoopWithoutBreak {
+            location: test_location(),
+        };
+        assert_eq!(
+            err.to_string(),
+            "1:5: infinite loop must contain a reachable break statement; a loop without a condition requires break to terminate"
+        );
+    }
+
+    #[test]
+    fn display_return_inside_nondet_block() {
+        let err = AnalysisError::ReturnInsideNonDetBlock {
+            location: test_location(),
+        };
+        assert_eq!(
+            err.to_string(),
+            "1:5: return statement is not allowed inside a non-deterministic block; non-deterministic blocks must explore all execution paths, and return would exit the enclosing function"
+        );
+    }
+
+    #[test]
+    fn error_location_accessor() {
+        let loc = test_location();
+        let err = AnalysisError::BreakOutsideLoop { location: loc };
+        assert_eq!(err.location(), &loc);
+    }
+
+    #[test]
+    fn display_analysis_errors_single() {
+        let errors = AnalysisErrors::new(vec![AnalysisError::BreakOutsideLoop {
+            location: test_location(),
+        }]);
+        assert_eq!(
+            errors.to_string(),
+            "1:5: break statement is only valid inside a loop body"
+        );
+    }
+
+    #[test]
+    fn display_analysis_errors_multiple() {
+        let errors = AnalysisErrors::new(vec![
+            AnalysisError::BreakOutsideLoop {
+                location: test_location(),
+            },
+            AnalysisError::ReturnInsideLoop {
+                location: Location {
+                    offset_start: 20,
+                    offset_end: 30,
+                    start_line: 3,
+                    start_column: 10,
+                    end_line: 3,
+                    end_column: 20,
+                },
+            },
+        ]);
+        assert_eq!(
+            errors.to_string(),
+            "1:5: break statement is only valid inside a loop body; 3:10: return inside a loop is not allowed; use break to exit the loop, then return after it"
+        );
+    }
+
+    #[test]
+    fn display_analysis_errors_empty() {
+        let errors = AnalysisErrors::new(vec![]);
+        assert_eq!(errors.to_string(), "");
+    }
+
+    #[test]
+    fn severity_variants() {
+        assert_ne!(Severity::Error, Severity::Warning);
+        assert_ne!(Severity::Warning, Severity::Info);
+        assert_ne!(Severity::Error, Severity::Info);
+    }
+}
diff --git a/core/analysis/src/lib.rs b/core/analysis/src/lib.rs
@@ -0,0 +1,75 @@
+#![warn(clippy::pedantic)]
+//! Control Flow Analysis Pass for the Inference Compiler
+//!
+//! This crate provides semantic analysis that validates control flow invariants
+//! beyond what the type checker covers. It operates on the fully-typed AST and
+//! runs after type checking but before code generation.
+//!
+//! ## Current Analyses
+//!
+//! ### Loop Control Flow Validation
+//!
+//! - `break` must appear inside a loop body
+//! - `break` must not appear inside a non-deterministic block
+//! - `return` must not appear inside a loop body
+//! - Infinite loops (`loop { ... }`) must contain a `break` statement
+//!
+//! ## Pipeline Position
+//!
+//! ```text
+//! parse -> type_check -> analyze -> codegen
+//! ```
+//!
+//! The `analyze()` function is called by the orchestration layer in
+//! `core/inference/src/lib.rs` after type checking succeeds.
+//!
+//! ## Rule Architecture
+//!
+//! Each analysis check is an independent struct implementing the [`rule::Rule`]
+//! trait. Rules are registered in [`rules::all_rules()`] and executed
+//! sequentially. The [`rule!`] macro reduces boilerplate for rule definitions.
+//!
+//! ## Design
+//!
+//! This crate depends on `inference-ast` and `inference-type-checker`.
+//! The entry point accepts `&TypedContext` from the type checker.
+
+use inference_type_checker::typed_context::TypedContext;
+
+pub mod errors;
+pub mod rule;
+pub mod rules;
+mod walker;
+
+use errors::{AnalysisErrors, AnalysisResult, Severity};
+
+/// Performs control flow analysis on the typed AST.
+///
+/// Runs all registered analysis rules and collects errors. Currently includes:
+/// - Loop control flow validation (break placement, return inside loop,
+///   infinite loop detection)
+///
+/// # Errors
+///
+/// Returns `AnalysisErrors` if any control flow violations are found.
+/// All errors are collected before returning, allowing the user to see
+/// all issues at once.
+pub fn analyze(typed_context: &TypedContext) -> Result<AnalysisResult, AnalysisErrors> {
+    let all_rules = rules::all_rules();
+    let mut errors = Vec::new();
+    let mut warnings = Vec::new();
+    let mut infos = Vec::new();
+    for r in &all_rules {
+        let findings = r.check(typed_context);
+        match r.severity() {
+            Severity::Error => errors.extend(findings),
+            Severity::Warning => warnings.extend(findings),
+            Severity::Info => infos.extend(findings),
+        }
+    }
+    if errors.is_empty() {
+        Ok(AnalysisResult { warnings, infos })
+    } else {
+        Err(AnalysisErrors::new(errors))
+    }
+}