DevSymphony · sehwan505 · Nov 13, 2025 · Nov 12, 2025 · Nov 12, 2025 · Nov 12, 2025
diff --git a/internal/engine/llm/engine.go b/internal/engine/llm/engine.go
@@ -0,0 +1,285 @@
+package llm
+
+import (
+	"context"
+	"encoding/json"
+	"fmt"
+	"os"
+	"strings"
+	"time"
+
+	"github.com/DevSymphony/sym-cli/internal/engine/core"
+	"github.com/DevSymphony/sym-cli/internal/llm"
+)
+
+// Engine validates code using LLM-based analysis.
+// Unlike other engines that use static analysis tools, this engine
+// uses an LLM to understand and validate code against natural language rules.
+type Engine struct {
+	// client is the LLM client used for completions; it stays nil until
+	// Init has found an API key and created it.
+	client *llm.Client
+	// config is the engine configuration handed to Init; its Debug flag
+	// controls whether skipped files are reported during validation.
+	config core.EngineConfig
+}
+
+// NewEngine returns a zero-valued LLM engine.
+// The returned engine has no LLM client yet; Init creates it.
+func NewEngine() *Engine {
+	return new(Engine)
+}
+
+// Init stores the engine configuration and creates the LLM client.
+//
+// The API key is taken from ANTHROPIC_API_KEY, falling back to
+// OPENAI_API_KEY when the former is unset or empty. An error is returned
+// when neither variable provides a key. The ctx argument is not used.
+func (e *Engine) Init(ctx context.Context, config core.EngineConfig) error {
+	e.config = config
+
+	// Environment variables to consult, in priority order.
+	var key string
+	for _, name := range []string{"ANTHROPIC_API_KEY", "OPENAI_API_KEY"} {
+		if key = os.Getenv(name); key != "" {
+			break
+		}
+	}
+	if key == "" {
+		return fmt.Errorf("LLM API key not found (ANTHROPIC_API_KEY or OPENAI_API_KEY)")
+	}
+
+	e.client = llm.NewClient(key)
+	return nil
+}
+
+// Validate validates files against an LLM-based rule.
+//
+// files is first narrowed with core.FilterFiles using rule.When; when nothing
+// is left the rule passes trivially. Every remaining file is read from disk
+// and checked by the LLM. A file that cannot be read or checked is skipped
+// (and reported on stdout when config.Debug is set) so that one bad file does
+// not abort the whole run.
+//
+// An error is returned instead of a result when:
+//   - the engine has no client, i.e. Init was not called or did not succeed;
+//   - ctx is cancelled or expires before all files were checked. Without this
+//     an interrupted run would skip the remaining files and report a pass.
+//
+// Metrics.FilesProcessed counts only the files that were actually checked,
+// so callers can tell when files were skipped.
+func (e *Engine) Validate(ctx context.Context, rule core.Rule, files []string) (*core.ValidationResult, error) {
+	start := time.Now()
+
+	// Filter files by selector
+	files = core.FilterFiles(files, rule.When)
+
+	if len(files) == 0 {
+		return &core.ValidationResult{
+			RuleID:   rule.ID,
+			Passed:   true,
+			Engine:   "llm-validator",
+			Duration: time.Since(start),
+		}, nil
+	}
+
+	// The client is only created by a successful Init.
+	if e.client == nil {
+		return nil, fmt.Errorf("llm-validator: engine not initialized, call Init first")
+	}
+
+	violations := make([]core.Violation, 0)
+	processed := 0
+
+	// Validate each file
+	for _, file := range files {
+		// Stop as soon as the caller gives up; continuing would only
+		// produce a misleading "passed" result.
+		if err := ctx.Err(); err != nil {
+			return nil, fmt.Errorf("llm-validator: rule %v: %w", rule.ID, err)
+		}
+
+		// Read file content
+		content, err := os.ReadFile(file)
+		if err != nil {
+			if e.config.Debug {
+				fmt.Printf("⚠️  Failed to read file %s: %v\n", file, err)
+			}
+			continue
+		}
+
+		// Validate with LLM
+		fileViolations, err := e.validateFile(ctx, rule, file, string(content))
+		if err != nil {
+			// A failure caused by cancellation is not a per-file problem.
+			if ctxErr := ctx.Err(); ctxErr != nil {
+				return nil, fmt.Errorf("llm-validator: rule %v: %w", rule.ID, ctxErr)
+			}
+			if e.config.Debug {
+				fmt.Printf("⚠️  Failed to validate file %s: %v\n", file, err)
+			}
+			continue
+		}
+
+		processed++
+		violations = append(violations, fileViolations...)
+	}
+
+	return &core.ValidationResult{
+		RuleID:     rule.ID,
+		Passed:     len(violations) == 0,
+		Violations: violations,
+		Duration:   time.Since(start),
+		Engine:     "llm-validator",
+		Metrics: &core.Metrics{
+			FilesProcessed: processed,
+		},
+	}, nil
+}
+
+// validateFile asks the LLM whether a single file violates the rule.
+//
+// The file path, the rule description and the file content are embedded in
+// the user prompt; the system prompt requests a JSON verdict. The reply is
+// interpreted by parseValidationResponse. The result is an empty slice when
+// no violation is reported and a single violation otherwise. An error from
+// the LLM client is returned unchanged.
+func (e *Engine) validateFile(ctx context.Context, rule core.Rule, filePath string, content string) ([]core.Violation, error) {
+	// Instructions that fix the reply format.
+	const instructions = `You are a code reviewer. Check if the code violates the given coding convention.
+
+Respond with JSON only:
+{
+  "violates": true/false,
+  "description": "explanation of violation if any",
+  "suggestion": "how to fix it if violated",
+  "line": line_number_if_applicable (0 if not applicable)
+}`
+
+	question := fmt.Sprintf(`File: %s
+
+Coding Convention:
+%s
+
+Code:
+%s
+
+Does this code violate the convention?`, filePath, rule.Desc, content)
+
+	reply, err := e.client.Complete(ctx, instructions, question)
+	if err != nil {
+		return nil, err
+	}
+
+	verdict := parseValidationResponse(reply)
+	if !verdict.Violates {
+		return []core.Violation{}, nil
+	}
+
+	// Message layout: [rule message | ] description [ | Suggestion: ...]
+	msg := verdict.Description
+	if verdict.Suggestion != "" {
+		msg += " | Suggestion: " + verdict.Suggestion
+	}
+	if rule.Message != "" {
+		msg = rule.Message + " | " + msg
+	}
+
+	return []core.Violation{{
+		RuleID:   rule.ID,
+		Severity: rule.Severity,
+		Message:  msg,
+		File:     filePath,
+		Line:     verdict.Line,
+		Category: rule.Category,
+	}}, nil
+}
+
+// GetCapabilities describes what the LLM engine supports: its name, the
+// languages and rule categories it accepts, and that it needs neither
+// compilation nor external tools and offers no autofix.
+func (e *Engine) GetCapabilities() core.EngineCapabilities {
+	// LLM is language-agnostic - can understand any programming language
+	languages := []string{
+		"javascript", "typescript", "jsx", "tsx",
+		"python", "go", "java", "rust", "c", "cpp",
+		"ruby", "php", "swift", "kotlin", "scala",
+	}
+	categories := []string{
+		"convention", "style", "best-practice",
+		"security", "performance", "maintainability",
+	}
+
+	return core.EngineCapabilities{
+		Name:                "llm-validator",
+		SupportedLanguages:  languages,
+		SupportedCategories: categories,
+		SupportsAutofix:     false, // Future enhancement
+		RequiresCompilation: false,
+		ExternalTools:       []core.ToolRequirement{}, // No external tools needed
+	}
+}
+
+// Close cleans up resources.
+// It currently performs no cleanup and always returns nil.
+func (e *Engine) Close() error {
+	return nil
+}
+
+// validationResponse represents the parsed LLM response
+type validationResponse struct {
+	// Violates reports whether the LLM said the code breaks the rule.
+	Violates    bool
+	// Description is the LLM's explanation of the violation.
+	Description string
+	// Suggestion is the LLM's proposed fix; empty when none was given.
+	Suggestion  string
+	// Line is the reported line number; 0 when not applicable or unknown.
+	Line        int
+}
+
+// parseValidationResponse interprets the raw LLM reply.
+//
+// The reply is expected to contain a JSON object with the fields violates,
+// description, suggestion and line. The object is taken as the text between
+// the first '{' and the last '}', so surrounding prose or Markdown code
+// fences are tolerated, and is decoded with encoding/json. Decoding makes the
+// result independent of whitespace and key order, resolves escape sequences,
+// and keeps words inside the description (such as "does not violate") from
+// being mistaken for the verdict.
+//
+// When no decodable object is found (for example a truncated reply), the
+// function falls back to looking for an explicit "violates" flag in the text
+// and extracts the other fields with extractJSONField. A reply that cannot
+// be interpreted at all is treated as "no violation".
+func parseValidationResponse(response string) validationResponse {
+	// Default to no violation
+	var result validationResponse
+
+	open, end := strings.Index(response, "{"), strings.LastIndex(response, "}")
+	if open >= 0 && end > open {
+		var payload struct {
+			Violates    bool        `json:"violates"`
+			Description string      `json:"description"`
+			Suggestion  string      `json:"suggestion"`
+			Line        interface{} `json:"line"` // number, numeric string or null
+		}
+		if err := json.Unmarshal([]byte(response[open:end+1]), &payload); err == nil {
+			if !payload.Violates {
+				return result
+			}
+
+			result.Violates = true
+			result.Description = payload.Description
+			if result.Description == "" {
+				result.Description = "Rule violation detected"
+			}
+			result.Suggestion = payload.Suggestion
+
+			switch v := payload.Line.(type) {
+			case float64:
+				if v > 0 {
+					result.Line = int(v)
+				}
+			case string:
+				var n int
+				if _, err := fmt.Sscanf(v, "%d", &n); err == nil && n > 0 {
+					result.Line = n
+				}
+			}
+			return result
+		}
+	}
+
+	// Fallback for replies without a well-formed JSON object. Whitespace is
+	// removed first so that `"violates" : true` and similar variants match.
+	compact := strings.Join(strings.Fields(strings.ToLower(response)), "")
+	if strings.Contains(compact, `"violates":false`) || !strings.Contains(compact, `"violates":true`) {
+		return result
+	}
+
+	result.Violates = true
+
+	result.Description = extractJSONField(response, "description")
+	if result.Description == "" {
+		result.Description = "Rule violation detected"
+	}
+
+	result.Suggestion = extractJSONField(response, "suggestion")
+
+	if lineStr := extractJSONField(response, "line"); lineStr != "" {
+		var line int
+		if _, err := fmt.Sscanf(lineStr, "%d", &line); err == nil {
+			result.Line = line
+		}
+	}
+
+	return result
+}
+
+// extractJSONField pulls the value of a top-level-looking `"field": value`
+// pair out of response without requiring response to be valid JSON.
+//
+// Only string values and unsigned integer values are supported:
+//   - a string value is returned with its JSON escape sequences decoded
+//     (the raw text between the quotes is returned if decoding fails);
+//   - an integer value is returned as its digits.
+//
+// An occurrence of `"field"` that is not followed by a colon is a value, not
+// a key, and is skipped. The empty string is returned when the field is
+// missing, its string value is unterminated, or its value has another type.
+func extractJSONField(response, field string) string {
+	const jsonSpace = " \t\r\n"
+
+	key := `"` + field + `"`
+	rest := response
+	for {
+		i := strings.Index(rest, key)
+		if i == -1 {
+			return ""
+		}
+		rest = rest[i+len(key):]
+
+		// A key must be followed by ':' (optionally after whitespace).
+		after := strings.TrimLeft(rest, jsonSpace)
+		if !strings.HasPrefix(after, ":") {
+			continue
+		}
+
+		value := strings.TrimLeft(after[1:], jsonSpace)
+		if value == "" {
+			return ""
+		}
+
+		// Handle string value
+		if value[0] == '"' {
+			for j := 1; j < len(value); j++ {
+				switch value[j] {
+				case '\\':
+					// Skip the escaped character so that `\"` does not
+					// end the string and `\\` does not hide the real end.
+					j++
+				case '"':
+					literal := value[:j+1]
+					var decoded string
+					if err := json.Unmarshal([]byte(literal), &decoded); err == nil {
+						return decoded
+					}
+					return literal[1:j]
+				}
+			}
+			return "" // unterminated string
+		}
+
+		// Handle numeric value
+		end := 0
+		for end < len(value) && value[end] >= '0' && value[end] <= '9' {
+			end++
+		}
+		return value[:end]
+	}
+}
diff --git a/internal/engine/registry/builtin.go b/internal/engine/registry/builtin.go
@@ -4,6 +4,7 @@ import (
 	"github.com/DevSymphony/sym-cli/internal/engine/ast"
 	"github.com/DevSymphony/sym-cli/internal/engine/core"
 	"github.com/DevSymphony/sym-cli/internal/engine/length"
+	"github.com/DevSymphony/sym-cli/internal/engine/llm"
 	"github.com/DevSymphony/sym-cli/internal/engine/pattern"
 	"github.com/DevSymphony/sym-cli/internal/engine/style"
 	"github.com/DevSymphony/sym-cli/internal/engine/typechecker"
@@ -35,4 +36,9 @@ func init() {
 	MustRegister("typechecker", func() (core.Engine, error) {
 		return typechecker.NewEngine(), nil
 	})
+
+	// Register LLM validator engine
+	MustRegister("llm-validator", func() (core.Engine, error) {
+		return llm.NewEngine(), nil
+	})
 }
diff --git a/internal/llm/inference.go b/internal/llm/inference.go
@@ -13,11 +13,12 @@ import (
 const systemPrompt = `You are a code linting rule analyzer. Extract structured information from natural language coding rules.
 
 Extract:
-1. **engine**: pattern|length|style|ast|custom
+1. **engine**: pattern|length|style|ast|llm-validator
    - Use "style" for code formatting rules (semicolons, quotes, indentation, spacing)
    - Use "pattern" for naming conventions or content matching
    - Use "length" for size/length constraints
    - Use "ast" for structural complexity rules
+   - Use "llm-validator" for complex semantic rules that cannot be expressed with simple patterns
 
 2. **category**: naming|formatting|security|error_handling|testing|documentation|dependency|commit|performance|architecture|custom
 

diff --git a/internal/llm/types.go b/internal/llm/types.go
@@ -2,7 +2,7 @@ package llm
 
 // RuleIntent represents the structured interpretation of a natural language rule
 type RuleIntent struct {
-	Engine     string         // "pattern", "length", "style", "ast", "custom"
+	Engine     string         // "pattern", "length", "style", "ast", "llm-validator"
 	Category   string         // "naming", "formatting", "security", "error_handling", etc.
 	Target     string         // "identifier", "content", "import", "class", "method", etc.
 	Scope      string         // "line", "file", "function", "method", "class", etc.