H4LFdotDEV
diff --git a/.env.example b/.env.example
Lines changed: 0 additions & 53 deletions
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
Lines changed: 0 additions & 1 deletion
diff --git a/CLAUDE.md b/CLAUDE.md
Lines changed: 2 additions & 25 deletions
diff --git a/README.md b/README.md
Lines changed: 6 additions & 7 deletions
diff --git a/config/litellm.yaml b/config/litellm.yaml
Lines changed: 0 additions & 159 deletions
@@ -106,35 +106,6 @@ EMBEDDING_PROVIDER=ollama
 EMBEDDING_DIMENSIONS=768
 
 
-# ─────────────────────────────────────────────────────────────────────────────
-# LITELLM ROUTING CONFIGURATION
-# ─────────────────────────────────────────────────────────────────────────────
-#
-# LiteLLM provides intelligent routing, fallbacks, and cost tracking.
-# Strategy options:
-#   cost_optimized   - Prefer cheapest model that can handle the task
-#   quality_first    - Prefer best model, fall back on failure
-#   balanced         - Balance cost and quality
-#   local_first      - Try local models first, escalate to API
-#
-# ─────────────────────────────────────────────────────────────────────────────
-
-LITELLM_MASTER_KEY=sk-litellm-...
-LITELLM_PORT=4000
-LITELLM_LOG_LEVEL=INFO
-
-# Routing strategy
-LITELLM_ROUTING_STRATEGY=local_first
-
-# Cost tracking
-LITELLM_BUDGET_DAILY=10.00
-LITELLM_BUDGET_MONTHLY=200.00
-
-# Token thresholds for model escalation
-ESCALATE_AT_TOKENS=4000
-ESCALATE_AT_COMPLEXITY=0.7
-
-
 # ─────────────────────────────────────────────────────────────────────────────
 # REDIS (Hot Tier)
 # ─────────────────────────────────────────────────────────────────────────────
@@ -180,27 +151,6 @@ LIVEGREP_BUILD_PARALLELISM=4
 LIVEGREP_INDEX_ON_SESSION_END=true
 
 
-# ─────────────────────────────────────────────────────────────────────────────
-# HOUND (Project Search)
-# ─────────────────────────────────────────────────────────────────────────────
-
-HOUND_BIND_ADDRESS=127.0.0.1:6080
-HOUND_POLL_INTERVAL=30000
-HOUND_MAX_CONCURRENT_INDEXERS=2
-
-
-# ─────────────────────────────────────────────────────────────────────────────
-# LANCEDB (Semantic Search Vector Store)
-# ─────────────────────────────────────────────────────────────────────────────
-
-LANCEDB_PATH=${CLAUDE_CODE_PP_HOME}/memory/semantic.lance
-LANCEDB_TABLE_NAME=code_embeddings
-
-# Chunking settings for semantic indexing
-CHUNK_SIZE_LINES=150
-CHUNK_OVERLAP_LINES=20
-
-
 # ─────────────────────────────────────────────────────────────────────────────
 # OBSIDIAN VAULT (Archive - Human Readable)
 # ─────────────────────────────────────────────────────────────────────────────
@@ -263,22 +213,19 @@ DEFAULT_PERMISSION_LEVEL=standard
 # FAST_MODEL=llama3.2:3b
 # EMBEDDING_MODEL=nomic-embed-text
 # EMBEDDING_PROVIDER=ollama
-# LITELLM_ROUTING_STRATEGY=local_first
 #
 # ─── PRESET: Balanced (Local simple, API for complex) ────────────────────────
 # EFFICIENCY_PRESET=balanced
 # PRIMARY_MODEL=claude-sonnet-4-5-20250929
 # FAST_MODEL=llama3.2:3b
 # EMBEDDING_MODEL=nomic-embed-text
-# LITELLM_ROUTING_STRATEGY=balanced
 #
 # ─── PRESET: Quality First (Best models, higher cost) ────────────────────────
 # EFFICIENCY_PRESET=quality
 # PRIMARY_MODEL=claude-opus-4-5-20251101
 # FAST_MODEL=claude-haiku-4-5-20251001
 # EMBEDDING_MODEL=voyage-code-3
 # EMBEDDING_PROVIDER=voyage
-# LITELLM_ROUTING_STRATEGY=quality_first
 #
 # ─────────────────────────────────────────────────────────────────────────────
 
 
@@ -178,7 +178,6 @@ jobs:
           # Set required environment variables
           export NEO4J_PASSWORD=test
           export REDIS_PASSWORD=test
-          export LITELLM_MASTER_KEY=sk-litellm-test
           export ANTHROPIC_API_KEY=""
           export OPENAI_API_KEY=""
 
 
@@ -17,8 +17,7 @@ An AI-native development environment that extends Claude Code with persistent me
 ├─────────────────────────────────────────────────────────────┤
 │  Infrastructure                                              │
 │  ├── Redis - Hot memory cache (port 6379)                   │
-│  ├── Neo4j - Knowledge graph (port 7687)                    │
-│  └── LiteLLM - Model routing (port 4000)                    │
+│  └── Neo4j - Knowledge graph (port 7474/7687)               │
 └─────────────────────────────────────────────────────────────┘
 ```
 
@@ -162,16 +161,6 @@ The memory system uses automatic tier promotion based on access patterns:
 
 **Automatic Promotion:** Documents accessed 5+ times are promoted to warm tier (Graphiti knowledge graph). Access tracking uses LRU eviction (max 10k entries) with Redis distributed tracking when available.
 
-### LiteLLM Router
-
-Intelligent model routing with cost optimization.
-
-**Configured Models:**
-- `claude-opus-4-5-20251101` - Complex reasoning
-- `claude-sonnet-4-5-20251101` - Main development
-- `gpt-4o` - Fallback/comparison
-- `ollama/llama3.2` - Local inference
-
 ## Configuration
 
 ### Directory Structure
@@ -180,11 +169,9 @@ Intelligent model routing with cost optimization.
 ~/.claude-code-pp/
 ├── config/
 │   ├── settings.yaml      # Main configuration
-│   ├── mcp-servers.json   # MCP server definitions
-│   └── litellm.yaml       # Model routing config
+│   └── mcp-servers.json   # MCP server definitions
 ├── memory/
 │   ├── sqlite/            # Metadata and FTS
-│   ├── lancedb/           # Vector embeddings
 │   └── vault/             # Obsidian-compatible notes
 ├── logs/
 └── cache/
@@ -242,7 +229,6 @@ docker-compose -f docker/docker-compose.yaml --profile local-llm up -d
 |---------|------|---------|
 | redis | 6379 | Hot memory cache |
 | neo4j | 7474/7687 | Knowledge graph (HTTP/Bolt) |
-| litellm | 4000 | Model routing |
 | playwright | 9222 | Browser automation (optional) |
 | ollama | 11434 | Local LLM (optional) |
 
@@ -274,15 +260,6 @@ docker-compose -f docker/docker-compose.yaml logs
 docker-compose -f docker/docker-compose.yaml restart redis
 ```
 
-### LiteLLM routing errors
-```bash
-# Test endpoint
-curl http://localhost:4000/health
-
-# Check configured models
-curl http://localhost:4000/v1/models
-```
-
 ## Development
 
 ### Building Swift Controller
 
@@ -10,7 +10,7 @@ Claude Code++ adds enterprise-grade capabilities to Claude Code through MCP (Mod
 - **Search MCP** - Multi-layer search (SQLite FTS → livegrep → Graphiti)
 - **System Controller** - macOS Accessibility API integration
 - **Research Environment** - Voice conversations + webcam whiteboard capture
-- **Infrastructure** - Docker-based services for Redis, Neo4j, and model routing
+- **Infrastructure** - Docker-based services for Redis and Neo4j
 
 ## Architecture
 
@@ -35,10 +35,10 @@ Claude Code++ adds enterprise-grade capabilities to Claude Code through MCP (Mod
 │  └──────────┘  └───────────┘  └───────────┘  └───────────────────┘           │
 │                                                                              │
 │  INFRASTRUCTURE                                                              │
-│  ┌──────────┐  ┌───────────┐  ┌───────────┐  ┌───────────────────┐           │
-│  │  Redis   │  │  Neo4j    │  │  SQLite   │  │  LiteLLM Router   │           │
-│  │  Cache   │  │  Graph DB │  │  Metadata │  │  Model routing    │           │
-│  └──────────┘  └───────────┘  └───────────┘  └───────────────────┘           │
+│  ┌──────────┐  ┌───────────┐  ┌───────────┐                                  │
+│  │  Redis   │  │  Neo4j    │  │  SQLite   │                                  │
+│  │  Cache   │  │  Graph DB │  │  Metadata │                                  │
+│  └──────────┘  └───────────┘  └───────────┘                                  │
 │                                                                              │
 └──────────────────────────────────────────────────────────────────────────────┘
 ```
@@ -209,8 +209,7 @@ docker-compose -f docker/docker-compose.yaml ps
 | Service | Port | Purpose |
 |---------|------|---------|
 | redis | 6379 | Hot memory cache |
-| neo4j | 7687 | Knowledge graph (Graphiti) |
-| litellm | 4000 | Model routing |
+| neo4j | 7474/7687 | Knowledge graph (Graphiti) |
 
 ## Research Environment