micro
diff --git a/README.md b/README.md
Lines changed: 4 additions & 42 deletions
diff --git a/admin/env.go b/admin/env.go
Lines changed: 1 addition & 6 deletions
diff --git a/ai/ai.go b/ai/ai.go
Lines changed: 1 addition & 4 deletions
diff --git a/ai/providers.go b/ai/providers.go
Lines changed: 8 additions & 211 deletions
@@ -140,59 +140,22 @@ export YOUTUBE_API_KEY=xxx
 
 #### Chat Model
 
-**Ollama (Default)**
-
-By default, Mu uses [Ollama](https://ollama.ai/) for LLM queries. Install and run Ollama locally:
-
-```
-# Install Ollama from https://ollama.ai/
-# Pull a model (e.g., llama3.2)
-ollama pull llama3.2
-
-# Ollama runs on http://localhost:11434 by default
-```
-
-Optional environment variables:
-```
-export MODEL_NAME=llama3.2              # Default model
-export MODEL_API_URL=http://localhost:11434  # Ollama API URL
-```
-
-**Fanar (Optional)**
-
-Alternatively, use [Fanar](https://fanar.qa/) by setting the API key:
-
-```
-export FANAR_API_KEY=xxx
-export FANAR_API_URL=https://api.fanar.qa  # Optional, this is the default
-```
-
-When `FANAR_API_KEY` is set, Mu will use Fanar instead of Ollama.
-
-**Note:** Fanar has a rate limit of 10 requests per minute. Mu enforces this limit automatically.
-
-**Anthropic Claude (Optional)**
-
-You can also use Anthropic's Claude API:
+Mu uses Anthropic Claude for all AI features:
 
 ```
 export ANTHROPIC_API_KEY=xxx
-export ANTHROPIC_MODEL=claude-haiku-4.5-20250311  # Optional, this is the default
+export ANTHROPIC_MODEL=claude-sonnet-4-20250514  # Optional, this is the default
 ```
 
-Priority order: Anthropic > Fanar > Ollama
-
-For vector search see this [doc](docs/VECTOR_SEARCH.md)
-
 ### Data Storage
 
-By default, Mu stores search index and embeddings in JSON files loaded into memory. For production use with large datasets, enable SQLite storage to reduce memory usage:
+By default, Mu stores the search index in JSON files loaded into memory. For production use, enable SQLite with FTS5 full-text search:
 
 ```
 export MU_USE_SQLITE=1
 ```
 
-This stores the search index and embeddings in SQLite (`~/.mu/data/index.db`) instead of RAM. Migration from JSON happens automatically on first startup.
+This stores the search index in SQLite (`~/.mu/data/index.db`) with FTS5 for fast full-text search. Migration from JSON happens automatically on first startup.
 
 ### Run
 
@@ -221,7 +184,6 @@ Full documentation is available in the [docs](docs/) folder and at `/docs` on an
 - [Wallet & Credits](docs/WALLET_AND_CREDITS.md) - Credit system for metered usage
 **Reference**
 - [Configuration](docs/ENVIRONMENT_VARIABLES.md) - All environment variables
-- [Vector Search](docs/VECTOR_SEARCH.md) - Semantic search setup
 - [API Reference](docs/API_COVERAGE.md) - REST API endpoints
 - [MCP Server](docs/MCP.md) - AI tool integration via MCP
 - [Screenshots](docs/SCREENSHOTS.md) - Application screenshots
 
@@ -17,14 +17,9 @@ var knownEnvVars = []string{
 	"MU_DOMAIN",
 	"MU_USE_SQLITE",
 	"DATA_DIR",
-	// LLM providers
+	// LLM
 	"ANTHROPIC_API_KEY",
 	"ANTHROPIC_MODEL",
-	"FANAR_API_KEY",
-	"FANAR_API_URL",
-	"OLLAMA_API_URL",
-	"MODEL_API_URL",
-	"MODEL_NAME",
 	// Search
 	"BRAVE_API_KEY",
 	// External APIs
 
@@ -1,5 +1,4 @@
-// Package ai provides LLM integration for the Mu platform.
-// It supports multiple providers: Anthropic Claude, Fanar, and Ollama.
+// Package ai provides LLM integration for the Mu platform via Anthropic Claude.
 package ai
 
 import (
@@ -29,8 +28,6 @@ type History []Message
 const (
 	ProviderDefault   = ""          // Use configured default
 	ProviderAnthropic = "anthropic" // Force Anthropic Claude
-	ProviderFanar     = "fanar"     // Force Fanar
-	ProviderOllama    = "ollama"    // Force Ollama
 )
 
 // Prompt represents a request to the LLM
 
@@ -20,11 +20,6 @@ var (
 	llmSemaphore = semaphore.NewWeighted(5)
 	llmTimeout   = 60 * time.Second
 
-	// Rate limiter for Fanar API
-	fanarRateMu     sync.Mutex
-	fanarLastMinute []time.Time
-	fanarMaxPerMin  = 35
-
 	// Anthropic cache stats
 	cacheStatsMu        sync.Mutex
 	cacheHits           int
@@ -62,169 +57,20 @@ func generate(prompt *Prompt) (string, error) {
 
 	messages = append(messages, map[string]string{"role": "user", "content": prompt.Question})
 
-	// Check for forced provider
-	if prompt.Provider == ProviderAnthropic {
-		if key := os.Getenv("ANTHROPIC_API_KEY"); key != "" {
-			model := prompt.Model
-			if model == "" {
-				model = os.Getenv("ANTHROPIC_MODEL")
-			}
-			if model == "" {
-				model = "claude-sonnet-4-20250514"
-			}
-			return generateAnthropic(key, model, systemPromptText, messages)
-		}
-		return "", fmt.Errorf("anthropic provider requested but ANTHROPIC_API_KEY not set")
-	}
-
-	if prompt.Provider == ProviderFanar {
-		if key := os.Getenv("FANAR_API_KEY"); key != "" {
-			url := os.Getenv("FANAR_API_URL")
-			if url == "" {
-				url = "https://api.fanar.qa"
-			}
-			return generateFanar(url, key, messages, prompt.Priority)
-		}
-		return "", fmt.Errorf("fanar provider requested but FANAR_API_KEY not set")
+	key := os.Getenv("ANTHROPIC_API_KEY")
+	if key == "" {
+		return "", fmt.Errorf("ANTHROPIC_API_KEY not set")
 	}
 
-	if prompt.Provider == ProviderOllama {
-		model := os.Getenv("MODEL_NAME")
-		if model == "" {
-			model = "llama3.2"
-		}
-		url := os.Getenv("MODEL_API_URL")
-		if url == "" {
-			url = "http://localhost:11434"
-		}
-		return generateOllama(url, model, messages)
-	}
-
-	// Default provider priority: Anthropic > Fanar > Ollama
-	// (Anthropic first for quality, Fanar as fallback for Arabic/cultural content)
-	if key := os.Getenv("ANTHROPIC_API_KEY"); key != "" {
-		model := os.Getenv("ANTHROPIC_MODEL")
-		if model == "" {
-			model = "claude-sonnet-4-20250514"
-		}
-		return generateAnthropic(key, model, systemPromptText, messages)
-	}
-
-	if key := os.Getenv("FANAR_API_KEY"); key != "" {
-		url := os.Getenv("FANAR_API_URL")
-		if url == "" {
-			url = "https://api.fanar.qa"
-		}
-		return generateFanar(url, key, messages, prompt.Priority)
-	}
-
-	// Default to Ollama
-	model := os.Getenv("MODEL_NAME")
+	model := prompt.Model
 	if model == "" {
-		model = "llama3.2"
-	}
-	url := os.Getenv("MODEL_API_URL")
-	if url == "" {
-		url = "http://localhost:11434"
-	}
-	return generateOllama(url, model, messages)
-}
-
-func generateOllama(apiURL, model string, messages []map[string]string) (string, error) {
-	app.Log("ai", "[LLM] Using Ollama at %s with model %s", apiURL, model)
-
-	req := map[string]interface{}{
-		"model":    model,
-		"messages": messages,
-		"stream":   false,
+		model = os.Getenv("ANTHROPIC_MODEL")
 	}
-
-	body, _ := json.Marshal(req)
-	httpReq, _ := http.NewRequest("POST", apiURL+"/api/chat", bytes.NewReader(body))
-	httpReq.Header.Set("Content-Type", "application/json")
-
-	client := &http.Client{Timeout: llmTimeout}
-	resp, err := client.Do(httpReq)
-	if err != nil {
-		return "", fmt.Errorf("failed to connect to Ollama: %v", err)
-	}
-	defer resp.Body.Close()
-
-	respBody, _ := io.ReadAll(resp.Body)
-
-	var result struct {
-		Message struct {
-			Content string `json:"content"`
-		} `json:"message"`
-		Error string `json:"error"`
-	}
-	json.Unmarshal(respBody, &result)
-
-	if result.Error != "" {
-		return "", fmt.Errorf("ollama error: %s", result.Error)
-	}
-	return result.Message.Content, nil
-}
-
-func generateFanar(apiURL, apiKey string, messages []map[string]string, priority int) (string, error) {
-	if !checkFanarRateLimit(priority) {
-		maxWait := 3
-		if priority == PriorityHigh {
-			maxWait = 15
-		} else if priority == PriorityMedium {
-			maxWait = 8
-		}
-
-		app.Log("ai", "[LLM] Fanar rate limit reached (priority %d), waiting...", priority)
-		for i := 0; i < maxWait; i++ {
-			time.Sleep(time.Second)
-			if checkFanarRateLimit(priority) {
-				break
-			}
-			if i == maxWait-1 {
-				return "", fmt.Errorf("fanar rate limit exceeded")
-			}
-		}
-	}
-
-	app.Log("ai", "[LLM] Using Fanar at %s", apiURL)
-
-	req := map[string]interface{}{
-		"model":    "Fanar",
-		"messages": messages,
-	}
-	body, _ := json.Marshal(req)
-
-	httpReq, _ := http.NewRequest("POST", apiURL+"/v1/chat/completions", bytes.NewReader(body))
-	httpReq.Header.Set("Content-Type", "application/json")
-	httpReq.Header.Set("Authorization", "Bearer "+apiKey)
-
-	client := &http.Client{Timeout: llmTimeout}
-	resp, err := client.Do(httpReq)
-	if err != nil {
-		return "", fmt.Errorf("fanar API request failed: %v", err)
-	}
-	defer resp.Body.Close()
-
-	respBody, _ := io.ReadAll(resp.Body)
-
-	var result struct {
-		Choices []struct {
-			Message struct {
-				Content string `json:"content"`
-			} `json:"message"`
-		} `json:"choices"`
-		Error interface{} `json:"error"`
+	if model == "" {
+		model = "claude-sonnet-4-20250514"
 	}
-	json.Unmarshal(respBody, &result)
 
-	if result.Error != nil {
-		return "", fmt.Errorf("%v", result.Error)
-	}
-	if len(result.Choices) > 0 {
-		return result.Choices[0].Message.Content, nil
-	}
-	return "", nil
+	return generateAnthropic(key, model, systemPromptText, messages)
 }
 
 func generateAnthropic(apiKey, model, systemPrompt string, messages []map[string]string) (string, error) {
@@ -321,55 +167,6 @@ func generateAnthropic(apiKey, model, systemPrompt string, messages []map[string
 	return content, nil
 }
 
-func checkFanarRateLimit(priority int) bool {
-	fanarRateMu.Lock()
-	defer fanarRateMu.Unlock()
-
-	now := time.Now()
-	cutoff := now.Add(-time.Minute)
-
-	var recent []time.Time
-	for _, t := range fanarLastMinute {
-		if t.After(cutoff) {
-			recent = append(recent, t)
-		}
-	}
-	fanarLastMinute = recent
-
-	var maxForPriority int
-	switch priority {
-	case PriorityHigh:
-		maxForPriority = fanarMaxPerMin
-	case PriorityMedium:
-		maxForPriority = 25
-	default:
-		maxForPriority = 15
-	}
-
-	if len(fanarLastMinute) >= maxForPriority {
-		return false
-	}
-
-	fanarLastMinute = append(fanarLastMinute, now)
-	return true
-}
-
-// GetFanarRateStatus returns current rate limit status
-func GetFanarRateStatus() (used, max int) {
-	fanarRateMu.Lock()
-	defer fanarRateMu.Unlock()
-
-	now := time.Now()
-	cutoff := now.Add(-time.Minute)
-	count := 0
-	for _, t := range fanarLastMinute {
-		if t.After(cutoff) {
-			count++
-		}
-	}
-	return count, fanarMaxPerMin
-}
-
 // GetCacheStats returns Anthropic prompt cache statistics
 func GetCacheStats() (hits, misses, readTokens, creationTokens int) {
 	cacheStatsMu.Lock()