diff --git a/.idea/copilotDiffState.xml b/.idea/copilotDiffState.xml
new file mode 100644
index 0000000..fc8074a
--- /dev/null
+++ b/.idea/copilotDiffState.xml
@@ -0,0 +1,18 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<project version="4">
+  <component name="CopilotDiffPersistence">
+    <option name="pendingDiffs">
+      <map>
+        <entry key="$PROJECT_DIR$/llm.go">
+          <value>
+            <PendingDiffInfo>
+              <option name="filePath" value="$PROJECT_DIR$/llm.go" />
+              <option name="originalContent" value="package main&#10;&#10;import (&#10;&#9;&quot;bytes&quot;&#10;&#9;&quot;context&quot;&#10;&#9;&quot;encoding/json&quot;&#10;&#9;&quot;fmt&quot;&#10;&#9;&quot;io&quot;&#10;&#9;&quot;net/http&quot;&#10;&#9;&quot;strings&quot;&#10;&#9;&quot;text/template&quot;&#10;&#10;&#9;&quot;github.com/sirupsen/logrus&quot;&#10;)&#10;&#10;// LLMClient abstracts LLM API calls&#10;type LLMClient struct {&#10;&#9;APIKey  string&#10;&#9;BaseURL string&#10;&#9;Model   string&#10;}&#10;&#10;// NewLLMClient constructs a new LLMClient with the given API key and base URL&#10;func NewLLMClient(apiKey, baseURL string, model string) *LLMClient {&#10;&#9;return &amp;LLMClient{&#10;&#9;&#9;APIKey:  apiKey,&#10;&#9;&#9;BaseURL: baseURL,&#10;&#9;&#9;Model:   model,&#10;&#9;}&#10;}&#10;&#10;// renderPrompt renders a Go template with the given data&#10;func renderPrompt(tmplStr string, data any) (string, error) {&#10;&#9;tmpl, err := template.New(&quot;&quot;).Parse(tmplStr)&#10;&#9;if err != nil {&#10;&#9;&#9;return &quot;&quot;, err&#10;&#9;}&#10;&#9;var buf bytes.Buffer&#10;&#9;if err := tmpl.Execute(&amp;buf, data); err != nil {&#10;&#9;&#9;return &quot;&quot;, err&#10;&#9;}&#10;&#9;return buf.String(), nil&#10;}&#10;&#10;// ExtractKeywords calls LLM to extract keywords from user message&#10;func (llm *LLMClient) ExtractKeywords(ctx context.Context, message string) (map[string]interface{}, error) {&#10;&#9;prompt, err := renderPrompt(appConfig.LLM.ExtractKeywordsPrompt, map[string]string{&quot;Message&quot;: message})&#10;&#9;if err != nil {&#10;&#9;&#9;logrus.WithError(err).Error(&quot;[CONFIG] Failed to render ExtractKeywords prompt&quot;)&#10;&#9;&#9;return nil, err&#10;&#9;}&#10;&#9;logrus.WithField(&quot;prompt&quot;, prompt).Info(&quot;[LLM] ExtractKeywords prompt&quot;)&#10;&#9;format := map[string]interface{}{&#10;&#9;&#9;&quot;type&quot;: &quot;object&quot;,&#10;&#9;&#9;&quot;properties&quot;: 
map[string]interface{}{&#10;&#9;&#9;&#9;&quot;translate&quot;: map[string]interface{}{&quot;type&quot;: &quot;string&quot;},&#10;&#9;&#9;&#9;&quot;keyword&quot;:   map[string]interface{}{&quot;type&quot;: &quot;array&quot;, &quot;items&quot;: map[string]interface{}{&quot;type&quot;: &quot;string&quot;}},&#10;&#9;&#9;&#9;&quot;animal&quot;:    map[string]interface{}{&quot;type&quot;: &quot;string&quot;},&#10;&#9;&#9;},&#10;&#9;&#9;&quot;required&quot;: []string{&quot;translate&quot;, &quot;keyword&quot;, &quot;animal&quot;},&#10;&#9;}&#10;&#9;resp, err := llm.openAICompletion(ctx, prompt, format)&#10;&#9;logrus.WithFields(logrus.Fields{&quot;response&quot;: resp, &quot;err&quot;: err}).Info(&quot;[LLM] ExtractKeywords response&quot;)&#10;&#9;if err != nil {&#10;&#9;&#9;return nil, err&#10;&#9;}&#10;&#9;var result map[string]interface{}&#10;&#9;if err := json.Unmarshal([]byte(resp), &amp;result); err != nil {&#10;&#9;&#9;return nil, err&#10;&#9;}&#10;&#9;return result, nil&#10;}&#10;&#10;// DisambiguateBestMatch calls LLM to pick best match from candidates&#10;func (llm *LLMClient) DisambiguateBestMatch(ctx context.Context, message string, candidates []Visit) (string, error) {&#10;&#9;format := map[string]interface{}{&#10;&#9;&#9;&quot;type&quot;: &quot;object&quot;,&#10;&#9;&#9;&quot;properties&quot;: map[string]interface{}{&#10;&#9;&#9;&#9;&quot;visitReason&quot;: map[string]interface{}{&quot;type&quot;: &quot;string&quot;},&#10;&#9;&#9;},&#10;&#9;&#9;&quot;required&quot;: []string{&quot;visitReason&quot;},&#10;&#9;}&#10;&#9;entries, _ := json.Marshal(candidates)&#10;&#9;prompt, err := renderPrompt(appConfig.LLM.DisambiguatePrompt, map[string]string{&quot;Entries&quot;: string(entries), &quot;Message&quot;: message})&#10;&#9;if err != nil {&#10;&#9;&#9;logrus.WithError(err).Error(&quot;[CONFIG] Failed to render Disambiguate prompt&quot;)&#10;&#9;&#9;return &quot;&quot;, err&#10;&#9;}&#10;&#9;logrus.WithField(&quot;prompt&quot;, prompt).Info(&quot;[LLM] 
DisambiguateBestMatch prompt&quot;)&#10;&#9;resp, err := llm.openAICompletion(ctx, prompt, format)&#10;&#9;logrus.WithFields(logrus.Fields{&quot;response&quot;: resp, &quot;err&quot;: err}).Info(&quot;[LLM] DisambiguateBestMatch response&quot;)&#10;&#9;if err != nil {&#10;&#9;&#9;return &quot;&quot;, err&#10;&#9;}&#10;&#9;var parsed map[string]string&#10;&#9;if err := json.Unmarshal([]byte(resp), &amp;parsed); err != nil {&#10;&#9;&#9;return &quot;&quot;, fmt.Errorf(&quot;failed to unmarshal disambiguation response: %w&quot;, err)&#10;&#9;}&#10;&#10;&#9;visitReason := strings.TrimSpace(parsed[&quot;visitReason&quot;])&#10;&#9;if visitReason == &quot;&quot; {&#10;&#9;&#9;return &quot;&quot;, fmt.Errorf(&quot;visitReason not found in response&quot;)&#10;&#9;}&#10;&#10;&#9;return visitReason, nil&#10;}&#10;&#10;// openAICompletion now supports both Ollama (default local) and OpenRouter/OpenAI-compatible APIs without external branching.&#10;// It auto-detects by inspecting the BaseURL. If the URL contains &quot;openrouter.ai&quot; or &quot;/v1/&quot;, it assumes OpenAI-style.&#10;func (llm *LLMClient) openAICompletion(ctx context.Context, prompt string, format map[string]interface{}) (string, error) {&#10;&#9;apiURL := llm.BaseURL&#10;&#9;if apiURL == &quot;&quot; {&#10;&#9;&#9;// Default to Ollama local chat endpoint&#10;&#9;&#9;apiURL = &quot;http://localhost:11434/api/chat&quot;&#10;&#9;}&#10;&#10;&#9;isOpenAIStyle := strings.Contains(apiURL, &quot;openrouter.ai&quot;) || strings.Contains(apiURL, &quot;/v1/&quot;)&#10;&#10;&#9;// Helper to stringify the expected JSON schema for instructions&#10;&#9;schemaDesc := func() string {&#10;&#9;&#9;b, _ := json.MarshalIndent(format, &quot;&quot;, &quot;  &quot;)&#10;&#9;&#9;return string(b)&#10;&#9;}&#10;&#10;&#9;buildBody := func(useJSONSchema bool) map[string]interface{} {&#10;&#9;&#9;if isOpenAIStyle {&#10;&#9;&#9;&#9;// For OpenAI style we send system + user messages; use response_format type json_object (schema variant 
often unsupported on some providers)&#10;&#9;&#9;&#9;rfType := &quot;json_object&quot;&#10;&#9;&#9;&#9;if useJSONSchema {&#10;&#9;&#9;&#9;&#9;// We attempt json_schema only if explicitly requested; default false.&#10;&#9;&#9;&#9;&#9;rfType = &quot;json_schema&quot;&#10;&#9;&#9;&#9;}&#10;&#9;&#9;&#9;body := map[string]interface{}{&#10;&#9;&#9;&#9;&#9;&quot;model&quot;: llm.Model,&#10;&#9;&#9;&#9;&#9;&quot;messages&quot;: []map[string]string{&#10;&#9;&#9;&#9;&#9;&#9;{&quot;role&quot;: &quot;system&quot;, &quot;content&quot;: &quot;You are a strict JSON generator. ONLY output valid JSON matching this schema: &quot; + schemaDesc() + &quot; Do not add explanations.&quot;},&#10;&#9;&#9;&#9;&#9;&#9;{&quot;role&quot;: &quot;user&quot;, &quot;content&quot;: prompt},&#10;&#9;&#9;&#9;&#9;},&#10;&#9;&#9;&#9;&#9;&quot;response_format&quot;: map[string]interface{}{&quot;type&quot;: rfType},&#10;&#9;&#9;&#9;}&#10;&#9;&#9;&#9;if rfType == &quot;json_schema&quot; {&#10;&#9;&#9;&#9;&#9;body[&quot;response_format&quot;] = map[string]interface{}{&#10;&#9;&#9;&#9;&#9;&#9;&quot;type&quot;: &quot;json_schema&quot;,&#10;&#9;&#9;&#9;&#9;&#9;&quot;json_schema&quot;: map[string]interface{}{&#10;&#9;&#9;&#9;&#9;&#9;&#9;&quot;name&quot;:   &quot;structured_output&quot;,&#10;&#9;&#9;&#9;&#9;&#9;&#9;&quot;schema&quot;: format,&#10;&#9;&#9;&#9;&#9;&#9;},&#10;&#9;&#9;&#9;&#9;}&#10;&#9;&#9;&#9;}&#10;&#9;&#9;&#9;return body&#10;&#9;&#9;}&#10;&#9;&#9;// Ollama style&#10;&#9;&#9;return map[string]interface{}{&#10;&#9;&#9;&#9;&quot;model&quot;:    llm.Model,&#10;&#9;&#9;&#9;&quot;messages&quot;: []map[string]string{{&quot;role&quot;: &quot;user&quot;, &quot;content&quot;: prompt}},&#10;&#9;&#9;&#9;&quot;stream&quot;:   false,&#10;&#9;&#9;&#9;&quot;format&quot;:   format,&#10;&#9;&#9;}&#10;&#9;}&#10;&#10;&#9;// First attempt (json_object for OpenAI style)&#10;&#9;useJSONSchemaAttempt := false&#10;&#9;body := buildBody(useJSONSchemaAttempt)&#10;&#10;&#9;doRequest := func(body map[string]interface{}) (raw 
[]byte, status int, err error) {&#10;&#9;&#9;jsonBody, _ := json.Marshal(body)&#10;&#9;&#9;logrus.WithFields(logrus.Fields{&quot;api_url&quot;: apiURL, &quot;prompt&quot;: prompt, &quot;is_openai_style&quot;: isOpenAIStyle, &quot;json_schema&quot;: body[&quot;response_format&quot;]}).Info(&quot;[LLM] completion POST&quot;)&#10;&#9;&#9;req, _ := http.NewRequestWithContext(ctx, http.MethodPost, apiURL, bytes.NewBuffer(jsonBody))&#10;&#9;&#9;if llm.APIKey != &quot;&quot; {&#10;&#9;&#9;&#9;req.Header.Set(&quot;Authorization&quot;, &quot;Bearer &quot;+llm.APIKey)&#10;&#9;&#9;}&#10;&#9;&#9;req.Header.Set(&quot;Content-Type&quot;, &quot;application/json&quot;)&#10;&#9;&#9;if strings.Contains(apiURL, &quot;openrouter.ai&quot;) {&#10;&#9;&#9;&#9;// Correct standard header field name is Referer&#10;&#9;&#9;&#9;req.Header.Set(&quot;Referer&quot;, &quot;https://github.com/&quot;)&#10;&#9;&#9;&#9;req.Header.Set(&quot;X-Title&quot;, &quot;vetrag-app&quot;)&#10;&#9;&#9;}&#10;&#9;&#9;client := &amp;http.Client{}&#10;&#9;&#9;resp, err := client.Do(req)&#10;&#9;&#9;if err != nil {&#10;&#9;&#9;&#9;return nil, 0, err&#10;&#9;&#9;}&#10;&#9;&#9;defer resp.Body.Close()&#10;&#9;&#9;raw, rerr := io.ReadAll(resp.Body)&#10;&#9;&#9;return raw, resp.StatusCode, rerr&#10;&#9;}&#10;&#10;&#9;raw, status, err := doRequest(body)&#10;&#9;if err != nil {&#10;&#9;&#9;logrus.WithError(err).Error(&quot;[LLM] completion HTTP error&quot;)&#10;&#9;&#9;return &quot;&quot;, err&#10;&#9;}&#10;&#9;logrus.WithFields(logrus.Fields{&quot;status&quot;: status, &quot;raw&quot;: string(raw)}).Debug(&quot;[LLM] completion raw response&quot;)&#10;&#10;&#9;// If OpenAI style and provider specifically complains wanting json / json_object etc and we tried json_schema (future path), fallback handled below.&#10;&#9;if isOpenAIStyle &amp;&amp; status &gt;= 400 {&#10;&#9;&#9;// Detect unsupported json_schema (if we ever attempted it) or response_format issues and retry without schema if not already 
json_object.&#10;&#9;&#9;if strings.Contains(string(raw), &quot;response_format&quot;) &amp;&amp; strings.Contains(string(raw), &quot;json_schema&quot;) &amp;&amp; useJSONSchemaAttempt {&#10;&#9;&#9;&#9;logrus.Warn(&quot;[LLM] json_schema rejected; retrying with json_object&quot;)&#10;&#9;&#9;&#9;useJSONSchemaAttempt = false&#10;&#9;&#9;&#9;body = buildBody(false)&#10;&#9;&#9;&#9;raw, status, err = doRequest(body)&#10;&#9;&#9;&#9;if err != nil {&#10;&#9;&#9;&#9;&#9;return &quot;&quot;, fmt.Errorf(&quot;retry after json_schema failure: %w&quot;, err)&#10;&#9;&#9;&#9;}&#10;&#9;&#9;&#9;logrus.WithFields(logrus.Fields{&quot;status&quot;: status, &quot;raw&quot;: string(raw)}).Debug(&quot;[LLM] completion raw response (retry)&quot;)&#10;&#9;&#9;}&#10;&#9;&#9;// If still error, surface provider error below on unmarshal path.&#10;&#9;}&#10;&#10;&#9;// Attempt Ollama format parse&#10;&#9;var ollama struct {&#10;&#9;&#9;Message struct {&#10;&#9;&#9;&#9;Content string `json:&quot;content&quot;`&#10;&#9;&#9;} `json:&quot;message&quot;`&#10;&#9;&#9;Error string `json:&quot;error&quot;`&#10;&#9;&#9;} `json:&quot;message&quot;`&#10;&#9;&#9;Error string `json:&quot;error&quot;`&#10;&#9;}&#10;&#9;if err := json.Unmarshal(raw, &amp;ollama); err == nil &amp;&amp; ollama.Message.Content != &quot;&quot; {&#10;&#9;&#9;return ollama.Message.Content, nil&#10;&#9;// OpenAI style parse&#10;&#10;&#9;&#9;Choices []struct {&#10;&#9;&#9;&#9;Message struct {&#10;&#9;&#9;&#9;&#9;Content string `json:&quot;content&quot;`&#10;&#9;&#9;&#9;} `json:&quot;message&quot;`&#10;&#9;&#9;} `json:&quot;choices&quot;`&#10;&#9;&#9;Error *struct {&#10;&#9;&#9;&#9;Message string `json:&quot;message&quot;`&#10;&#9;&#9;&#9;Type    string `json:&quot;type&quot;`&#10;&#9;&#9;} `json:&quot;error&quot;`&#10;&#9;&#9;Choices []struct {&#10;&#9;&#9;&#9;Message struct {&#10;&#9;&#9;&#9;&#9;Content string `json:&quot;content&quot;`&#10;&#9;&#9;&#9;} `json:&quot;message&quot;`&#10;&#9;&#9;} 
`json:&quot;choices&quot;`&#10;&#9;&#9;Error *struct {&#10;&#9;&#9;&#9;Message string `json:&quot;message&quot;`&#10;&#9;&#9;&#9;Type    string `json:&quot;type&quot;`&#10;&#9;&#9;} `json:&quot;error&quot;`&#10;&#9;}&#10;&#9;if err := json.Unmarshal(raw, &amp;openAI); err == nil {&#10;&#9;&#9;if openAI.Error != nil || status &gt;= 400 {&#10;&#9;&#9;&#9;var msg string&#10;&#9;&#9;&#9;if openAI.Error != nil {&#10;&#9;&#9;&#9;&#9;msg = openAI.Error.Message&#10;&#9;&#9;&#9;} else {&#10;&#9;&#9;&#9;&#9;msg = string(raw)&#10;&#9;&#9;&#9;}&#10;&#9;&#9;&#9;return &quot;&quot;, fmt.Errorf(&quot;provider error: %s&quot;, msg)&#10;&#9;&#9;}&#10;&#9;&#9;if len(openAI.Choices) &gt; 0 &amp;&amp; openAI.Choices[0].Message.Content != &quot;&quot; {&#10;&#9;&#9;&#9;return openAI.Choices[0].Message.Content, nil&#10;&#9;&#9;}&#10;&#9;}&#10;&#10;&#9;return &quot;&quot;, fmt.Errorf(&quot;unrecognized LLM response format: %.200s&quot;, string(raw))&#10;}&#10;&#10;// LLMClientAPI allows mocking LLMClient in other places&#10;// Only public methods should be included&#10;&#10;type LLMClientAPI interface {&#10;&#9;ExtractKeywords(ctx context.Context, message string) (map[string]interface{}, error)&#10;&#9;DisambiguateBestMatch(ctx context.Context, message string, candidates []Visit) (string, error)&#10;}&#10;&#10;var _ LLMClientAPI = (*LLMClient)(nil)&#10;" />
+              <option name="updatedContent" value="package main&#10;&#10;import (&#10;&#9;&quot;bytes&quot;&#10;&#9;&quot;context&quot;&#10;&#9;&quot;encoding/json&quot;&#10;&#9;&quot;fmt&quot;&#10;&#9;&quot;io&quot;&#10;&#9;&quot;net/http&quot;&#10;&#9;&quot;strings&quot;&#10;&#9;&quot;text/template&quot;&#10;&#9;&quot;time&quot;&#10;&#10;&#9;&quot;github.com/sirupsen/logrus&quot;&#10;)&#10;&#10;// LLMClient abstracts LLM API calls&#10;type LLMClient struct {&#10;&#9;APIKey  string&#10;&#9;BaseURL string&#10;&#9;Model   string&#10;}&#10;&#10;// NewLLMClient constructs a new LLMClient with the given API key and base URL&#10;func NewLLMClient(apiKey, baseURL string, model string) *LLMClient {&#10;&#9;return &amp;LLMClient{&#10;&#9;&#9;APIKey:  apiKey,&#10;&#9;&#9;BaseURL: baseURL,&#10;&#9;&#9;Model:   model,&#10;&#9;}&#10;}&#10;&#10;// renderPrompt renders a Go template with the given data&#10;func renderPrompt(tmplStr string, data any) (string, error) {&#10;&#9;tmpl, err := template.New(&quot;&quot;).Parse(tmplStr)&#10;&#9;if err != nil {&#10;&#9;&#9;return &quot;&quot;, err&#10;&#9;}&#10;&#9;var buf bytes.Buffer&#10;&#9;if err := tmpl.Execute(&amp;buf, data); err != nil {&#10;&#9;&#9;return &quot;&quot;, err&#10;&#9;}&#10;&#9;return buf.String(), nil&#10;}&#10;&#10;// ExtractKeywords calls LLM to extract keywords from user message&#10;func (llm *LLMClient) ExtractKeywords(ctx context.Context, message string) (map[string]interface{}, error) {&#10;&#9;prompt, err := renderPrompt(appConfig.LLM.ExtractKeywordsPrompt, map[string]string{&quot;Message&quot;: message})&#10;&#9;if err != nil {&#10;&#9;&#9;logrus.WithError(err).Error(&quot;[CONFIG] Failed to render ExtractKeywords prompt&quot;)&#10;&#9;&#9;return nil, err&#10;&#9;}&#10;&#9;logrus.WithField(&quot;prompt&quot;, prompt).Info(&quot;[LLM] ExtractKeywords prompt&quot;)&#10;&#9;format := map[string]interface{}{&#10;&#9;&#9;&quot;type&quot;: &quot;object&quot;,&#10;&#9;&#9;&quot;properties&quot;: 
map[string]interface{}{&#10;&#9;&#9;&#9;&quot;translate&quot;: map[string]interface{}{&quot;type&quot;: &quot;string&quot;},&#10;&#9;&#9;&#9;&quot;keyword&quot;:   map[string]interface{}{&quot;type&quot;: &quot;array&quot;, &quot;items&quot;: map[string]interface{}{&quot;type&quot;: &quot;string&quot;}},&#10;&#9;&#9;&#9;&quot;animal&quot;:    map[string]interface{}{&quot;type&quot;: &quot;string&quot;},&#10;&#9;&#9;},&#10;&#9;&#9;&quot;required&quot;: []string{&quot;translate&quot;, &quot;keyword&quot;, &quot;animal&quot;},&#10;&#9;}&#10;&#9;resp, err := llm.openAICompletion(ctx, prompt, format)&#10;&#9;logrus.WithFields(logrus.Fields{&quot;response&quot;: resp, &quot;err&quot;: err}).Info(&quot;[LLM] ExtractKeywords response&quot;)&#10;&#9;if err != nil {&#10;&#9;&#9;return nil, err&#10;&#9;}&#10;&#9;var result map[string]interface{}&#10;&#9;if err := json.Unmarshal([]byte(resp), &amp;result); err != nil {&#10;&#9;&#9;return nil, err&#10;&#9;}&#10;&#9;return result, nil&#10;}&#10;&#10;// DisambiguateBestMatch calls LLM to pick best match from candidates&#10;func (llm *LLMClient) DisambiguateBestMatch(ctx context.Context, message string, candidates []Visit) (string, error) {&#10;&#9;format := map[string]interface{}{&#10;&#9;&#9;&quot;type&quot;: &quot;object&quot;,&#10;&#9;&#9;&quot;properties&quot;: map[string]interface{}{&#10;&#9;&#9;&#9;&quot;visitReason&quot;: map[string]interface{}{&quot;type&quot;: &quot;string&quot;},&#10;&#9;&#9;},&#10;&#9;&#9;&quot;required&quot;: []string{&quot;visitReason&quot;},&#10;&#9;}&#10;&#9;entries, _ := json.Marshal(candidates)&#10;&#9;prompt, err := renderPrompt(appConfig.LLM.DisambiguatePrompt, map[string]string{&quot;Entries&quot;: string(entries), &quot;Message&quot;: message})&#10;&#9;if err != nil {&#10;&#9;&#9;logrus.WithError(err).Error(&quot;[CONFIG] Failed to render Disambiguate prompt&quot;)&#10;&#9;&#9;return &quot;&quot;, err&#10;&#9;}&#10;&#9;logrus.WithField(&quot;prompt&quot;, prompt).Info(&quot;[LLM] 
DisambiguateBestMatch prompt&quot;)&#10;&#9;resp, err := llm.openAICompletion(ctx, prompt, format)&#10;&#9;logrus.WithFields(logrus.Fields{&quot;response&quot;: resp, &quot;err&quot;: err}).Info(&quot;[LLM] DisambiguateBestMatch response&quot;)&#10;&#9;if err != nil {&#10;&#9;&#9;return &quot;&quot;, err&#10;&#9;}&#10;&#9;var parsed map[string]string&#10;&#9;if err := json.Unmarshal([]byte(resp), &amp;parsed); err != nil {&#10;&#9;&#9;return &quot;&quot;, fmt.Errorf(&quot;failed to unmarshal disambiguation response: %w&quot;, err)&#10;&#9;}&#10;&#10;&#9;visitReason := strings.TrimSpace(parsed[&quot;visitReason&quot;])&#10;&#9;if visitReason == &quot;&quot; {&#10;&#9;&#9;return &quot;&quot;, fmt.Errorf(&quot;visitReason not found in response&quot;)&#10;&#9;}&#10;&#10;&#9;return visitReason, nil&#10;}&#10;&#10;// openAICompletion now supports both Ollama (default local) and OpenRouter/OpenAI-compatible APIs without external branching.&#10;// It auto-detects by inspecting the BaseURL. If the URL contains &quot;openrouter.ai&quot; or &quot;/v1/&quot;, it assumes OpenAI-style.&#10;func (llm *LLMClient) openAICompletion(ctx context.Context, prompt string, format map[string]interface{}) (string, error) {&#10;&#9;apiURL := llm.BaseURL&#10;&#9;if apiURL == &quot;&quot; {&#10;&#9;&#9;// Default to Ollama local chat endpoint&#10;&#9;&#9;apiURL = &quot;http://localhost:11434/api/chat&quot;&#10;&#9;}&#10;&#10;&#9;isOpenAIStyle := strings.Contains(apiURL, &quot;openrouter.ai&quot;) || strings.Contains(apiURL, &quot;/v1/&quot;)&#10;&#10;&#9;// Helper to stringify the expected JSON schema for instructions&#10;&#9;schemaDesc := func() string {&#10;&#9;&#9;b, _ := json.MarshalIndent(format, &quot;&quot;, &quot;  &quot;)&#10;&#9;&#9;return string(b)&#10;&#9;}&#10;&#10;&#9;truncate := func(s string, n int) string {&#10;&#9;&#9;if len(s) &lt;= n {&#10;&#9;&#9;&#9;return s&#10;&#9;&#9;}&#10;&#9;&#9;return s[:n] + &quot;...&lt;truncated&gt;&quot;&#10;&#9;}&#10;&#10;&#9;buildBody := 
func() map[string]interface{} {&#10;&#9;&#9;if isOpenAIStyle {&#10;&#9;&#9;&#9;return map[string]interface{}{&#10;&#9;&#9;&#9;&#9;&quot;model&quot;: llm.Model,&#10;&#9;&#9;&#9;&#9;&quot;messages&quot;: []map[string]string{&#10;&#9;&#9;&#9;&#9;&#9;{&quot;role&quot;: &quot;system&quot;, &quot;content&quot;: &quot;You are a strict JSON generator. ONLY output valid JSON matching this schema: &quot; + schemaDesc() + &quot; Do not add explanations.&quot;},&#10;&#9;&#9;&#9;&#9;&#9;{&quot;role&quot;: &quot;user&quot;, &quot;content&quot;: prompt},&#10;&#9;&#9;&#9;&#9;},&#10;&#9;&#9;&#9;&#9;&quot;response_format&quot;: map[string]interface{}{&quot;type&quot;: &quot;json_object&quot;},&#10;&#9;&#9;&#9;}&#10;&#9;&#9;}&#10;&#9;&#9;// Ollama style&#10;&#9;&#9;return map[string]interface{}{&#10;&#9;&#9;&#9;&quot;model&quot;:    llm.Model,&#10;&#9;&#9;&#9;&quot;messages&quot;: []map[string]string{{&quot;role&quot;: &quot;user&quot;, &quot;content&quot;: prompt}},&#10;&#9;&#9;&#9;&quot;stream&quot;:   false,&#10;&#9;&#9;&#9;&quot;format&quot;:   format,&#10;&#9;&#9;}&#10;&#9;}&#10;&#10;&#9;body := buildBody()&#10;&#10;&#9;doRequest := func(body map[string]interface{}) (raw []byte, status int, err error, dur time.Duration) {&#10;&#9;&#9;jsonBody, _ := json.Marshal(body)&#10;&#9;&#9;bodySize := len(jsonBody)&#10;&#9;&#9;logrus.WithFields(logrus.Fields{&#10;&#9;&#9;&#9;&quot;event&quot;:           &quot;llm_request&quot;,&#10;&#9;&#9;&#9;&quot;api_url&quot;:         apiURL,&#10;&#9;&#9;&#9;&quot;model&quot;:           llm.Model,&#10;&#9;&#9;&#9;&quot;is_openai_style&quot;: isOpenAIStyle,&#10;&#9;&#9;&#9;&quot;prompt_len&quot;:      len(prompt),&#10;&#9;&#9;&#9;&quot;body_size&quot;:       bodySize,&#10;&#9;&#9;}).Info(&quot;[LLM] sending request&quot;)&#10;&#9;&#9;req, _ := http.NewRequestWithContext(ctx, http.MethodPost, apiURL, bytes.NewBuffer(jsonBody))&#10;&#9;&#9;if llm.APIKey != &quot;&quot; {&#10;&#9;&#9;&#9;req.Header.Set(&quot;Authorization&quot;, &quot;Bearer 
&quot;+llm.APIKey)&#10;&#9;&#9;}&#10;&#9;&#9;req.Header.Set(&quot;Content-Type&quot;, &quot;application/json&quot;)&#10;&#9;&#9;req.Header.Set(&quot;Accept&quot;, &quot;application/json&quot;)&#10;&#9;&#9;if strings.Contains(apiURL, &quot;openrouter.ai&quot;) {&#10;&#9;&#9;&#9;req.Header.Set(&quot;Referer&quot;, &quot;https://github.com/&quot;)&#10;&#9;&#9;&#9;req.Header.Set(&quot;X-Title&quot;, &quot;vetrag-app&quot;)&#10;&#9;&#9;}&#10;&#9;&#9;start := time.Now()&#10;&#9;&#9;client := &amp;http.Client{}&#10;&#9;&#9;resp, err := client.Do(req)&#10;&#9;&#9;if err != nil {&#10;&#9;&#9;&#9;return nil, 0, err, time.Since(start)&#10;&#9;&#9;}&#10;&#9;&#9;defer resp.Body.Close()&#10;&#9;&#9;raw, rerr := io.ReadAll(resp.Body)&#10;&#9;&#9;return raw, resp.StatusCode, rerr, time.Since(start)&#10;&#9;}&#10;&#10;&#9;raw, status, err, dur := doRequest(body)&#10;&#9;if err != nil {&#10;&#9;&#9;logrus.WithFields(logrus.Fields{&#10;&#9;&#9;&#9;&quot;event&quot;:    &quot;llm_response&quot;,&#10;&#9;&#9;&#9;&quot;status&quot;:   status,&#10;&#9;&#9;&#9;&quot;latency_ms&quot;: dur.Milliseconds(),&#10;&#9;&#9;&#9;&quot;error&quot;:    err,&#10;&#9;&#9;}).Error(&quot;[LLM] request failed&quot;)&#10;&#9;&#9;return &quot;&quot;, err&#10;&#9;}&#10;&#9;logrus.WithFields(logrus.Fields{&#10;&#9;&#9;&quot;event&quot;:      &quot;llm_raw_response&quot;,&#10;&#9;&#9;&quot;status&quot;:     status,&#10;&#9;&#9;&quot;latency_ms&quot;: dur.Milliseconds(),&#10;&#9;&#9;&quot;raw_trunc&quot;:  truncate(string(raw), 600),&#10;&#9;&#9;&quot;raw_len&quot;:    len(raw),&#10;&#9;}).Debug(&quot;[LLM] raw response body&quot;)&#10;&#10;&#9;parseVariant := &quot;unknown&quot;&#10;&#10;&#9;// Attempt Ollama format parse&#10;&#9;var ollama struct {&#10;&#9;&#9;Message struct{ Content string `json:&quot;content&quot;` } `json:&quot;message&quot;`&#10;&#9;&#9;Error   string `json:&quot;error&quot;`&#10;&#9;}&#10;&#9;if err := json.Unmarshal(raw, &amp;ollama); err == nil &amp;&amp; ollama.Message.Content != 
&quot;&quot; {&#10;&#9;&#9;parseVariant = &quot;ollama&quot;&#10;&#9;&#9;content := ollama.Message.Content&#10;&#9;&#9;logrus.WithFields(logrus.Fields{&#10;&#9;&#9;&#9;&quot;event&quot;:         &quot;llm_response&quot;,&#10;&#9;&#9;&#9;&quot;status&quot;:        status,&#10;&#9;&#9;&#9;&quot;latency_ms&quot;:    dur.Milliseconds(),&#10;&#9;&#9;&#9;&quot;parse_variant&quot;: parseVariant,&#10;&#9;&#9;&#9;&quot;content_len&quot;:   len(content),&#10;&#9;&#9;&#9;&quot;content_snip&quot;:  truncate(content, 300),&#10;&#9;&#9;}).Info(&quot;[LLM] parsed response&quot;)&#10;&#9;&#9;return content, nil&#10;&#9;}&#10;&#10;&#9;// Attempt OpenAI/OpenRouter style parse&#10;&#9;var openAI struct {&#10;&#9;&#9;Choices []struct{ Message struct{ Content string `json:&quot;content&quot;` } `json:&quot;message&quot;` } `json:&quot;choices&quot;`&#10;&#9;&#9;Error *struct{ Message string `json:&quot;message&quot;`; Type string `json:&quot;type&quot;` } `json:&quot;error&quot;`&#10;&#9;}&#10;&#9;if err := json.Unmarshal(raw, &amp;openAI); err == nil {&#10;&#9;&#9;if openAI.Error != nil || status &gt;= 400 {&#10;&#9;&#9;&#9;parseVariant = &quot;openai&quot;&#10;&#9;&#9;&#9;var msg string&#10;&#9;&#9;&#9;if openAI.Error != nil {&#10;&#9;&#9;&#9;&#9;msg = openAI.Error.Message&#10;&#9;&#9;&#9;} else {&#10;&#9;&#9;&#9;&#9;msg = string(raw)&#10;&#9;&#9;&#9;}&#10;&#9;&#9;&#9;logrus.WithFields(logrus.Fields{&#10;&#9;&#9;&#9;&#9;&quot;event&quot;:         &quot;llm_response&quot;,&#10;&#9;&#9;&#9;&#9;&quot;status&quot;:        status,&#10;&#9;&#9;&#9;&#9;&quot;latency_ms&quot;:    dur.Milliseconds(),&#10;&#9;&#9;&#9;&#9;&quot;parse_variant&quot;: parseVariant,&#10;&#9;&#9;&#9;&#9;&quot;error&quot;:         msg,&#10;&#9;&#9;&#9;}).Error(&quot;[LLM] provider error&quot;)&#10;&#9;&#9;&#9;return &quot;&quot;, fmt.Errorf(&quot;provider error: %s&quot;, msg)&#10;&#9;&#9;}&#10;&#9;&#9;if len(openAI.Choices) &gt; 0 &amp;&amp; openAI.Choices[0].Message.Content != &quot;&quot; 
{&#10;&#9;&#9;&#9;parseVariant = &quot;openai&quot;&#10;&#9;&#9;&#9;content := openAI.Choices[0].Message.Content&#10;&#9;&#9;&#9;logrus.WithFields(logrus.Fields{&#10;&#9;&#9;&#9;&#9;&quot;event&quot;:         &quot;llm_response&quot;,&#10;&#9;&#9;&#9;&#9;&quot;status&quot;:        status,&#10;&#9;&#9;&#9;&#9;&quot;latency_ms&quot;:    dur.Milliseconds(),&#10;&#9;&#9;&#9;&#9;&quot;parse_variant&quot;: parseVariant,&#10;&#9;&#9;&#9;&#9;&quot;content_len&quot;:   len(content),&#10;&#9;&#9;&#9;&#9;&quot;content_snip&quot;:  truncate(content, 300),&#10;&#9;&#9;&#9;}).Info(&quot;[LLM] parsed response&quot;)&#10;&#9;&#9;&#9;return content, nil&#10;&#9;&#9;}&#10;&#9;}&#10;&#10;&#9;logrus.WithFields(logrus.Fields{&#10;&#9;&#9;&quot;event&quot;:         &quot;llm_response&quot;,&#10;&#9;&#9;&quot;status&quot;:        status,&#10;&#9;&#9;&quot;latency_ms&quot;:    dur.Milliseconds(),&#10;&#9;&#9;&quot;parse_variant&quot;: parseVariant,&#10;&#9;&#9;&quot;raw_snip&quot;:      truncate(string(raw), 300),&#10;&#9;}).Error(&quot;[LLM] unrecognized response format&quot;)&#10;&#10;&#9;return &quot;&quot;, fmt.Errorf(&quot;unrecognized LLM response format: %.200s&quot;, string(raw))&#10;}&#10;&#10;// LLMClientAPI allows mocking LLMClient in other places&#10;// Only public methods should be included&#10;&#10;type LLMClientAPI interface {&#10;&#9;ExtractKeywords(ctx context.Context, message string) (map[string]interface{}, error)&#10;&#9;DisambiguateBestMatch(ctx context.Context, message string, candidates []Visit) (string, error)&#10;}&#10;&#10;var _ LLMClientAPI = (*LLMClient)(nil)" />
+            </PendingDiffInfo>
+          </value>
+        </entry>
+      </map>
+    </option>
+  </component>
+</project>
\ No newline at end of file
diff --git a/README.md b/README.md
new file mode 100644
index 0000000..318ac3b
--- /dev/null
+++ b/README.md
@@ -0,0 +1,105 @@
+# Vetrag
+
+Lightweight veterinary visit reasoning helper with LLM-assisted keyword extraction and disambiguation.
+
+## Features
+- Switch seamlessly between local Ollama and OpenRouter (OpenAI-compatible) LLM backends by changing environment variables only.
+- Structured JSON outputs are enforced using provider-supported response formats (Ollama: `format`; OpenAI/OpenRouter: `response_format: { type: json_object }`).
+- Integration tests using mock LLM & DB (no network dependency).
+- GitHub Actions CI (vet, test, build).
+
+## Quick Start
+### 1. Clone & build
+```bash
+git clone <repo-url>
+cd vetrag
+go build ./...
+```
+
+### 2. Prepare data
+Ensure `config.yaml` and `maindb.yaml` / `db.yaml` exist as provided. Visit data is loaded at runtime (see `models.go` / `db.go`).
+
+### 3. Run with Ollama (local)
+Pull a model, or make sure one is already available locally (example: `ollama pull qwen2.5`):
+```bash
+export OPENAI_BASE_URL=http://localhost:11434/api/chat
+export OPENAI_MODEL=qwen2.5:latest
+# API key not required for Ollama
+export OPENAI_API_KEY=
+
+go run .
+```
+
+### 4. Run with OpenRouter
+Sign up at https://openrouter.ai and get an API key.
+```bash
+export OPENAI_BASE_URL=https://openrouter.ai/api/v1/chat/completions
+export OPENAI_API_KEY=sk-or-XXXXXXXXXXXXXXXX
+export OPENAI_MODEL=meta-llama/llama-3.1-70b-instruct  # or any supported model
+
+go run .
+```
+Open http://localhost:8080/ in your browser.
+
+### 5. Health & Chat
+```bash
+curl -s http://localhost:8080/health
+curl -s -X POST http://localhost:8080/chat -H 'Content-Type: application/json' -d '{"message":"my dog has diarrhea"}' | jq
+```
+
+## Environment Variables
+| Variable | Purpose | Default (if empty) |
+|----------|---------|--------------------|
+| OPENAI_BASE_URL | LLM endpoint (Ollama chat or OpenRouter chat completions) | `http://localhost:11434/api/chat` |
+| OPENAI_API_KEY  | Bearer token for OpenRouter/OpenAI-style APIs | (unused if empty) |
+| OPENAI_MODEL    | Model identifier (Ollama model tag or OpenRouter model slug) | none (must set for remote) |
+
+## How Backend Selection Works
+`llm.go` auto-detects the style:
+- If the base URL contains `openrouter.ai` or `/v1/`, it sends an OpenAI-style request and parses `choices[0].message.content`.
+- Otherwise it assumes Ollama and posts to the configured URL (default `http://localhost:11434/api/chat`), passing `format` for structured JSON.
+
+## Structured Output
+We define a JSON Schema-like map internally and:
+- Ollama: send as `format` (native structured output extension).
+- OpenRouter/OpenAI: send `response_format: { type: "json_object" }` plus a system instruction describing the expected keys.
+
+## Prompts
+Prompts in `config.yaml` have been adjusted to explicitly demand JSON only. This reduces hallucinated prose and plays well with both backends.
+
+## Testing
+Run:
+```bash
+go test ./...
+```
+All tests mock the LLM so no network is required.
+
+## CI
+GitHub Actions workflow at `.github/workflows/ci.yml` runs vet, tests, build on push/PR.
+
+## Troubleshooting
+| Symptom | Cause | Fix |
+|---------|-------|-----|
+| Provider error referencing `response_format` and `json_schema` | Some providers reject `json_schema` | We now default to `json_object`; make sure you have pulled the latest changes. |
+| Empty response | Model returned non-JSON or empty content | Enable debug logs (see below) and inspect raw response. |
+| Non-JSON content (code fences) | Model ignored instruction | Try a stricter system message or switch to a model with better JSON adherence. |
+
+### Enable Debug Logging
+Temporarily edit `main.go`:
+```go
+logrus.SetLevel(logrus.DebugLevel)
+```
+(You can also refactor later to read a LOG_LEVEL env var.)
+
+### Sanitizing Output (Optional Future Improvement)
+If some models wrap JSON in text, a post-processor could strip code fences and re-parse. Not implemented yet to keep logic strict.
+
+## Next Ideas
+- Add retry with exponential backoff for transient 5xx.
+- Add optional `json` fallback if a provider rejects `json_object`.
+- Add streaming support.
+- Add integration test with recorded OpenRouter fixture.
+
+## License
+(Choose and add a LICENSE file if planning to open source.)
+
diff --git a/config.yaml b/config.yaml
index 561afb2..7bd8c92 100644
--- a/config.yaml
+++ b/config.yaml
@@ -1,4 +1,3 @@
 llm:
-  extract_keywords_prompt: "Translate [{{.Message}}] to English, then output only 3–5 comma-separated veterinary-related keywords IN ENGLISH derived strictly from [{{.Message}}]. example output [\"keyword1\",\"keyword2\"] No other text, no extra punctuation, no explanations, no quotes, no formatting."
-  disambiguate_prompt: "Given these possible vet visit reasons: [{{.Entries}}], choose the single best match for this user message: {{.Message}}. Reply with id ex {\"visitReason\":\"bloodwork\"} No other text, no extra punctuation, no explanations, no quotes, no formatting."
-
+  extract_keywords_prompt: "You will extract structured data from the user input. Input text: {{.Message}}. Return ONLY valid minified JSON object with keys: translate (English translation of input), keyword (array of 3-5 concise English veterinary-related keywords derived strictly from the input), animal (animal mentioned or 'unknown'). Example: {\"translate\":\"dog has diarrhea\",\"keyword\":[\"diarrhea\",\"digestive\"],\"animal\":\"dog\"}. Do not add extra text, markdown, or quotes outside JSON."
+  disambiguate_prompt: "Given candidate visit entries (JSON array): {{.Entries}} and user message: {{.Message}} choose the best matching visit's ID. Return ONLY JSON: {\"visitReason\":\"<one of the candidate IDs or empty string if none>\"}. No other text."
diff --git a/llm.go b/llm.go
index ab6a811..0489687 100644
--- a/llm.go
+++ b/llm.go
@@ -9,6 +9,7 @@ import (
 	"net/http"
 	"strings"
 	"text/template"
+	"time"
 
 	"github.com/sirupsen/logrus"
 )
@@ -116,26 +117,32 @@ func (llm *LLMClient) openAICompletion(ctx context.Context, prompt string, forma
 
 	isOpenAIStyle := strings.Contains(apiURL, "openrouter.ai") || strings.Contains(apiURL, "/v1/")
 
-	// Build request body depending on style
-	var body map[string]interface{}
-	if isOpenAIStyle {
-		// OpenAI / OpenRouter style (chat.completions)
-		// Use response_format with JSON schema when provided.
-		responseFormat := map[string]interface{}{
-			"type": "json_schema",
-			"json_schema": map[string]interface{}{
-				"name":   "structured_output",
-				"schema": format,
-			},
+	// Helper to stringify the expected JSON schema for instructions
+	schemaDesc := func() string {
+		b, _ := json.MarshalIndent(format, "", "  ")
+		return string(b)
+	}
+
+	truncate := func(s string, n int) string {
+		if len(s) <= n {
+			return s
 		}
-		body = map[string]interface{}{
-			"model":           llm.Model,
-			"messages":        []map[string]string{{"role": "user", "content": prompt}},
-			"response_format": responseFormat,
+		return s[:n] + "...<truncated>"
+	}
+
+	buildBody := func() map[string]interface{} {
+		if isOpenAIStyle {
+			return map[string]interface{}{
+				"model": llm.Model,
+				"messages": []map[string]string{
+					{"role": "system", "content": "You are a strict JSON generator. ONLY output valid JSON matching this schema: " + schemaDesc() + " Do not add explanations."},
+					{"role": "user", "content": prompt},
+				},
+				"response_format": map[string]interface{}{"type": "json_object"},
+			}
 		}
-	} else {
-		// Ollama structured output extension
-		body = map[string]interface{}{
+		// Ollama style
+		return map[string]interface{}{
 			"model":    llm.Model,
 			"messages": []map[string]string{{"role": "user", "content": prompt}},
 			"stream":   false,
@@ -143,46 +150,85 @@ func (llm *LLMClient) openAICompletion(ctx context.Context, prompt string, forma
 		}
 	}
 
-	jsonBody, _ := json.Marshal(body)
-	logrus.WithFields(logrus.Fields{"api_url": apiURL, "prompt": prompt, "is_openai_style": isOpenAIStyle}).Info("[LLM] completion POST")
+	body := buildBody()
 
-	req, _ := http.NewRequestWithContext(ctx, http.MethodPost, apiURL, bytes.NewBuffer(jsonBody))
-	if llm.APIKey != "" {
-		// OpenRouter expects: Authorization: Bearer sk-... or OR-... depending on key type
-		req.Header.Set("Authorization", "Bearer "+llm.APIKey)
+	doRequest := func(body map[string]interface{}) (raw []byte, status int, err error, dur time.Duration) {
+		jsonBody, _ := json.Marshal(body)
+		bodySize := len(jsonBody)
+		logrus.WithFields(logrus.Fields{
+			"event":           "llm_request",
+			"api_url":         apiURL,
+			"model":           llm.Model,
+			"is_openai_style": isOpenAIStyle,
+			"prompt_len":      len(prompt),
+			"body_size":       bodySize,
+		}).Info("[LLM] sending request")
+		req, _ := http.NewRequestWithContext(ctx, http.MethodPost, apiURL, bytes.NewBuffer(jsonBody))
+		if llm.APIKey != "" {
+			req.Header.Set("Authorization", "Bearer "+llm.APIKey)
+		}
+		req.Header.Set("Content-Type", "application/json")
+		req.Header.Set("Accept", "application/json")
+		if strings.Contains(apiURL, "openrouter.ai") {
+			req.Header.Set("Referer", "https://github.com/")
+			req.Header.Set("X-Title", "vetrag-app")
+		}
+		start := time.Now()
+		client := &http.Client{}
+		resp, err := client.Do(req)
+		if err != nil {
+			return nil, 0, err, time.Since(start)
+		}
+		defer resp.Body.Close()
+		raw, rerr := io.ReadAll(resp.Body)
+		return raw, resp.StatusCode, rerr, time.Since(start)
 	}
-	req.Header.Set("Content-Type", "application/json")
 
-	client := &http.Client{}
-	resp, err := client.Do(req)
+	raw, status, err, dur := doRequest(body)
 	if err != nil {
-		logrus.WithError(err).Error("[LLM] completion HTTP error")
+		logrus.WithFields(logrus.Fields{
+			"event":      "llm_response",
+			"status":     status,
+			"latency_ms": dur.Milliseconds(),
+			"error":      err,
+		}).Error("[LLM] request failed")
 		return "", err
 	}
-	defer resp.Body.Close()
+	logrus.WithFields(logrus.Fields{
+		"event":      "llm_raw_response",
+		"status":     status,
+		"latency_ms": dur.Milliseconds(),
+		"raw_trunc":  truncate(string(raw), 600),
+		"raw_len":    len(raw),
+	}).Debug("[LLM] raw response body")
 
-	raw, err := io.ReadAll(resp.Body)
-	if err != nil {
-		return "", fmt.Errorf("failed reading response body: %w", err)
-	}
-	logrus.WithFields(logrus.Fields{"status": resp.StatusCode, "raw": string(raw)}).Debug("[LLM] completion raw response")
+	parseVariant := "unknown"
 
-	// Attempt Ollama format first (backwards compatible)
+	// Attempt Ollama format parse
 	var ollama struct {
 		Message struct {
 			Content string `json:"content"`
 		} `json:"message"`
+		Error string `json:"error"`
 	}
 	if err := json.Unmarshal(raw, &ollama); err == nil && ollama.Message.Content != "" {
-		logrus.WithField("content", ollama.Message.Content).Info("[LLM] completion (ollama) parsed")
-		return ollama.Message.Content, nil
+		parseVariant = "ollama"
+		content := ollama.Message.Content
+		logrus.WithFields(logrus.Fields{
+			"event":         "llm_response",
+			"status":        status,
+			"latency_ms":    dur.Milliseconds(),
+			"parse_variant": parseVariant,
+			"content_len":   len(content),
+			"content_snip":  truncate(content, 300),
+		}).Info("[LLM] parsed response")
+		return content, nil
 	}
 
-	// Attempt OpenAI / OpenRouter style
+	// Attempt OpenAI/OpenRouter style parse
 	var openAI struct {
 		Choices []struct {
 			Message struct {
-				Role    string `json:"role"`
 				Content string `json:"content"`
 			} `json:"message"`
 		} `json:"choices"`
@@ -192,17 +238,46 @@ func (llm *LLMClient) openAICompletion(ctx context.Context, prompt string, forma
 		} `json:"error"`
 	}
 	if err := json.Unmarshal(raw, &openAI); err == nil {
-		if openAI.Error != nil {
-			return "", fmt.Errorf("provider error: %s (%s)", openAI.Error.Message, openAI.Error.Type)
+		if openAI.Error != nil || status >= 400 {
+			parseVariant = "openai"
+			var msg string
+			if openAI.Error != nil {
+				msg = openAI.Error.Message
+			} else {
+				msg = string(raw)
+			}
+			logrus.WithFields(logrus.Fields{
+				"event":         "llm_response",
+				"status":        status,
+				"latency_ms":    dur.Milliseconds(),
+				"parse_variant": parseVariant,
+				"error":         msg,
+			}).Error("[LLM] provider error")
+			return "", fmt.Errorf("provider error: %s", msg)
 		}
 		if len(openAI.Choices) > 0 && openAI.Choices[0].Message.Content != "" {
+			parseVariant = "openai"
 			content := openAI.Choices[0].Message.Content
-			logrus.WithField("content", content).Info("[LLM] completion (openai) parsed")
+			logrus.WithFields(logrus.Fields{
+				"event":         "llm_response",
+				"status":        status,
+				"latency_ms":    dur.Milliseconds(),
+				"parse_variant": parseVariant,
+				"content_len":   len(content),
+				"content_snip":  truncate(content, 300),
+			}).Info("[LLM] parsed response")
 			return content, nil
 		}
 	}
 
-	// If still nothing, return error with snippet
+	logrus.WithFields(logrus.Fields{
+		"event":         "llm_response",
+		"status":        status,
+		"latency_ms":    dur.Milliseconds(),
+		"parse_variant": parseVariant,
+		"raw_snip":      truncate(string(raw), 300),
+	}).Error("[LLM] unrecognized response format")
+
 	return "", fmt.Errorf("unrecognized LLM response format: %.200s", string(raw))
 }
 
diff --git a/openrouter_integration_test.go b/openrouter_integration_test.go
new file mode 100644
index 0000000..e999d36
--- /dev/null
+++ b/openrouter_integration_test.go
@@ -0,0 +1,89 @@
+package main
+
+import (
+	"context"
+	"encoding/json"
+	"net/http"
+	"net/http/httptest"
+	"strings"
+	"testing"
+)
+
+// TestLLMClient_OpenRouterStyle_ExtractKeywords checks that an OpenAI/OpenRouter-style success response (choices[0].message.content) is decoded by ExtractKeywords into the translate, keyword and animal fields.
+func TestLLMClient_OpenRouterStyle_ExtractKeywords(t *testing.T) {
+	// Snapshot the shared appConfig and restore it on exit so the prompt override below does not outlive this test.
+	orig := appConfig
+	defer func() { appConfig = orig }()
+
+	appConfig.LLM.ExtractKeywordsPrompt = "Dummy {{.Message}}" // simple template
+
+	ts := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
+		if r.URL.Path != "/v1/chat/completions" {
+			w.WriteHeader(http.StatusNotFound)
+			return
+		}
+		// Reject requests that carry no Authorization header, so a client that omits the API key gets a 401 instead of the canned response.
+		if got := r.Header.Get("Authorization"); got == "" {
+			w.WriteHeader(http.StatusUnauthorized)
+			return
+		}
+		w.Header().Set("Content-Type", "application/json")
+		resp := map[string]interface{}{
+			"choices": []map[string]interface{}{
+				{
+					"message": map[string]interface{}{
+						"role":    "assistant",
+						"content": `{"translate":"dog has diarrhea","keyword":["diarrhea","digestive"],"animal":"dog"}`,
+					},
+				},
+			},
+		}
+		json.NewEncoder(w).Encode(resp)
+	}))
+	defer ts.Close()
+
+	llm := NewLLMClient("test-key", ts.URL+"/v1/chat/completions", "meta-llama/test")
+	res, err := llm.ExtractKeywords(context.Background(), "kutya hasmenés")
+	if err != nil {
+		te(t, "unexpected error: %v", err)
+	}
+	if res["translate"] != "dog has diarrhea" {
+		te(t, "translate mismatch: %v", res["translate"])
+	}
+	kw, ok := res["keyword"].([]interface{})
+	if !ok || len(kw) != 2 || kw[0] != "diarrhea" {
+		te(t, "keyword list mismatch: %#v", res["keyword"])
+	}
+	if res["animal"] != "dog" {
+		te(t, "animal mismatch: %v", res["animal"])
+	}
+}
+
+// TestLLMClient_OpenRouterStyle_Error checks that an OpenAI/OpenRouter-style error body sent with HTTP 429 makes ExtractKeywords return an error whose text contains the provider message ("Rate limit").
+func TestLLMClient_OpenRouterStyle_Error(t *testing.T) {
+	orig := appConfig
+	defer func() { appConfig = orig }()
+	appConfig.LLM.ExtractKeywordsPrompt = "Dummy {{.Message}}"
+
+	ts := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
+		w.Header().Set("Content-Type", "application/json")
+		w.WriteHeader(http.StatusTooManyRequests)
+		json.NewEncoder(w).Encode(map[string]interface{}{
+			"error": map[string]interface{}{
+				"message": "Rate limit",
+				"type":    "rate_limit",
+			},
+		})
+	}))
+	defer ts.Close()
+
+	llm := NewLLMClient("test-key", ts.URL+"/v1/chat/completions", "meta-llama/test")
+	_, err := llm.ExtractKeywords(context.Background(), "test")
+	if err == nil || !contains(err.Error(), "Rate limit") {
+		te(t, "expected rate limit error, got: %v", err)
+	}
+}
+
+// --- helpers: contains wraps strings.Contains; te marks itself as a test helper and aborts the test via t.Fatalf ---
+func contains(haystack, needle string) bool               { return strings.Contains(haystack, needle) }
+func te(t *testing.T, format string, args ...interface{}) { t.Helper(); t.Fatalf(format, args...) }
diff --git a/visits.bleve/store/000000000006.zap b/visits.bleve/store/000000000006.zap
deleted file mode 100644
index 659acfd..0000000
Binary files a/visits.bleve/store/000000000006.zap and /dev/null differ
diff --git a/visits.bleve/store/root.bolt b/visits.bleve/store/root.bolt
index 16f4475..0b85963 100644
Binary files a/visits.bleve/store/root.bolt and b/visits.bleve/store/root.bolt differ