diff --git a/app/modules/features/SettingsFeature/Sources/AISettings/AIModels/ModelsView.swift b/app/modules/features/SettingsFeature/Sources/AISettings/AIModels/ModelsView.swift index 87fd64969..9eaad4183 100644 --- a/app/modules/features/SettingsFeature/Sources/AISettings/AIModels/ModelsView.swift +++ b/app/modules/features/SettingsFeature/Sources/AISettings/AIModels/ModelsView.swift @@ -191,21 +191,20 @@ struct ModelCard: View { .padding(.top, 8) } - if let pricing = model.defaultPricing { - HStack { + HStack { + if let pricing = model.defaultPricing { Text("Pricing:") .font(.headline) .fontWeight(.medium) Text("\(displayPrice(pricing.input)) / \(displayPrice(pricing.output))") .fontWeight(.medium) - - Spacer() - - Toggle("", isOn: $isActive) - .toggleStyle(.switch) } - .padding(.top, 8) + Spacer() + + Toggle("", isOn: $isActive) + .toggleStyle(.switch) } + .padding(.top, 8) if provider.externalAgent != nil { Text("\(model.name) is an external agent") diff --git a/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/AIProviderView.swift b/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/AIProviderView.swift index c5943fba4..9cc6020a2 100644 --- a/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/AIProviderView.swift +++ b/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/AIProviderView.swift @@ -14,7 +14,7 @@ struct AIProviderView: View { viewModel: LLMSettingsViewModel, provider: AIProvider, providerSettings: AIProviderSettings?, - isConnected: Bool, + isConfigured: Bool, enabledModels: [AIModelID], onSettingsChanged: ((AIProviderSettings?) 
-> Void)?, onSelectModels: (() -> Void)?, @@ -23,7 +23,7 @@ struct AIProviderView: View { self.viewModel = viewModel self.provider = provider self.providerSettings = providerSettings - self.isConnected = isConnected + self.isConfigured = isConfigured self.enabledModels = enabledModels self.onSettingsChanged = onSettingsChanged self.onSelectModels = onSelectModels @@ -41,9 +41,9 @@ struct AIProviderView: View { .font(.title2) .fontWeight(.medium) Spacer() - Text(isConnected ? "Connected" : "Not connected") + Text(isConfigured ? "Configured" : "Not configured") .font(.subheadline) - .foregroundColor(isConnected ? colorScheme.addedLineDiffText : .secondary) + .foregroundColor(isConfigured ? colorScheme.addedLineDiffText : .secondary) } if let websiteURL = provider.websiteURL { @@ -102,14 +102,19 @@ struct AIProviderView: View { } } - // Local executable section (for providers that are local) + // External agent section if let externalAgent = provider.externalAgent { ExternalAgentView(externalAgent: externalAgent, executable: $executable) } + + // Local inference section + if let localInference = provider.localInference { + LocalInferenceView(localInference: localInference, baseURL: $baseURL, executable: $executable) + } } // Models button - if isConnected, let onSelectModels, provider.externalAgent == nil { + if isConfigured, let onSelectModels, !provider.isExternalAgent { Button(action: { onSelectModels() }) { @@ -140,6 +145,9 @@ struct AIProviderView: View { .onChange(of: apiKey) { _, _ in saveSettings() } + .onChange(of: baseURL) { _, _ in + saveSettings() + } .onChange(of: executable) { _, _ in saveSettings() } @@ -159,7 +167,7 @@ struct AIProviderView: View { private let provider: AIProvider private let providerSettings: AIProviderSettings? - private let isConnected: Bool + private let isConfigured: Bool private let onSettingsChanged: ((AIProviderSettings?) -> Void)? private let onSelectModels: (() -> Void)? 
private let frameless: Bool @@ -186,20 +194,25 @@ struct AIProviderView: View { let trimmedBaseURL = baseURL.trimmingCharacters(in: .whitespacesAndNewlines) let trimmedExecutable = executable.trimmingCharacters(in: .whitespacesAndNewlines) - if provider.externalAgent == nil { + if provider.needsAPIKey { guard !trimmedAPIKey.isEmpty else { onSettingsChanged(nil) return } - } else { + } else if provider.isExternalAgent { guard !trimmedExecutable.isEmpty else { onSettingsChanged(nil) return } + } else if provider.isLocalInference { + guard !trimmedExecutable.isEmpty || URL(string: trimmedBaseURL) != nil else { + onSettingsChanged(nil) + return + } } let providerSettings = AIProviderSettings( - apiKey: trimmedAPIKey, + apiKey: trimmedAPIKey.isEmpty ? nil : trimmedAPIKey, baseUrl: trimmedBaseURL.isEmpty ? nil : trimmedBaseURL, executable: trimmedExecutable.isEmpty ? nil : trimmedExecutable, createdOrder: -1) @@ -236,6 +249,8 @@ extension AIProvider { "Mistral" case .inception: "Inception" + case .ollama: + "Chat & build with open models" default: "Unknown provider" } @@ -243,14 +258,23 @@ extension AIProvider { /// Whether the provider requires an API key to function (regardless of whether one has already been provided). var needsAPIKey: Bool { - externalAgent == nil + !isExternalAgent && !isLocalInference } - func isConnected(_ providerSettings: AIProviderSettings?) -> Bool { - if externalAgent != nil { - providerSettings?.executable?.trimmingCharacters(in: .whitespacesAndNewlines).isEmpty == false - } else { - providerSettings?.apiKey.trimmingCharacters(in: .whitespacesAndNewlines).isEmpty == false + func isConfigured(_ providerSettings: AIProviderSettings?) 
-> Bool { + if needsAPIKey { + return providerSettings?.apiKey?.trimmingCharacters(in: .whitespacesAndNewlines).isEmpty == false + } else if isExternalAgent { + return providerSettings?.executable?.trimmingCharacters(in: .whitespacesAndNewlines).isEmpty == false + } else if isLocalInference { + if + let baseUrl = providerSettings?.baseUrl?.trimmingCharacters(in: .whitespacesAndNewlines), + URL(string: baseUrl) != nil + { + return true + } + return providerSettings?.executable?.trimmingCharacters(in: .whitespacesAndNewlines).isEmpty == false } + return false } } diff --git a/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/AIProvidersView.swift b/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/AIProvidersView.swift index 78a0b75b9..5b583a0d2 100644 --- a/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/AIProvidersView.swift +++ b/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/AIProvidersView.swift @@ -45,7 +45,7 @@ public struct AIProvidersView: View { viewModel: viewModel, provider: providerInfo.provider, providerSettings: providerInfo.settings, - isConnected: providerInfo.isConnected, + isConfigured: providerInfo.isConfigured, enabledModels: viewModel.enabledModels, onSettingsChanged: { newSettings in updateProviderSettings(for: providerInfo.provider, with: newSettings) @@ -88,7 +88,7 @@ public struct AIProvidersView: View { return ProviderInfo( provider: provider, settings: existingSettings, - isConnected: provider.isConnected(existingSettings)) + isConfigured: provider.isConfigured(existingSettings)) } return searchText.isEmpty @@ -104,7 +104,7 @@ public struct AIProvidersView: View { private func setInitialOrder() { orderedProviders = AIProvider.allCases.map { provider in - (provider, provider.isConnected(viewModel.providerSettings[provider])) + (provider, provider.isConfigured(viewModel.providerSettings[provider])) }.sorted { lhs, rhs in // Sort: connected first, then alphabetically 
if lhs.1 != rhs.1 { @@ -137,7 +137,7 @@ public struct AIProvidersView: View { private struct ProviderInfo { let provider: AIProvider let settings: AIProviderSettings? - let isConnected: Bool + let isConfigured: Bool } // MARK: - ProviderModelSelectionView @@ -164,7 +164,7 @@ private struct ProviderModelSelectionView: View { viewModel: viewModel, provider: provider, providerSettings: providerSettings, - isConnected: true, + isConfigured: true, enabledModels: viewModel.enabledModels, onSettingsChanged: nil, onSelectModels: nil) diff --git a/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/ExternalAgentView.swift b/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/ExternalAgentView.swift index f2b6fbda4..8ba0de1f9 100644 --- a/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/ExternalAgentView.swift +++ b/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/ExternalAgentView.swift @@ -20,7 +20,7 @@ struct ExternalAgentView: View { provider = externalAgent.llmProvider self.externalAgent = externalAgent _executable = executable - _executableFinder = .init(initialValue: ExecutableFinder(defaultExecutable: externalAgent.defaultExecutableName)) + _executableFinder = .init(initialValue: ExecutableFinder(executable: externalAgent.defaultExecutableName)) } /// The external agent configuration. @@ -119,32 +119,6 @@ struct ExternalAgentView: View { @Environment(\.colorScheme) private var colorScheme } -// MARK: - ExecutableFinder - -/// A helper that finds where a given executable is located on disk by running `which`. -@MainActor @Observable -private final class ExecutableFinder { - /// Initializes the finder and attempts to locate the executable using `which`. 
- init(defaultExecutable: String) { - @Dependency(\.shellService) var shellService - - Task { [weak self] in - do { - let executablePath = try await shellService.runAndThrow("which \(defaultExecutable)", useInteractiveShell: true) - await MainActor.run { - guard let self else { return } - self.executablePath = executablePath?.trimmingCharacters(in: .whitespacesAndNewlines) - } - } catch { - // Silently ignore errors - executable not found is expected - } - } - } - - /// The path where the executable was found, or nil if not found. - private(set) var executablePath: String? -} - extension ExternalAgent { /// Whether the external agent has been enabled at least once. /// When the agent is disabled, this value will help understand whether the agent has never been enabled, and can be enabled by default, or if it has been disabled by the user. diff --git a/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/LocalInferenceView.swift b/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/LocalInferenceView.swift new file mode 100644 index 000000000..4a405c560 --- /dev/null +++ b/app/modules/features/SettingsFeature/Sources/AISettings/AIProviders/LocalInferenceView.swift @@ -0,0 +1,95 @@ +// Copyright cmd app, Inc. Licensed under the Apache License, Version 2.0. +// You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 + +import Dependencies +import DLS +import LLMFoundation +import SwiftUI + +// MARK: - LocalInferenceView + +struct LocalInferenceView: View { + /// Initializes the card with the local inference configuration and bindings to its base URL and executable path. 
+ init( + localInference: LocalInference, + baseURL: Binding, + executable: Binding) + { + provider = localInference.llmProvider + self.localInference = localInference + _baseURL = baseURL + _executable = executable + _executableFinder = .init(initialValue: ExecutableFinder(executable: localInference.executableName)) + } + + /// The local inference configuration. + let localInference: LocalInference + + /// The AI provider associated with this local inference. + let provider: AIProvider + + var body: some View { + VStack(alignment: .leading, spacing: 8) { + if let executablePath = executableFinder.executablePath { + HStack { + Text("\(provider.name)'s executable was found") + .fontWeight(.medium) + + Spacer() + + HoveredButton( + action: { + executable = executable.isEmpty ? executablePath : "" + }, + onHoverColor: colorScheme.tertiarySystemBackground, + backgroundColor: colorScheme.secondarySystemBackground, + padding: 5, + content: { + Text(executable.isEmpty ? "Enable" : "Disable") + }) + } + } else if baseURL.isEmpty { + Text("\(provider.name)'s executable could not be found. Either:") + .font(.subheadline) + .fontWeight(.medium) + PlainLink("install it first", destination: localInference.installationInstructions) + .font(.subheadline) + .fontWeight(.medium) + Text("or configure a custom base URL below:") + .font(.subheadline) + .fontWeight(.medium) + } + + let showTitle = executableFinder.executablePath != nil || !baseURL.isEmpty + if showTitle { + Text("Base URL") + .font(.subheadline) + .fontWeight(.medium) + } + TextField(localInference.defaultBaseUrl.absoluteString, text: $baseURL) + .textFieldStyle(.plain) + .padding(.horizontal, 12) + .padding(.vertical, 8) + .with( + cornerRadius: 6, + backgroundColor: Color( + NSColor.textBackgroundColor), + borderColor: Color.gray.opacity(0.3)) + + Text("Leave empty to use default") + .font(.footnote) + .foregroundColor(.secondary) + } + } + + /// Binding to the executable path or launch command. 
+ @Binding private var executable: String + + /// Binding to the base URL. + @Binding private var baseURL: String + + /// Helper to locate the executable on disk. + @State private var executableFinder: ExecutableFinder + + @Environment(\.colorScheme) private var colorScheme +} diff --git a/app/modules/features/SettingsFeature/Sources/CodeCompletionSettingsView.swift b/app/modules/features/SettingsFeature/Sources/CodeCompletionSettingsView.swift index c1a3dc8b4..01a841185 100644 --- a/app/modules/features/SettingsFeature/Sources/CodeCompletionSettingsView.swift +++ b/app/modules/features/SettingsFeature/Sources/CodeCompletionSettingsView.swift @@ -225,7 +225,7 @@ private struct CodeCompletionProviderSection: View { viewModel: llmSettingsViewModel, provider: aiProvider, providerSettings: llmSettingsViewModel.providerSettings[aiProvider], - isConnected: aiProvider.isConnected(llmSettingsViewModel.providerSettings[aiProvider]), + isConfigured: aiProvider.isConfigured(llmSettingsViewModel.providerSettings[aiProvider]), enabledModels: llmSettingsViewModel.enabledModels, onSettingsChanged: { newSettings in updateProviderSettings(for: aiProvider, with: newSettings) diff --git a/app/modules/features/SettingsFeature/Sources/ExecutableFinder.swift b/app/modules/features/SettingsFeature/Sources/ExecutableFinder.swift new file mode 100644 index 000000000..2bcd61b4e --- /dev/null +++ b/app/modules/features/SettingsFeature/Sources/ExecutableFinder.swift @@ -0,0 +1,32 @@ +// Copyright cmd app, Inc. Licensed under the Apache License, Version 2.0. +// You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 + +import Dependencies +import ShellServiceInterface +import SwiftUI + +// MARK: - ExecutableFinder + +/// A helper that finds where a given executable is located on disk by running `which`. +@MainActor @Observable +final class ExecutableFinder { + /// Initializes the finder and attempts to locate the executable using `which`. 
+ init(executable: String) { + @Dependency(\.shellService) var shellService + + Task { [weak self] in + do { + let executablePath = try await shellService.runAndThrow("which \(executable)", useInteractiveShell: true) + await MainActor.run { + guard let self else { return } + self.executablePath = executablePath?.trimmingCharacters(in: .whitespacesAndNewlines) + } + } catch { + // Silently ignore errors - executable not found is expected + } + } + } + + /// The path where the executable was found, or nil if not found. + private(set) var executablePath: String? +} diff --git a/app/modules/foundations/LLMFoundation/Sources/AIModel.swift b/app/modules/foundations/LLMFoundation/Sources/AIModel.swift index 7c6c4d977..08c595dc7 100644 --- a/app/modules/foundations/LLMFoundation/Sources/AIModel.swift +++ b/app/modules/foundations/LLMFoundation/Sources/AIModel.swift @@ -5,7 +5,9 @@ import Foundation // MARK: - LLMReasoning -public struct LLMReasoning: Sendable, Hashable, Codable { } +public struct LLMReasoning: Sendable, Hashable, Codable { + public init() { } +} // MARK: - AIProviderModel @@ -38,11 +40,14 @@ public struct AIModel: Hashable, Identifiable, Sendable, Codable { description: String? = nil, contextSize: Int, maxOutputTokens: Int, - defaultPricing: ModelPricing?, // TODO: Make non-optional when we have pricing for all models. + defaultPricing: ModelPricing?, documentationURL: URL? = nil, reasoning: LLMReasoning? 
= nil, createdAt: TimeInterval, - rankForProgramming: Int) + rankForProgramming: Int, + supportsChat: Bool = true, + supportsTools: Bool = true, + supportsCompletion: Bool = false) { self.slug = slug self.name = name @@ -54,6 +59,13 @@ public struct AIModel: Hashable, Identifiable, Sendable, Codable { self.reasoning = reasoning self.createdAt = createdAt self.rankForProgramming = rankForProgramming + self.supportsChat = supportsChat + // TODO: move to appropriate place + && AIModel.modelSupportsChat(id: slug) + self.supportsTools = supportsTools + self.supportsCompletion = supportsCompletion + // TODO: move to appropriate place + || AIModel.modelSupportsCompletion(id: slug) } /// A few models for debugging and providing default values. @@ -122,6 +134,9 @@ public struct AIModel: Hashable, Identifiable, Sendable, Codable { public let reasoning: LLMReasoning? public let createdAt: TimeInterval public let rankForProgramming: Int + public let supportsChat: Bool + public let supportsTools: Bool + public let supportsCompletion: Bool public var id: String { slug @@ -147,11 +162,11 @@ public struct AIModel: Hashable, Identifiable, Sendable, Codable { } extension AIModel { - public var supportsCompletion: Bool { + static func modelSupportsCompletion(id: String) -> Bool { ["inception/mercury-coder-small", "mistralai/codestral-latest"].contains(id) } - public var supportsChat: Bool { + static func modelSupportsChat(id: String) -> Bool { id != "inception/mercury-coder-small" } } diff --git a/app/modules/foundations/LLMFoundation/Sources/AIProvider.swift b/app/modules/foundations/LLMFoundation/Sources/AIProvider.swift index 31ce879f6..235ef727a 100644 --- a/app/modules/foundations/LLMFoundation/Sources/AIProvider.swift +++ b/app/modules/foundations/LLMFoundation/Sources/AIProvider.swift @@ -17,11 +17,11 @@ public struct AIProvider: Hashable, Identifiable, CaseIterable, Sendable, RawRep init( id: String, name: String, - keychainKey: String, + keychainKey: String? 
= nil, websiteURL: URL? = nil, apiKeyCreationURL: URL? = nil, lowTierModelId: AIModelID? = nil, - modelsEnabledByDefault: [AIModelID]) + modelsEnabledByDefault: [AIModelID] = []) { self.id = id self.name = name @@ -44,12 +44,13 @@ public struct AIProvider: Hashable, Identifiable, CaseIterable, Sendable, RawRep .geminiCLI, .mistral, .inception, + .ollama, ] } public let id: String public let name: String - public let keychainKey: String + public let keychainKey: String? public let websiteURL: URL? public let apiKeyCreationURL: URL? public let lowTierModelId: AIModelID? diff --git a/app/modules/foundations/LLMFoundation/Sources/LocalInference.swift b/app/modules/foundations/LLMFoundation/Sources/LocalInference.swift new file mode 100644 index 000000000..3a14ab400 --- /dev/null +++ b/app/modules/foundations/LLMFoundation/Sources/LocalInference.swift @@ -0,0 +1,41 @@ +// Copyright cmd app, Inc. Licensed under the Apache License, Version 2.0. +// You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 + +import Foundation + +// MARK: - LocalInference + +/// Inference with local LLMs (e.g. Ollama). +public struct LocalInference: Sendable { + /// The name of the inference. + public let name: String + /// An executable name. + public let executableName: String + /// A base URL for a local API. + public let defaultBaseUrl: URL + /// A link to instructions on how to install. + public let installationInstructions: URL + /// Additional information about the associated provider. + public let llmProvider: AIProvider +} + +extension AIProvider { + public var localInference: LocalInference? 
{ + switch self { + case .ollama: + .init( + name: "Ollama", + executableName: "ollama", + defaultBaseUrl: URL(string: "http://localhost:11434")!, + installationInstructions: URL(string: "https://docs.ollama.com/quickstart")!, + llmProvider: self) + + default: + nil + } + } + + public var isLocalInference: Bool { + localInference != nil + } +} diff --git a/app/modules/foundations/LLMFoundation/Sources/providers/Ollama.swift b/app/modules/foundations/LLMFoundation/Sources/providers/Ollama.swift new file mode 100644 index 000000000..1736c3322 --- /dev/null +++ b/app/modules/foundations/LLMFoundation/Sources/providers/Ollama.swift @@ -0,0 +1,12 @@ +// Copyright cmd app, Inc. Licensed under the Apache License, Version 2.0. +// You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 + +import AppFoundation +import Foundation + +extension AIProvider { + public static let ollama = AIProvider( + id: "ollama", + name: "Ollama", + websiteURL: URL(string: "https://ollama.com/search")) +} diff --git a/app/modules/serviceInterfaces/LocalServerServiceInterface/Sources/listModelsSchema.generated.swift b/app/modules/serviceInterfaces/LocalServerServiceInterface/Sources/listModelsSchema.generated.swift index 2af431995..692560dcf 100644 --- a/app/modules/serviceInterfaces/LocalServerServiceInterface/Sources/listModelsSchema.generated.swift +++ b/app/modules/serviceInterfaces/LocalServerServiceInterface/Sources/listModelsSchema.generated.swift @@ -61,9 +61,13 @@ extension Schema { public let maxCompletionTokens: Int public let inputModalities: [ModelModality] public let outputModalities: [ModelModality] - public let pricing: ModelPricing + public let pricing: ModelPricing? 
public let createdAt: Double public let rankForProgramming: Int + public let supportsChat: Bool + public let supportsTools: Bool + public let supportsReasoning: Bool + public let supportsCompletion: Bool private enum CodingKeys: String, CodingKey { case providerId = "providerId" @@ -77,6 +81,10 @@ extension Schema { case pricing = "pricing" case createdAt = "createdAt" case rankForProgramming = "rankForProgramming" + case supportsChat = "supportsChat" + case supportsTools = "supportsTools" + case supportsReasoning = "supportsReasoning" + case supportsCompletion = "supportsCompletion" } public init( @@ -88,9 +96,13 @@ extension Schema { maxCompletionTokens: Int, inputModalities: [ModelModality], outputModalities: [ModelModality], - pricing: ModelPricing, + pricing: ModelPricing? = nil, createdAt: Double, - rankForProgramming: Int + rankForProgramming: Int, + supportsChat: Bool, + supportsTools: Bool, + supportsReasoning: Bool, + supportsCompletion: Bool ) { self.providerId = providerId self.globalId = globalId @@ -103,6 +115,10 @@ extension Schema { self.pricing = pricing self.createdAt = createdAt self.rankForProgramming = rankForProgramming + self.supportsChat = supportsChat + self.supportsTools = supportsTools + self.supportsReasoning = supportsReasoning + self.supportsCompletion = supportsCompletion } public init(from decoder: Decoder) throws { @@ -115,9 +131,13 @@ extension Schema { maxCompletionTokens = try container.decode(Int.self, forKey: .maxCompletionTokens) inputModalities = try container.decode([ModelModality].self, forKey: .inputModalities) outputModalities = try container.decode([ModelModality].self, forKey: .outputModalities) - pricing = try container.decode(ModelPricing.self, forKey: .pricing) + pricing = try container.decodeIfPresent(ModelPricing?.self, forKey: .pricing) createdAt = try container.decode(Double.self, forKey: .createdAt) rankForProgramming = try container.decode(Int.self, forKey: .rankForProgramming) + supportsChat = try 
container.decode(Bool.self, forKey: .supportsChat) + supportsTools = try container.decode(Bool.self, forKey: .supportsTools) + supportsReasoning = try container.decode(Bool.self, forKey: .supportsReasoning) + supportsCompletion = try container.decode(Bool.self, forKey: .supportsCompletion) } public func encode(to encoder: Encoder) throws { @@ -130,9 +150,13 @@ extension Schema { try container.encode(maxCompletionTokens, forKey: .maxCompletionTokens) try container.encode(inputModalities, forKey: .inputModalities) try container.encode(outputModalities, forKey: .outputModalities) - try container.encode(pricing, forKey: .pricing) + try container.encodeIfPresent(pricing, forKey: .pricing) try container.encode(createdAt, forKey: .createdAt) try container.encode(rankForProgramming, forKey: .rankForProgramming) + try container.encode(supportsChat, forKey: .supportsChat) + try container.encode(supportsTools, forKey: .supportsTools) + try container.encode(supportsReasoning, forKey: .supportsReasoning) + try container.encode(supportsCompletion, forKey: .supportsCompletion) } } public enum ModelModality: String, Codable, Sendable, CaseIterable { diff --git a/app/modules/serviceInterfaces/LocalServerServiceInterface/Sources/sendMessageSchema.generated.swift b/app/modules/serviceInterfaces/LocalServerServiceInterface/Sources/sendMessageSchema.generated.swift index 8fbc00c1c..b6449a06c 100644 --- a/app/modules/serviceInterfaces/LocalServerServiceInterface/Sources/sendMessageSchema.generated.swift +++ b/app/modules/serviceInterfaces/LocalServerServiceInterface/Sources/sendMessageSchema.generated.swift @@ -10,7 +10,7 @@ extension Schema { public let messages: [Message] public let system: String? public let projectRoot: String? - public let tools: [Tool] + public let tools: [Tool]? public let model: String public let enableReasoning: Bool public let provider: APIProvider @@ -31,7 +31,7 @@ extension Schema { messages: [Message], system: String? = nil, projectRoot: String? 
= nil, - tools: [Tool], + tools: [Tool]? = nil, model: String, enableReasoning: Bool, provider: APIProvider, @@ -52,7 +52,7 @@ extension Schema { messages = try container.decode([Message].self, forKey: .messages) system = try container.decodeIfPresent(String?.self, forKey: .system) projectRoot = try container.decodeIfPresent(String?.self, forKey: .projectRoot) - tools = try container.decode([Tool].self, forKey: .tools) + tools = try container.decodeIfPresent([Tool]?.self, forKey: .tools) model = try container.decode(String.self, forKey: .model) enableReasoning = try container.decode(Bool.self, forKey: .enableReasoning) provider = try container.decode(APIProvider.self, forKey: .provider) @@ -64,7 +64,7 @@ extension Schema { try container.encode(messages, forKey: .messages) try container.encodeIfPresent(system, forKey: .system) try container.encodeIfPresent(projectRoot, forKey: .projectRoot) - try container.encode(tools, forKey: .tools) + try container.encodeIfPresent(tools, forKey: .tools) try container.encode(model, forKey: .model) try container.encode(enableReasoning, forKey: .enableReasoning) try container.encode(provider, forKey: .provider) @@ -810,6 +810,7 @@ extension Schema { case gemini = "gemini" case mistral = "mistral" case inception = "inception" + case ollama = "ollama" case claudeCode = "claude_code" case codex = "codex" case geminiCli = "gemini_cli" diff --git a/app/modules/serviceInterfaces/SettingsServiceInterface/Sources/SettingsService.swift b/app/modules/serviceInterfaces/SettingsServiceInterface/Sources/SettingsService.swift index 69d1c6695..e6ebd9ab4 100644 --- a/app/modules/serviceInterfaces/SettingsServiceInterface/Sources/SettingsService.swift +++ b/app/modules/serviceInterfaces/SettingsServiceInterface/Sources/SettingsService.swift @@ -154,12 +154,12 @@ public struct Settings: Sendable, Equatable { /// To help keep track of which Provider was setup first, we use an incrementing order. 
/// This order can be useful for determining which provider to default to when multiple are available. public let createdOrder: Int - public var apiKey: String + public var apiKey: String? public var baseUrl: String? public var executable: String? public init( - apiKey: String, + apiKey: String?, baseUrl: String?, executable: String?, createdOrder: Int) diff --git a/app/modules/services/LLMService/Sources/DefaultLLMService.swift b/app/modules/services/LLMService/Sources/DefaultLLMService.swift index a0ade6770..897fd1790 100644 --- a/app/modules/services/LLMService/Sources/DefaultLLMService.swift +++ b/app/modules/services/LLMService/Sources/DefaultLLMService.swift @@ -267,12 +267,14 @@ final class DefaultLLMService: LLMService { messages: messageHistory, system: system, projectRoot: context?.projectRoot?.path, - tools: tools + tools: model.supportsTools + ? tools // Unless we are using an external agent, only send to the AI tools that are internal. .filter { ($0.canBeExecuted && $0.id == $0.referenceId) || provider.isExternalAgent } - .map { .init(name: $0.name, description: $0.description, inputSchema: $0.inputSchema) }, + .map { .init(name: $0.name, description: $0.description, inputSchema: $0.inputSchema) } + : nil, model: providerModel.id, - enableReasoning: enableReasoning, + enableReasoning: model.canReason && enableReasoning, provider: .init( provider: provider, settings: providerSettings, @@ -420,6 +422,8 @@ extension Schema.APIProvider { return .mistral case .inception: return .inception + case .ollama: + return .ollama default: throw AppError(message: "Unsupported provider \(provider.name)") } diff --git a/app/modules/services/LLMService/Sources/LLMModelManager.swift b/app/modules/services/LLMService/Sources/LLMModelManager.swift index edc12315f..ed73f793f 100644 --- a/app/modules/services/LLMService/Sources/LLMModelManager.swift +++ b/app/modules/services/LLMService/Sources/LLMModelManager.swift @@ -329,21 +329,31 @@ final class AIModelsManager: 
AIModelsManagerProtocol { name: apiProvider.name, settings: apiProvider.settings))) let response: Schema.ListModelsOutput = try await localServer.postRequest(path: "models", data: data) - return response.models.map { AIProviderModel( - providerId: $0.providerId, - provider: provider, - modelInfo: .init( - name: $0.name, - slug: $0.globalId, - contextSize: $0.contextLength, - maxOutputTokens: $0.maxCompletionTokens, - defaultPricing: .init( - input: $0.pricing.prompt, - output: $0.pricing.completion, - cacheWrite: $0.pricing.inputCacheWrite ?? 0, - cachedInput: $0.pricing.inputCacheRead ?? 0), - createdAt: $0.createdAt, - rankForProgramming: $0.rankForProgramming)) } + return response.models.map { model in + let defaultPricing: ModelPricing? = { + guard let pricing = model.pricing else { return nil } + return .init( + input: pricing.prompt, + output: pricing.completion, + cacheWrite: pricing.inputCacheWrite ?? 0, + cachedInput: pricing.inputCacheRead ?? 0) + }() + return AIProviderModel( + providerId: model.providerId, + provider: provider, + modelInfo: .init( + name: model.name, + slug: model.globalId, + contextSize: model.contextLength, + maxOutputTokens: model.maxCompletionTokens, + defaultPricing: defaultPricing, + reasoning: model.supportsReasoning ? 
LLMReasoning() : nil, + createdAt: model.createdAt, + rankForProgramming: model.rankForProgramming, + supportsChat: model.supportsChat, + supportsTools: model.supportsTools, + supportsCompletion: model.supportsCompletion)) + } } private func observerChangesToSettings() { diff --git a/app/modules/services/LLMService/Tests/LLMModelManagerTests.swift b/app/modules/services/LLMService/Tests/LLMModelManagerTests.swift index 12e43bfb7..b2cd3a46a 100644 --- a/app/modules/services/LLMService/Tests/LLMModelManagerTests.swift +++ b/app/modules/services/LLMService/Tests/LLMModelManagerTests.swift @@ -1098,7 +1098,11 @@ private func makeSchemaModel( prompt: 1.0, completion: 2.0), createdAt: Date().timeIntervalSince1970, - rankForProgramming: 1) + rankForProgramming: 1, + supportsChat: true, + supportsTools: true, + supportsReasoning: false, + supportsCompletion: true) } private func makeListModelsOutput(models: [Schema.Model]) -> Schema.ListModelsOutput { diff --git a/app/modules/services/SettingsService/Sources/DefaultSettingsService.swift b/app/modules/services/SettingsService/Sources/DefaultSettingsService.swift index f3e469cbf..f1a22c5c1 100644 --- a/app/modules/services/SettingsService/Sources/DefaultSettingsService.swift +++ b/app/modules/services/SettingsService/Sources/DefaultSettingsService.swift @@ -270,7 +270,7 @@ final class DefaultSettingsService: SettingsService { let keychainKeyPrefix = "cmd-keychain-key-" for provider in AIProvider.allCases { - let keychainKey = keychainKeyPrefix + provider.keychainKey + guard let keychainKey = provider.keychainKey.map({ keychainKeyPrefix + $0 }) else { continue } if let settings = settings.llmProviderSettings[provider] { privateKeys[keychainKey] = settings.apiKey publicSettings.llmProviderSettings[provider]?.apiKey = keychainKey diff --git a/contributing.md b/contributing.md index 928ead7cd..d5d63a248 100644 --- a/contributing.md +++ b/contributing.md @@ -55,6 +55,7 @@ export 
OPENAI_LOCAL_SERVER_PROXY="http://localhost:10003/v1" export GROQ_LOCAL_SERVER_PROXY="http://localhost:10004/openai/v1" export GEMINI_LOCAL_SERVER_PROXY="http://localhost:10005/v1beta" export GITHUB_COPILOT_PROXY="http://localhost:9090" +export OLLAMA_LOCAL_SERVER_PROXY="http://localhost:10006" # Claude Code (with Proxyman): cat > "$HOME/.claude/start_with_proxy.sh" << 'EOF' diff --git a/docs/docs.json b/docs/docs.json index 73d2c4c4c..754bbe413 100644 --- a/docs/docs.json +++ b/docs/docs.json @@ -26,6 +26,7 @@ "group": "Configuration", "pages": [ "pages/ai-providers", + "pages/ollama", "pages/models", "pages/code-completion", "pages/chat-modes", diff --git a/docs/pages/ai-providers.mdx b/docs/pages/ai-providers.mdx index 7faa6dfbe..97a746255 100644 --- a/docs/pages/ai-providers.mdx +++ b/docs/pages/ai-providers.mdx @@ -5,12 +5,13 @@ description: "Configure AI providers to use with cmd" ## Overview -cmd connects to AI providers using your API keys. You can configure multiple providers and switch between them as needed. This gives you flexibility to: +cmd connects to AI providers using your API keys, or use local inference with providers like Ollama. You can configure multiple providers and switch between them as needed. This gives you flexibility to: - Use different providers for different tasks +- Run AI models locally for privacy and offline development - Have backup options if one provider has issues - Compare performance across providers -- Take advantage of different pricing models +- Take advantage of different pricing models or eliminate API costs entirely ## Initial Setup @@ -61,6 +62,12 @@ When multiple providers offer the same model, you can set which provider to use +### Local Inference + +For complete data privacy and offline development, you can use [Ollama](/pages/ollama) to run AI models locally on your machine or on a private network server. This eliminates API costs and ensures your code never leaves your infrastructure. 
+ +See the [Ollama configuration guide](/pages/ollama) for setup instructions. + Configure multiple providers to compare costs and performance. You can switch providers anytime from **Settings > Models**. diff --git a/docs/pages/models.mdx b/docs/pages/models.mdx index 3652d40f0..19cc2d7cb 100644 --- a/docs/pages/models.mdx +++ b/docs/pages/models.mdx @@ -10,6 +10,7 @@ After configuring your [AI providers](/pages/ai-providers), you need to enable w - Which models are available in the model selector - Which provider to use when a model is available from multiple sources - Default model preferences +- Local models from [Ollama](/pages/ollama) for private, offline inference You can configure models during onboarding or anytime through **Settings > Models** or **Settings > AI Providers**. @@ -43,6 +44,7 @@ Some models may be available from multiple providers. For example: - **Claude Sonnet** from both Anthropic and OpenRouter - **GPT-4** from both OpenAI and Azure OpenAI - Popular models from both direct providers and aggregators +- Local models from Ollama vs. cloud providers ### Setting Provider Preference @@ -87,3 +89,28 @@ Once you've enabled models, you can switch between them easily in the chat inter The model selector shows only the models you've enabled in settings. After changing model mid-conversation, the next message will not have a cached prompt + +## Local Models + +For complete privacy and offline development, you can use local models through [Ollama](/pages/ollama). Once you've configured the Ollama provider, all models installed in your Ollama instance will automatically appear in the model list. 
+ + + + Use the Ollama CLI to install models: + ```bash + ollama pull qwen2.5-coder:7b + ``` + + + + If you've added new models to Ollama, refresh cmd's model list by disabling and re-enabling the Ollama provider in **Settings > AI Providers** + + + + Go to **Settings > Models** and enable the Ollama models you want to use + + + + + Local models run entirely on your machine, ensuring your code never leaves your infrastructure. This is ideal for sensitive projects or working offline. + diff --git a/docs/pages/ollama.mdx b/docs/pages/ollama.mdx new file mode 100644 index 000000000..7cb088c64 --- /dev/null +++ b/docs/pages/ollama.mdx @@ -0,0 +1,166 @@ +--- +title: "Ollama" +description: "Configure Ollama for local AI inference with cmd" +--- + +## Overview + +Ollama enables you to run AI models locally on your machine or on a private network endpoint. This gives you complete control over your data, eliminates API costs, and enables offline development. Ollama can automatically download and manage models for you, making local inference accessible and straightforward. + +## Prerequisites + +Before configuring Ollama in cmd, you need to have Ollama installed and running on your system. + + + + Download and install Ollama from the [official website](https://ollama.com/) or follow the [Quick Start guide](https://docs.ollama.com/quickstart). + + + + Ensure Ollama is running. The default installation sets up autostart, but you can also start it manually: + + ```bash + ollama serve + ``` + + Ollama will run on `http://localhost:11434` by default. + + + + Install one or more AI models. 
Ollama will automatically download the models when you first request them: + + ```bash + # Example: Install a coding-focused model + ollama pull devstral-small-2:24b + + # Or install a small model with lower system requirements + ollama pull qwen2.5-coder:7b + + # Or install a reasoning model + ollama pull deepseek-r1:14b + ``` + + You can browse available models at [https://ollama.com/search](https://ollama.com/search). + + + + Verify Ollama is working correctly: + + ```bash + ollama list + ``` + + This should show your installed models. + + + + + Ollama automatically loads models on-demand. You don't need to manually load models before using them with cmd. + + +## Configuring Ollama in cmd + +Once Ollama is installed and running, you can enable it in cmd: + + + + Go to **Settings > AI Providers** in cmd + + + + Click **"Add Provider"** or **"Configure"** for Ollama. + + By default, cmd connects to Ollama on `http://localhost:11434`. If you're running Ollama on a different port or on a remote server, you can customize the base URL. + + + + For a standard local Ollama installation, simply toggle **"Enable"** + + + + If you're running Ollama on a different port: + + ``` + Base URL: http://localhost:8080 + ``` + + + + If you're running Ollama on a remote server in your private network: + + ``` + Base URL: http://192.168.1.100:11434 + ``` + + + + + + cmd will automatically discover the available models from your Ollama installation when the provider is configured. + + + + Go to **Settings > Models** and enable the models you want to use in cmd. All models installed in Ollama will be available for selection. + + + + + If you install new models in Ollama after configuring the provider, you can refresh the model list by disabling and re-enabling the Ollama provider in **Settings > AI Providers**. 
+ + +## Using Ollama + +Once enabled and models are selected, you can use Ollama models just like any other AI provider: + + + + In the cmd interface, open the model selector and choose one of your Ollama models (e.g., "devstral-small-2:24b") + + + + You can now use Ollama models for: + - Chat and code assistance + - Agent mode for autonomous tasks (if supported by the model) + - All other cmd features such as code completion + + All inference happens locally on your machine or your private server - no data leaves your network. + + + +## Tested Models + +The following models have been successfully tested with cmd: + +- **qwen3-coder:30b** - High-performance coding model +- **devstral-small-2:24b** - Efficient development assistant +- **deepseek-r1:14b** - Reasoning-focused model +- **qwen2.5-coder:7b** - Lightweight coding model + +You can find more models at [https://ollama.com/search](https://ollama.com/search). + +## Benefits of Local Inference + +Using Ollama with cmd provides several advantages: + + + + All processing happens locally - your code never leaves your machine + + + Run unlimited inference without per-token charges + + + Work without internet connectivity + + + Use specialized or fine-tuned models for your specific needs + + + + + Local models require significant computational resources. Larger models provide better results but need more RAM and processing power. Ensure your system meets the requirements for the models you want to run. + + + + For the best coding experience, consider models specifically trained for code. These models understand programming contexts better than general-purpose models. 
+ diff --git a/docs/snippets/features-showcase.mdx b/docs/snippets/features-showcase.mdx index f2a280251..d077467c7 100644 --- a/docs/snippets/features-showcase.mdx +++ b/docs/snippets/features-showcase.mdx @@ -77,6 +77,19 @@ Learn how to configure External Agents → + + Run AI models entirely on your machine with Ollama: + - **Complete privacy**: Your code never leaves your infrastructure + - **Custom models**: Use specialized or fine-tuned models + - **Network deployment**: Run Ollama on private network servers + - **Offline development**: Work without internet connectivity + - **No API costs**: Unlimited inference without per-token charges + + Tested successfully with models like devstral-small-2 and qwen3-coder. + + Learn how to configure Ollama → + +