Mirror of https://github.com/geoffsee/open-gsio.git (synced 2025-09-08 22:56:46 +00:00)
Add scripts and documentation for local inference configuration with Ollama and mlx-omni-server
- Introduced `configure_local_inference.sh` to automatically set `.dev.vars` based on active local inference services.
- Updated `start_inference_server.sh` to handle both Ollama and mlx-omni-server server types.
- Enhanced `package.json` to include new commands for starting and configuring inference servers.
- Refined README to include updated instructions for running and adding models for local inference.
- Minor cleanup in `MessageBubble.tsx`.
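The `package.json` changes themselves are not shown in this diff; a plausible sketch of the new command wiring, with script names that are purely illustrative assumptions:

    # hypothetical entries; the actual command names live in package.json
    npm run inference:configure   # invokes scripts/configure_local_inference.sh
    npm run inference:start       # invokes scripts/start_inference_server.sh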
committed by Geoff Seemueller
parent f2d91e2752
commit 9e8b427826

scripts/configure_local_inference.sh (executable file, 49 lines added)
@@ -0,0 +1,49 @@
#!/usr/bin/env bash

# Ensure .dev.vars file exists.
# This prevents errors if sed tries to edit a non-existent file and ensures '>>' appends.
touch .dev.vars

# Function to configure .dev.vars with the specified API key and endpoint
configure_dev_vars() {
  local endpoint_url=$1
  local api_key="required-but-not-used"

  echo "Configuring .dev.vars for endpoint: ${endpoint_url}"

  # Configure OPENAI_API_KEY
  # 1. Remove any existing OPENAI_API_KEY line
  #    (the '' after -i is BSD/macOS sed syntax; GNU sed takes a bare -i)
  sed -i '' '/^OPENAI_API_KEY=/d' .dev.vars
  # 2. Append a blank line (ensures the new variable is on a new line and adds spacing)
  echo "" >> .dev.vars
  # 3. Append the new OPENAI_API_KEY line
  echo "OPENAI_API_KEY=${api_key}" >> .dev.vars

  # Configure OPENAI_API_ENDPOINT
  # 1. Remove any existing OPENAI_API_ENDPOINT line
  sed -i '' '/^OPENAI_API_ENDPOINT=/d' .dev.vars
  # 2. Append the new OPENAI_API_ENDPOINT line
  echo "OPENAI_API_ENDPOINT=${endpoint_url}" >> .dev.vars

  echo "Local inference is configured for $endpoint_url"
}
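# For reference, after configure_dev_vars "http://localhost:11434" runs, the tail of
# .dev.vars holds the two appended settings (values taken from the function above):
#
#   OPENAI_API_KEY=required-but-not-used
#   OPENAI_API_ENDPOINT=http://localhost:11434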
echo "Checking for local inference services..."

# Check for Ollama on port 11434
# nc -z -w1 localhost 11434:
#   -z: Zero-I/O mode (port scanning)
#   -w1: Timeout after 1 second
#   >/dev/null 2>&1: Suppress output from nc
if nc -z -w1 localhost 11434 >/dev/null 2>&1; then
  echo "Ollama service detected on port 11434."
  configure_dev_vars "http://localhost:11434"
# Else, check for mlx-omni-server on port 10240
elif nc -z -w1 localhost 10240 >/dev/null 2>&1; then
  echo "mlx-omni-server service detected on port 10240."
  configure_dev_vars "http://localhost:10240"
else
  echo "No active local inference service (Ollama or mlx-omni-server) found on default ports (11434, 10240)."
  echo "If a service is running on a different port, .dev.vars may need manual configuration."
  echo ".dev.vars was not modified by this script for OpenAI local inference settings."
fi

echo "Script finished."