add local-ai

2024-11-10 14:19:42 -05:00
parent 423fff7750
commit 8f1af975e6
2 changed files with 167 additions and 0 deletions


@@ -0,0 +1,135 @@
# Local AI with Anything LLM
<https://github.com/Mintplex-Labs/anything-llm/blob/master/docker/HOW_TO_USE_DOCKER.md>
<https://localai.io/>
## Run locally
```bash
podman network create localai
mkdir -p ./volumes/local-ai/local-ai
mkdir -p ./volumes/local-ai/anythingllm
# Local AI
podman run \
-d \
-p 127.0.0.1:8080:8080 \
--network localai \
--name local-ai \
-v ./volumes/local-ai/local-ai:/build/models \
quay.io/go-skynet/local-ai:latest-cpu
# Anything LLM Interface
podman run -d \
-p 127.0.0.1:3001:3001 \
--cap-add SYS_ADMIN \
--network localai \
--name anything-llm \
-v ./volumes/local-ai/anythingllm:/app/server/storage \
-e STORAGE_DIR="/app/server/storage" \
docker.io/mintplexlabs/anythingllm
```
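Once both containers are up, a quick sanity check (a sketch, assuming the port mappings above) is to confirm they are running and answering on localhost:
```bash
# Both containers should show as running.
podman ps --filter name=local-ai --filter name=anything-llm
# The Anything LLM web UI should respond on port 3001.
curl -I http://127.0.0.1:3001
```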
## Run in Production
This installs both Local AI and Anything LLM as backend/frontend services.
Note:
You'll need host folders for the models and the Anything LLM storage; the chown gives ownership to UID 1000, the user the AnythingLLM container runs as.
```bash
mkdir /models
mkdir /anything-llm
chown 1000:1000 /anything-llm
```
```bash
podman network create localai
# Local AI
podman run \
-d \
-p 127.0.0.1:8080:8080 \
--network localai \
--name local-ai \
-v /models:/build/models \
quay.io/go-skynet/local-ai:latest-cpu
# Anything LLM Interface
podman run -d \
-p 127.0.0.1:3001:3001 \
--cap-add SYS_ADMIN \
--network localai \
--name anything-llm \
-v /anything-llm:/app/server/storage \
-e STORAGE_DIR="/app/server/storage" \
docker.io/mintplexlabs/anythingllm
```
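To keep both containers running across reboots, one option (a sketch; newer podman releases recommend Quadlet instead) is to generate systemd units from the running containers:
```bash
# Generate unit files from the running containers.
podman generate systemd --new --files --name local-ai
podman generate systemd --new --files --name anything-llm
# Install and enable the generated units.
mv container-local-ai.service container-anything-llm.service /etc/systemd/system/
systemctl daemon-reload
systemctl enable --now container-local-ai.service container-anything-llm.service
```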
## Models
### Config
```yaml
name: llama-3.2
parameters:
  model: huggingface/Llama-3.2-3B-Instruct-f16.gguf
  temperature: 0.6
backend: llama-cpp
# Default context size
context_size: 8192
threads: 16
```
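LocalAI reads model definitions from its models directory, so a config like this can be dropped next to the GGUF it references (a sketch, assuming the /models mount from the production commands and a hypothetical file name llama-3.2.yaml):
```bash
# Place the model definition in the mounted models directory.
cp llama-3.2.yaml /models/
# The path under `model:` is resolved relative to the models directory,
# so the GGUF must already be present there (e.g. under /models/huggingface/).
ls /models
# Restart LocalAI so it picks up the new definition.
podman restart local-ai
```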
### Chat
llama-3.2-3b-instruct:q8_0
### Code
llama3.2-3b-enigma
### Agent
llama-3.2-3b-instruct:q8_0
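With the models installed, LocalAI's OpenAI-compatible API can be used to confirm they are registered and responding (ports per the run commands above):
```bash
# List the models LocalAI has loaded from the models directory.
curl http://127.0.0.1:8080/v1/models
# Send a test chat completion to the llama-3.2 config defined earlier.
curl http://127.0.0.1:8080/v1/chat/completions \
  -H "Content-Type: application/json" \
  -d '{"model": "llama-3.2", "messages": [{"role": "user", "content": "Hello"}]}'
```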
## Nginx
```bash
certbot-3 certonly --dns-route53 -d chatreesept.reeseapps.com
```
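The --dns-route53 challenge needs certbot's Route 53 plugin plus AWS credentials that can edit the hosted zone; a dry-run renewal is a reasonable way to confirm renewals will keep working (package name shown is the Fedora/RHEL one):
```bash
# DNS-01 validation through Route 53 requires the plugin package.
dnf install python3-certbot-dns-route53
# Exercise the full renewal path without issuing a real certificate.
certbot-3 renew --dry-run
```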
Make sure to add the following server block inside your http block; the timeout settings keep long-running LLM requests from being cut off, and the agent-invocation location enables websocket upgrades for the agent protocol:
```conf
server {
    listen 80;
    server_name [insert FQDN here];

    # Enable websocket connections for agent protocol.
    location ~* ^/api/agent-invocation/(.*) {
        proxy_pass http://127.0.0.1:3001;
        proxy_http_version 1.1;
        proxy_set_header Upgrade $http_upgrade;
        proxy_set_header Connection "Upgrade";
    }

    location / {
        # Prevent timeouts on long-running requests.
        proxy_connect_timeout 605;
        proxy_send_timeout 605;
        proxy_read_timeout 605;
        send_timeout 605;
        keepalive_timeout 605;

        # Enable readable HTTP Streaming for LLM streamed responses
        proxy_buffering off;
        proxy_cache off;

        # Proxy your locally running service
        proxy_pass http://127.0.0.1:3001;
    }
}
```
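After adding the server block, validate and reload nginx:
```bash
# Check the configuration for syntax errors before applying it.
nginx -t
# Reload nginx without dropping existing connections.
systemctl reload nginx
```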


@@ -0,0 +1,32 @@
server {
    listen 127.0.0.1:8443 ssl;
    server_name chatreesept.reeseapps.com;

    ssl_certificate /etc/letsencrypt/live/chatreesept.reeseapps.com/fullchain.pem;
    ssl_certificate_key /etc/letsencrypt/live/chatreesept.reeseapps.com/privkey.pem;
    include /etc/letsencrypt/options-ssl-nginx.conf;
    ssl_dhparam /etc/letsencrypt/ssl-dhparams.pem;

    location ~* ^/api/agent-invocation/(.*) {
        proxy_pass http://localhost:3001;
        proxy_http_version 1.1;
        proxy_set_header Upgrade $http_upgrade;
        proxy_set_header Connection "Upgrade";
    }

    location / {
        client_max_body_size 50m;

        # Prevent timeouts on long-running requests.
        proxy_connect_timeout 605;
        proxy_send_timeout 605;
        proxy_read_timeout 605;
        send_timeout 605;
        keepalive_timeout 605;

        # Enable readable HTTP Streaming for LLM streamed responses
        proxy_buffering off;
        proxy_cache off;

        proxy_pass http://localhost:3001;
    }
}