1st try of the backend

2026-01-19 22:02:50 +01:00
commit b90621f665
4 changed files with 125 additions and 0 deletions
--- a/backend/app.py
+++ b/backend/app.py
@@ -0,0 +1,71 @@
+from fastapi import FastAPI
+from pydantic import BaseModel
+import json
+
+from llm import ollama_chat
+# NOTE(review): this commit adds backend/tool.py (singular), but the import
+# below targets a module named "tools" — confirm which name is intended.
+from tools import web_search, electronics_ohm, run_command
+
+# Application instance; the /chat route below is registered on it.
+app = FastAPI()
+
+class ChatIn(BaseModel):
+    """Request body accepted by the POST /chat endpoint."""
+
+    message: str  # user text, forwarded to the model as the "user" message
+    model: str = "llama3.1"  # model name handed to ollama_chat; change if needed
+    mode: str = "AUTO"       # AUTO / DEV / ELEC / INFRA / WEB; not read by the visible handler
+
+# System prompt sent as the first message of every /chat request. The text is
+# runtime data (kept in French): it asks the model to be practical, to use the
+# tools it names when relevant, and to answer in French.
+SYSTEM = """Tu es un assistant personnel pour Nino.
+Tu dois être pratique, structuré, et orienté action.
+Si une demande nécessite une recherche web, utilise l'outil web_search.
+Si c'est de l'électronique, tu peux utiliser electronics_ohm ou demander les valeurs manquantes.
+Si une commande système est utile, propose run_command mais explique ce que ça fait.
+Réponds en français.
+"""
+
+# Second system message: lists the three tools and the single-line JSON shape
+# the model must emit to call one. The chat handler recognises a tool call by
+# a reply that starts with "{" and contains "tool" in double quotes.
+TOOLS_SPEC = """
+Outils disponibles (à appeler en JSON strict sur une seule ligne) :
+
+1) web_search: {"tool":"web_search","query":"...","max_results":5}
+2) electronics_ohm: {"tool":"electronics_ohm","V":null,"I":0.02,"R":220}
+3) run_command: {"tool":"run_command","cmd":"docker ps"}
+
+Si tu appelles un outil, n'écris QUE le JSON.
+"""
+
+def _parse_tool_call(reply: str) -> dict | None:
+    """Return the decoded tool call carried by *reply*, or None if it is not one.
+
+    A reply counts as a tool call only when it starts with "{", contains
+    "tool" in double quotes, parses as a JSON object and names its tool with a
+    string. Malformed JSON yields None so the caller can treat the reply as a
+    plain-text answer instead of failing the request.
+    """
+    if not (reply.startswith("{") and '"tool"' in reply):
+        return None
+    try:
+        call = json.loads(reply)
+    except json.JSONDecodeError:
+        return None
+    if isinstance(call, dict) and isinstance(call.get("tool"), str):
+        return call
+    return None
+
+def _tool_invocation(call: dict):
+    """Translate a decoded tool call into a ``(function, args)`` pair.
+
+    Returns None when the tool name is not one of the three known tools.
+    Raises KeyError when a required argument ("query" for web_search, "cmd"
+    for run_command) is absent from the call.
+    """
+    tool = call["tool"]
+    if tool == "web_search":
+        return web_search, (call["query"], call.get("max_results", 5))
+    if tool == "electronics_ohm":
+        return electronics_ohm, (call.get("V"), call.get("I"), call.get("R"))
+    if tool == "run_command":
+        return run_command, (call["cmd"],)
+    return None
+
+@app.post("/chat")
+async def chat(inp: ChatIn):
+    """Answer one chat message, running at most one tool on the model's behalf.
+
+    The model is first queried with the two system prompts and the user
+    message. If its reply is a well-formed call to a known tool, the tool is
+    run, its JSON-encoded result is appended as a "tool" message and the model
+    is queried again for the final answer.
+
+    Returns:
+        ``{"answer": ..., "tool_used": None}`` for a direct answer, otherwise
+        ``{"answer": ..., "tool_used": <name>, "tool_result": <result>}``.
+    """
+    import asyncio  # local import: only this handler needs it
+
+    messages = [
+        {"role": "system", "content": SYSTEM},
+        {"role": "system", "content": TOOLS_SPEC},
+        {"role": "user", "content": inp.message},
+    ]
+
+    # 1) the model either answers directly or emits a tool call
+    first = (await ollama_chat(inp.model, messages)).strip()
+    direct = {"answer": first, "tool_used": None}
+
+    # 2) anything that is not a well-formed call to a known tool is the answer
+    call = _parse_tool_call(first)
+    if call is None:
+        return direct
+    tool = call["tool"]
+    try:
+        invocation = _tool_invocation(call)
+    except KeyError as exc:
+        # Report the missing argument back to the model as a tool error
+        # rather than letting the request fail.
+        res = {"error": f"Argument manquant pour {tool}: {exc.args[0]}"}
+    else:
+        if invocation is None:
+            return direct
+        func, args = invocation
+        # Tool functions are plain synchronous calls; run them in a worker
+        # thread so the event loop is not blocked while they execute.
+        res = await asyncio.to_thread(func, *args)
+
+    # 3) hand the tool output back to the model for the final wording
+    messages.append({"role": "assistant", "content": first})
+    messages.append({"role": "tool", "content": json.dumps(res, ensure_ascii=False)})
+    final = await ollama_chat(inp.model, messages)
+    return {"answer": final, "tool_used": tool, "tool_result": res}
--- a/backend/llm.py
+++ b/backend/llm.py
@@ -0,0 +1,13 @@
+import httpx
+
+# Base URL of the Ollama HTTP server; ollama_chat appends "/api/chat" to it.
+OLLAMA_URL = "http://localhost:11434"
+
+async def ollama_chat(model: str, messages: list[dict]) -> str:
+    """Send *messages* to the Ollama chat endpoint and return the reply text.
+
+    Posts a non-streaming request to ``{OLLAMA_URL}/api/chat`` with a
+    120-second client timeout and returns the ``message.content`` field of the
+    JSON response. An HTTP error status raises via ``raise_for_status``.
+    """
+    endpoint = f"{OLLAMA_URL}/api/chat"
+    payload = {"model": model, "messages": messages, "stream": False}
+    async with httpx.AsyncClient(timeout=120) as session:
+        response = await session.post(endpoint, json=payload)
+        response.raise_for_status()
+        return response.json()["message"]["content"]
--- a/backend/requirements.txt
+++ b/backend/requirements.txt
@@ -0,0 +1,5 @@
+fastapi
+uvicorn
+httpx
+pydantic
+duckduckgo-search
--- a/backend/tool.py
+++ b/backend/tool.py
@@ -0,0 +1,36 @@
+from duckduckgo_search import DDGS
+import subprocess
+import shlex
+import math
+
+def web_search(query: str, max_results: int = 5) -> list[dict]:
+    """Run a DDGS text search and return the hits as plain dicts.
+
+    Each returned dict has the keys "title", "url" and "snippet", filled from
+    the hit's "title", "href" and "body" entries (None when an entry is absent).
+    """
+    with DDGS() as client:
+        return [
+            {"title": hit.get("title"), "url": hit.get("href"), "snippet": hit.get("body")}
+            for hit in client.text(query, max_results=max_results)
+        ]
+
+def electronics_ohm(V: float | None, I: float | None, R: float | None) -> dict:
+    """Solve V = I * R for whichever of the three quantities is None.
+
+    Exactly one of V, I, R must be None. Returns a one-entry dict keyed by the
+    solved quantity ("V", "I" or "R"). Returns ``{"error": message}`` instead
+    when the number of None arguments is not exactly one, or when the solve
+    would divide by zero.
+    """
+    if [V, I, R].count(None) != 1:
+        return {"error": "Donne exactement 2 valeurs (ex: V et R) et laisse l’autre à null."}
+    if V is None:
+        return {"V": I * R}
+    # Both remaining cases divide V by the other known value; select the
+    # unknown and its divisor once so the zero check is shared.
+    unknown, divisor, divisor_name = ("I", R, "R") if I is None else ("R", I, "I")
+    if divisor == 0:
+        return {"error": f"Division par zéro: {divisor_name} doit être non nul pour calculer {unknown}."}
+    return {unknown: V / divisor}
+
+# Programs run_command is willing to start; only the first token is checked.
+# NOTE(review): several entries (python, pip, docker, git) can execute
+# arbitrary code through their arguments, so this list is not a sandbox —
+# tighten it before the command string can come from untrusted input.
+SAFE_COMMANDS = {"git", "docker", "docker-compose", "python", "pip", "ls", "cat", "grep", "tail", "journalctl"}
+
+def run_command(cmd: str) -> dict:
+    """Run an allow-listed command without a shell and report its outcome.
+
+    The string is split with ``shlex.split``; its first token must be in
+    SAFE_COMMANDS. The process is given 25 seconds.
+
+    Returns:
+        ``{"returncode", "stdout", "stderr"}`` with each stream truncated to
+        its last 4000 characters, or ``{"error": message}`` when the command
+        is malformed, empty, not allowed, or fails to run.
+    """
+    try:
+        parts = shlex.split(cmd)
+    except ValueError as e:
+        # shlex raises on unbalanced quotes; report it like any other failure.
+        return {"error": f"Commande invalide: {e}"}
+    if not parts:
+        return {"error": "Commande vide."}
+    if parts[0] not in SAFE_COMMANDS:
+        return {"error": f"Commande interdite: {parts[0]} (liste: {sorted(SAFE_COMMANDS)})"}
+    try:
+        p = subprocess.run(parts, capture_output=True, text=True, timeout=25)
+    except Exception as e:
+        # Deliberately broad: any launch failure or timeout is returned to
+        # the caller as data instead of propagating.
+        return {"error": str(e)}
+    return {"returncode": p.returncode, "stdout": p.stdout[-4000:], "stderr": p.stderr[-4000:]}