initial REST API for ramalama

Just an initial code, we can always improve on the road. Resolves: containers#725 Signed-off-by: Douglas Schilling Landgraf <dougsland@redhat.com>
dougsland · Feb 4, 2025 · 203dcd3 · 203dcd3 · packit-as-a-service · Feb 4, 2025
1 parent 3a08829
commit 203dcd3
Show file tree

Hide file tree

Showing 4 changed files with 102 additions and 0 deletions.
diff --git a/restapi/.gitignore b/restapi/.gitignore
@@ -0,0 +1 @@
+__pycache__/
diff --git a/restapi/README.md b/restapi/README.md
@@ -0,0 +1,21 @@
+## Running the server
+
+In the server side, run the following:
+
+```console
+uvicorn api:app --host 0.0.0.0 --port 8000 --reload
+```
+
+## Client side getting information
+
+```console
+curl -X GET "http://192.168.82.25:8000/models"
+
+{"models":["NAME                      MODIFIED      SIZE     ","ollama://tinyllama:latest 3 minutes ago 608.16 MB"]}% 
+```
+
+## Posting data
+
+```console
+curl -X POST "http://192.168.82.25:8000/run/tinyllama" &
+```
diff --git a/restapi/api.py b/restapi/api.py
@@ -0,0 +1,78 @@
+from fastapi import FastAPI
+from fastapi.responses import RedirectResponse
+import subprocess
+
+app = FastAPI()
+
+
+# Redirect root "/" to "/docs"
+@app.get("/", include_in_schema=False)
+def root():
+    return RedirectResponse(url="/docs")
+
+
+@app.get("/info")
+def info_command():
+    try:
+        result = subprocess.run(
+                ["ramalama", "info"], capture_output=True, text=True
+        )
+        return {"info": result.stdout.strip().split("\n")}
+    except Exception as e:
+        return {"error": str(e)}
+
+
+@app.get("/ps")
+def ps_command():
+    try:
+        result = subprocess.run(
+                ["ramalama", "ps"], capture_output=True, text=True
+        )
+        return {"ps": result.stdout.strip().split("\n")}
+    except Exception as e:
+        return {"error": str(e)}
+
+
+# List available AI models in RamaLama
+@app.get("/models")
+def list_models():
+    try:
+        result = subprocess.run(
+                ["ramalama", "list"], capture_output=True, text=True
+        )
+        return {"models": result.stdout.strip().split("\n")}
+    except Exception as e:
+        return {"error": str(e)}
+
+
+# Pull method
+@app.post("/pull/{model_name}")
+def pull_model(model_name: str):
+    try:
+        command = ["ramalama", "pull", model_name]
+        subprocess.run(command, check=True)
+        return {"message": f"Model {model_name} is running"}
+    except subprocess.CalledProcessError as e:
+        return {"error": str(e)}
+
+
+# Run an AI model
+# (chatbot will open in the server side at this moment)
+@app.post("/run/{model_name}")
+def run_model(model_name: str):
+    try:
+        command = ["ramalama", "run", model_name]
+        subprocess.run(command, check=True)
+        return {"message": f"Model {model_name} is running"}
+    except subprocess.CalledProcessError as e:
+        return {"error": str(e)}
+
+
+# Stop a running AI model
+@app.post("/stop/{model_name}")
+def stop_model(model_name: str):
+    try:
+        subprocess.run(["ramalama", "stop", model_name], check=True)
+        return {"message": f"Model {model_name} stopped"}
+    except Exception as e:
+        return {"error": str(e)}
diff --git a/restapi/requirements.txt b/restapi/requirements.txt
@@ -0,0 +1,2 @@
+fastapi
+uvicorn