Workflow analysis tools #22

Open · wants to merge 2 commits into master
2 changes: 1 addition & 1 deletion README.md
@@ -263,4 +263,4 @@ echo "127.0.1.1 $HOSTNAME" >> /etc/hosts
```
search svc.cluster.local
options ndots:5 timeout:1
```
```
7 changes: 7 additions & 0 deletions charts/hyperflow-ops/values.yaml
@@ -1,3 +1,7 @@
# This is needed to start KEDA when the cluster domain is different from cluster.local
# global:
#   clusterDomain: # provide the cluster domain

worker-pools:
enabled: false # Set to true if using worker pools execution model
enable-prometheus-adapter: &enable-prometheus-adapter true
@@ -53,6 +57,9 @@ hyperflow-worker-pool-operator:
username: guest
password: guest
erlangCookie: jiwng4pw7NJL3KutMb4pF7k6C5RphXYU
  # extraEnvVars: # uncomment and adjust if the cluster domain is different from cluster.local
  # - name: RABBITMQ_NODE_NAME
  #   value: "rabbit@$(MY_POD_NAME).rabbitmq-headless.$(MY_POD_NAMESPACE).svc.cluster.local"

kube-prometheus-stack:
enabled: *enable-kube-prometheus-stack
13 changes: 10 additions & 3 deletions charts/hyperflow-run/values.yaml
@@ -31,13 +31,20 @@ workerPools:
pools: # WorkerPool resources will be created according to this list
- name: mproject
taskType: mProject # this has to be equal to task name in workflow.json
initialResources: # example overridden setting
requests:
cpu: "1"
- name: mdiff
taskType: mDiffFit
initialResources:
requests:
cpu: "0.1"
limits:
cpu: "0.2"
- name: mbackground
taskType: mBackground
initialResources:
requests:
cpu: "0.05"
limits:
cpu: "0.1"


######################################################
15 changes: 15 additions & 0 deletions values/monitoring/api/README.md
@@ -0,0 +1,15 @@
# Hyperflow API – Metrics & Logs Interface

This project provides a FastAPI-based interface for querying workflow logs and metrics from OpenSearch.

---

## Setup Instructions

### 1. Create and activate the conda environment

Make sure you have [conda](https://docs.conda.io/en/latest/miniconda.html) installed.

```bash
conda env create -f environment.yml
conda activate hyperflow-api
```
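
### 2. Run the API and query it

The API can be started with `uvicorn main:app`; every endpoint uses HTTP Basic auth and forwards the credentials to OpenSearch. Below is a minimal client sketch, assuming the server listens on uvicorn's default port 8000 and using placeholder credentials and a placeholder workflow id:

```python
# Minimal client sketch (host, credentials and workflow id are placeholders).
import requests
from requests.auth import HTTPBasicAuth

API_URL = "http://localhost:8000"        # default uvicorn port; adjust if different
auth = HTTPBasicAuth("admin", "admin")   # forwarded by the API to OpenSearch

resp = requests.get(f"{API_URL}/logs/by-workflow/my-workflow-id", auth=auth)
resp.raise_for_status()
print(resp.json())  # e.g. {"message": "Logs saved", "file": "...", "count": 42}
```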
21 changes: 21 additions & 0 deletions values/monitoring/api/environment.yml
@@ -0,0 +1,21 @@
name: hyperflow-api
channels:
- conda-forge
- defaults
dependencies:
- python=3.11
- pandas
- numpy
- matplotlib
- seaborn
- scipy
- requests
- jupyter
- scikit-learn
- tqdm
- pip
- pip:
- fastapi
- uvicorn
- lightgbm
- joblib
1,353 changes: 1,353 additions & 0 deletions values/monitoring/api/example-notebook.ipynb

Large diffs are not rendered by default.

260 changes: 260 additions & 0 deletions values/monitoring/api/main.py
@@ -0,0 +1,260 @@
from fastapi import FastAPI, Depends, HTTPException, status, Query
from fastapi.security import HTTPBasic, HTTPBasicCredentials
from fastapi.responses import FileResponse, StreamingResponse
import requests
import json
import os
from typing import List, Dict, Tuple

app = FastAPI()

# --- CONFIGURATION ---
OPENSEARCH_URL = "http://localhost:9200"
SCROLL_TIME = "5m"
SCROLL_SIZE = 5000
LOGS_INDEX = "hyperflow_logs"
METRICS_INDEX = "hyperflow_metrics"

# --- SECURITY DEPENDENCY ---
security = HTTPBasic()

def get_auth(credentials: HTTPBasicCredentials = Depends(security)) -> Tuple[str, str]:
if not credentials.username or not credentials.password:
raise HTTPException(
status_code=status.HTTP_401_UNAUTHORIZED,
detail="Brak credentials",
headers={"WWW-Authenticate": "Basic"},
)
return credentials.username, credentials.password

# --- SHARED SCROLL HELPERS ---

def perform_initial_scroll(index: str, payload: Dict, auth: Tuple[str, str]) -> Dict:
return requests.get(
f"{OPENSEARCH_URL}/{index}/_search?scroll={SCROLL_TIME}",
json=payload,
auth=auth
).json()

def perform_scroll(scroll_id: str, auth: Tuple[str, str]) -> Dict:
return requests.post(
f"{OPENSEARCH_URL}/_search/scroll",
json={"scroll": SCROLL_TIME, "scroll_id": scroll_id},
auth=auth
).json()

def scroll_by_query(index: str, query_body: Dict, auth: Tuple[str, str]) -> List[Dict]:
"""
Uniwersalna funkcja scrollująca po zadanym body zapytania.
Zwraca listę dokumentów (hits).
"""
all_hits = []
payload = {"size": SCROLL_SIZE, "query": query_body}

resp = perform_initial_scroll(index, payload, auth)
scroll_id = resp.get("_scroll_id")
hits = resp.get("hits", {}).get("hits", [])
all_hits.extend(hits)

while hits:
resp = perform_scroll(scroll_id, auth)
scroll_id = resp.get("_scroll_id")
hits = resp.get("hits", {}).get("hits", [])
all_hits.extend(hits)

return all_hits
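# Note: scroll_by_query leaves its server-side scroll contexts open until SCROLL_TIME
# expires. A sketch of releasing the last context explicitly once scrolling is finished
# (not wired in above; this is the standard clear-scroll endpoint):
#
#   requests.delete(
#       f"{OPENSEARCH_URL}/_search/scroll",
#       json={"scroll_id": [scroll_id]},
#       auth=auth,
#   )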

@app.get("/logs/by-workflow/{workflow_id}")
def get_logs_by_workflow(
workflow_id: str,
auth: Tuple[str, str] = Depends(get_auth)
):
query_body = {"term": {"log.attributes.workflowId.keyword": workflow_id}}
hits = scroll_by_query(LOGS_INDEX, query_body, auth)

file_name = f"logs_{workflow_id}.json"
with open(file_name, "w", encoding="utf-8") as f:
json.dump([h["_source"] for h in hits], f, ensure_ascii=False, indent=2)

return {"message": "Zapisano logi", "file": os.path.abspath(file_name), "count": len(hits)}


@app.get("/logs/by-date")
def get_logs_by_date(
    start_date: str = Query(..., description="Start date in ISO format (e.g. 2025-05-01T00:00:00Z)"),
    end_date: str = Query(..., description="End date in ISO format (e.g. 2025-05-05T23:59:59Z)"),
auth: Tuple[str, str] = Depends(get_auth)
):
query_body = {
"range": {
"time": {
"gte": start_date,
"lte": end_date,
"format": "strict_date_optional_time"
}
}
}
hits = scroll_by_query(LOGS_INDEX, query_body, auth)

file_name = f"logs_{start_date}_{end_date}.json".replace(":", "-")
with open(file_name, "w", encoding="utf-8") as f:
json.dump([h["_source"] for h in hits], f, ensure_ascii=False, indent=2)

return {"message": "Zapisano logi", "file": os.path.abspath(file_name), "count": len(hits)}


@app.get("/metrics/by-workflow/{workflow_id}")
def get_metrics_by_workflow(
workflow_id: str,
auth: Tuple[str, str] = Depends(get_auth)
):
query_body = {"term": {"metric.attributes.workflowId.keyword": workflow_id}}
hits = scroll_by_query(METRICS_INDEX, query_body, auth)

file_name = f"metrics_{workflow_id}.json"
with open(file_name, "w", encoding="utf-8") as f:
json.dump([h["_source"] for h in hits], f, ensure_ascii=False, indent=2)

return {"message": "Zapisano metryki", "file": os.path.abspath(file_name), "count": len(hits)}


@app.get("/metrics/by-date")
def get_metrics_by_date(
    start_date: str = Query(..., description="Start date in ISO format (e.g. 2025-05-01T00:00:00Z)"),
    end_date: str = Query(..., description="End date in ISO format (e.g. 2025-05-05T23:59:59Z)"),
auth: Tuple[str, str] = Depends(get_auth)
):
must_clause = {
"range": {
"time": {
"gte": start_date,
"lte": end_date,
"format": "strict_date_optional_time"
}
}
}
query_body = {"bool": {"must": [must_clause]}}
hits = scroll_by_query(METRICS_INDEX, query_body, auth)

file_name = f"metrics_{start_date}_{end_date}.json".replace(":", "-")
with open(file_name, "w", encoding="utf-8") as f:
json.dump([h["_source"] for h in hits], f, ensure_ascii=False, indent=2)

return FileResponse(
path=file_name,
filename=os.path.basename(file_name),
media_type="application/json"
)


@app.get("/metrics/filter/by-workflow/{workflow_id}")
def filter_metrics_by_workflow(
workflow_id: str,
name: List[str] = Query(
None,
description="Filtruj po polu `name`; np. ?name=cpu-usage&name=memory-usage"
),
auth: Tuple[str, str] = Depends(get_auth)
):
must_clauses = [
{"term": {"metric.attributes.workflowId.keyword": workflow_id}}
]
if name:
must_clauses.append({"terms": {"name.keyword": name}})

query_body = {"bool": {"must": must_clauses}}
hits = scroll_by_query(METRICS_INDEX, query_body, auth)

file_name = f"metrics_filtered_{workflow_id}.json"
with open(file_name, "w", encoding="utf-8") as f:
json.dump([h["_source"] for h in hits], f, ensure_ascii=False, indent=2)

return {"message": "Zapisano przefiltrowane metryki", "file": os.path.abspath(file_name), "count": len(hits)}


@app.get("/metrics/filter/by-date")
def filter_metrics_by_date(
    start_date: str = Query(..., description="Start date in ISO format (e.g. 2025-05-01T00:00:00Z)"),
    end_date: str = Query(..., description="End date in ISO format (e.g. 2025-05-05T23:59:59Z)"),
    name: List[str] = Query(None, description="Filter by the `name` field; e.g. ?name=cpu-usage&name=memory-usage"),
    task_type: List[str] = Query(None, description="Filter by `metric.attributes.name`; ..."),
auth: Tuple[str, str] = Depends(get_auth)
):
must_clauses = [
{
"range": {
"time": {
"gte": start_date,
"lte": end_date,
"format": "strict_date_optional_time"
}
}
}
]
if name:
must_clauses.append({"terms": {"name.keyword": name}})

if task_type:
must_clauses.append({"terms": {"metric.attributes.name.keyword": task_type}})

query_body = {"bool": {"must": must_clauses}}
hits = scroll_by_query(METRICS_INDEX, query_body, auth)

file_name = f"metrics_filtered_{start_date}_{end_date}.json".replace(":", "-")
with open(file_name, "w", encoding="utf-8") as f:
json.dump([h["_source"] for h in hits], f, ensure_ascii=False, indent=2)

return FileResponse(
path=file_name,
filename=os.path.basename(file_name),
media_type="application/json"
)

@app.get("/logs/by-date/stream")
def stream_logs_by_date(
    start_date: str = Query(..., description="Start date in ISO format (e.g. 2025-05-01T00:00:00Z)"),
    end_date: str = Query(..., description="End date in ISO format (e.g. 2025-05-05T23:59:59Z)"),
auth: Tuple[str, str] = Depends(get_auth)
):
query_body = {
"range": {
"time": {
"gte": start_date,
"lte": end_date,
"format": "strict_date_optional_time"
}
}
}
hits = scroll_by_query(LOGS_INDEX, query_body, auth)

def generate():
for hit in hits:
yield json.dumps(hit["_source"]) + "\n"

    return StreamingResponse(generate(), media_type="application/x-ndjson")

@app.get("/metrics/by-date/stream")
def stream_metrics_by_date(
    start_date: str = Query(..., description="Start date in ISO format (e.g. 2025-05-01T00:00:00Z)"),
    end_date: str = Query(..., description="End date in ISO format (e.g. 2025-05-05T23:59:59Z)"),
auth: Tuple[str, str] = Depends(get_auth)
):
must_clause = {
"range": {
"time": {
"gte": start_date,
"lte": end_date,
"format": "strict_date_optional_time"
}
}
}
query_body = {"bool": {"must": [must_clause]}}
hits = scroll_by_query(METRICS_INDEX, query_body, auth)

def generate():
for hit in hits:
yield json.dumps(hit["_source"]) + "\n"

    return StreamingResponse(generate(), media_type="application/x-ndjson")
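# Client-side sketch for the two streaming endpoints above: each response line is a single
# JSON document, so results can be consumed lazily without buffering the whole payload
# (base_url, the date strings and the credentials below are placeholders):
#
#   with requests.get(f"{base_url}/metrics/by-date/stream",
#                     params={"start_date": start, "end_date": end},
#                     auth=(user, password), stream=True) as r:
#       for line in r.iter_lines():
#           if line:
#               doc = json.loads(line)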
