Merge remote-tracking branch 'origin' into cyber-security

Dr0p42 · Dr0p42 · commit a612803529d3 · 2025-10-23T17:39:46.000+02:00
diff --git a/Makefile b/Makefile
@@ -209,7 +209,7 @@ git-deps: .git/hooks/pre-commit
 # Create symbolic link to allow importing lib.abi from the virtual environment
 python_version=$(shell cat .python-version)
 .venv/lib/python$(python_version)/site-packages/abi: deps
-	@[ -L .venv/lib/python$(python_version)/site-packages/abi ] || ln -s `pwd`/lib/abi .venv/lib/python$(python_version)/site-packages/abi 
+	@[ -L .venv/lib/python$(python_version)/site-packages/abi ] || ln -s `pwd`/lib/abi .venv/lib/python$(python_version)/site-packages/abi
 
 # Install dependencies (alternative to .venv)
 install: dep
@@ -242,7 +242,7 @@ chat-chatgpt-agent: deps
 chat-claude-agent: deps
 	@ LOG_LEVEL=$(log_level) uv run python -m src.cli ClaudeAgent
 
-chat-deepseek-agent: deps 
+chat-deepseek-agent: deps
 	@ LOG_LEVEL=DEBUG uv run python -m src.cli DeepSeekAgent
 
 chat-gemini-agent: deps
@@ -292,7 +292,7 @@ create-pipeline: deps
 
 # Create a new ontology from template
 create-ontology: deps
-	@ LOG_LEVEL=ERROR uv run python -m src.core.abi.cli create-ontology 
+	@ LOG_LEVEL=ERROR uv run python -m src.core.abi.cli create-ontology
 
 # =============================================================================
 # CHAT WITH MARKETPLACE AGENTS
@@ -306,6 +306,10 @@ pull-request-description: deps
 chat-naas-agent: deps
 	@ LOG_LEVEL=$(log_level) uv run python -m src.cli NaasAgent
 
+# Bodo data analysis agent
+chat-bodo-agent: deps
+	@ LOG_LEVEL=$(log_level) uv run python -m src.cli BodoAgent
+
 # Customer support specialized agent
 chat-support-agent: deps
 	@ LOG_LEVEL=$(log_level) uv run python -m src.cli SupportAgent
@@ -345,7 +349,7 @@ mcp-test: deps
 
 # Interactive SPARQL terminal for querying the knowledge graph
 sparql-terminal: deps
-	@ uv run python -m src.core.abi.apps.sparql_terminal.main	
+	@ uv run python -m src.core.abi.apps.sparql_terminal.main
 
 # Oxigraph administrative interface for database management
 oxigraph-admin: deps
@@ -376,7 +380,7 @@ test-coverage: deps
 	@ uv run coverage-badge -f -o coverage.svg
 	@ echo "📊 Coverage report generated:"
 	@ echo "  - HTML: htmlcov/index.html"
-	@ echo "  - XML: coverage.xml" 
+	@ echo "  - XML: coverage.xml"
 	@ echo "  - Badge: coverage.svg"
 
 # Run basic tests for CI (no external dependencies)
@@ -550,7 +554,7 @@ build: build.linux.x86_64
 # Build Docker image for Linux x86_64 architecture with size reporting
 build.linux.x86_64: deps
 	DOCKER_BUILDKIT=1 docker build . -t abi -f docker/images/Dockerfile.linux.x86_64 --platform linux/amd64
-	
+
 	@# Show container size
 	@docker image ls abi
 
diff --git a/config.yaml b/config.yaml
@@ -53,3 +53,5 @@ modules:
     enabled: true
   - path: src/marketplace/applications/pubmed
     enabled: false
+  - path: src/marketplace/applications/bodo
+    enabled: false
diff --git a/pyproject.toml b/pyproject.toml
@@ -73,6 +73,7 @@ dependencies = [
     "dagster-aws[s3]>=0.27.12",
     "ratelimit>=2.2.1",
     "yahooquery>=2.4.1",
+    "bodo>=2025.10",
     "pandas-stubs>=2.3.2.250926",
 ]
 
diff --git a/src/core/abi/cli.py b/src/core/abi/cli.py
@@ -9,6 +9,8 @@
 import re
 from rich.console import Console
 from rich.prompt import Prompt
+import yaml
+import dotenv
 
 console = Console(style="")
 
@@ -80,8 +82,6 @@ def get_component_selection():
 
 def enable_module_in_config(module_path: str):
     """Enable the module in config files if they exist."""
-    import yaml
-    import dotenv
     dotenv.load_dotenv()
     
     env = os.getenv("ENV")
@@ -229,8 +229,9 @@ def create_new_module():
                         content = f.read()
                     
                     # Replace template references
-                    content = content.replace('__templates__', module_name)
                     content = content.replace('Template', module_name.replace('_', '').title())
+                    content = content.replace(template_path.replace('\\', '/').replace('/', '.'), target_path.replace('\\', '/').replace('/', '.'))
+                    content = content.replace('__templates__', module_name)
                     content = content.replace('template', module_name.replace('_', '').lower())
                     
                     # Update path references
diff --git a/src/marketplace/applications/bodo/agents/BodoAgent.py b/src/marketplace/applications/bodo/agents/BodoAgent.py
@@ -0,0 +1,86 @@
+from langchain_openai import ChatOpenAI
+from abi.services.agent.Agent import Agent, AgentConfiguration, AgentSharedState
+from src import secret
+from fastapi import APIRouter
+from src.marketplace.__demo__.workflows.ExecutePythonCodeWorkflow import ExecutePythonCodeWorkflow, ExecutePythonCodeWorkflowConfiguration
+from enum import Enum
+from typing import Optional
+from pydantic import SecretStr
+from langchain_core.tools import Tool, BaseTool
+
+NAME = "BodoAgent"
+MODEL = "gpt-4o"
+TEMPERATURE = 0
+DESCRIPTION = "An agent that can analyze large data with Bodo DataFrames"
+# TODO: Add avatar
+AVATAR_URL = "https://raw.githubusercontent.com/jupyter-naas/awesome-notebooks/refs/heads/master/.github/assets/logos/Naas.png"
+SYSTEM_PROMPT = f"""
+You are {NAME}, a data analysis assistant that uses Bodo DataFrames to efficiently explore and analyze datasets.
+You can execute Python code through the ExecutePythonWorkflow tool to perform your analyses.
+
+When a user asks a question involving data (e.g., describing a dataset, computing aggregates, or exploring patterns), you should:
+
+ * Write a complete Python script to perform the analysis.
+
+ * Always import bodo.pandas as pd at the top of the script (never use regular pandas).
+
+ * Read data using pandas-style APIs (for example: `pd.read_parquet("/path/to/file")`).
+
+ * Perform any operations or computations using standard pandas syntax (groupby, describe, value_counts, etc.).
+
+ * Print concise, readable outputs — summary statistics, shapes, missing value counts, or aggregates.
+
+ * Avoid unsafe or network operations; only read data and compute results.
+
+ * After running the workflow, summarize the findings in plain English.
+
+Your responses should be short, factual, and focused on analytical insights rather than speculation.
+"""  # Default system prompt; {NAME} is interpolated once, when the module is imported.
+SUGGESTIONS = ["Summarize this CSV file: /path/to/file.csv"]
+
+def create_agent(
+    agent_shared_state: Optional[AgentSharedState] = None,
+    agent_configuration: Optional[AgentConfiguration] = None
+) -> Agent:
+    """Build a BodoAgent backed by ChatOpenAI, with the Python code-execution workflow attached as tools."""
+    tools: list[Tool | BaseTool | Agent] = []  # filled below from the workflow's as_tools()
+
+    # Chat model: MODEL at TEMPERATURE, authenticated with the OPENAI_API_KEY secret
+    model = ChatOpenAI(
+        model=MODEL,
+        temperature=TEMPERATURE,
+        api_key=SecretStr(secret.get('OPENAI_API_KEY'))  # NOTE(review): behaviour when the secret is missing is not visible here; confirm
+    )
+
+    # Fall back to defaults when the caller passes no configuration or shared state
+    if agent_configuration is None:
+        agent_configuration = AgentConfiguration(system_prompt=SYSTEM_PROMPT)
+    if agent_shared_state is None:
+        agent_shared_state = AgentSharedState(thread_id="0")
+
+    # Expose the Python code-execution workflow to the agent as tools
+    config = ExecutePythonCodeWorkflowConfiguration(timeout=600, allow_imports=True)  # NOTE(review): timeout presumably in seconds; allow_imports=True presumably lets executed code import modules; confirm sandboxing
+    tools += ExecutePythonCodeWorkflow(config).as_tools()
+
+    return BodoAgent(
+        name=NAME,
+        description=DESCRIPTION,
+        chat_model=model,
+        tools=tools,
+        agents=[],
+        state=agent_shared_state,
+        configuration=agent_configuration,
+        # No memory argument is passed; NOTE(review): presumably the Agent base class configures it from POSTGRES_URL; confirm
+    )
+
+class BodoAgent(Agent):  # Agent subclass whose only override is as_api(), supplying Bodo-specific defaults
+    def as_api(  # Registers this agent on `router` by delegating to Agent.as_api
+        self,
+        router: APIRouter,
+        route_name: str = NAME,
+        name: str = NAME,
+        description: str = "API endpoints to call the Bodo agent completion.",
+        description_stream: str = "API endpoints to call the Bodo agent stream completion.",
+        tags: Optional[list[str | Enum]] = None,
+    ):
+        return super().as_api(router, route_name, name, description, description_stream, tags)  # arguments forwarded positionally, unchanged
diff --git a/src/marketplace/domains/cyber-security-analyst/agents/CyberSecurityAgent.py b/src/marketplace/domains/cyber-security-analyst/agents/CyberSecurityAgent.py
@@ -59,6 +59,12 @@ def create_agent(
 ) -> Optional[IntentAgent]:
     """Create Cyber Security Agent with all 22 competency question tools."""
     
+    if agent_shared_state is None:
+        agent_shared_state = AgentSharedState()
+    
+    if agent_configuration is None:
+        agent_configuration = AgentConfiguration(system_prompt=SYSTEM_PROMPT)
+    
     # Load model based on AI_MODE
     from src import secret
     from langchain_openai import ChatOpenAI
@@ -149,6 +155,5 @@ def create_agent(
         intents=intents,
         state=agent_shared_state,
         configuration=agent_configuration,
-        memory=None,
-        system_prompt=SYSTEM_PROMPT,
+        memory=None
     )
diff --git a/src/mcp_server.py b/src/mcp_server.py
@@ -136,7 +136,7 @@ async def wait_for_api():
     for attempt in range(max_retries):
         try:
             async with httpx.AsyncClient(timeout=5.0) as client:
-                response = await client.get(f"{ABI_API_BASE}/health")
+                response = await client.get(f"{ABI_API_BASE}")
                 if response.status_code == 200:
                     print("✅ API is ready!")
                     return True
@@ -222,4 +222,4 @@ def run():
         mcp.run(transport='stdio')
 
 if __name__ == "__main__":
-    run() 
+    run() 

Original file line number	Diff line number	Diff line change
`@@ -73,6 +73,7 @@ dependencies = [`
`73`	`73`	`"dagster-aws[s3]>=0.27.12",`
`74`	`74`	`"ratelimit>=2.2.1",`
`75`	`75`	`"yahooquery>=2.4.1",`
	`76`	`+ "bodo>=2025.10",`
`76`	`77`	`"pandas-stubs>=2.3.2.250926",`
`77`	`78`	`]`
`78`	`79`