@@ -55,6 +55,87 @@ def _extract_usage(parsed: dict) -> dict:
5555 }
5656
5757
58+ def _parse_gemini_json (stdout : str ) -> dict | None :
59+ """Parse output of `gemini -o json`. Returns None on failure."""
60+ text = (stdout or "" ).strip ()
61+ if not text :
62+ return None
63+ try :
64+ # gemini -o json usually outputs the JSON object directly,
65+ # but may have leading "Loaded cached credentials" etc.
66+ if "{" in text :
67+ text = text [text .find ("{" ):]
68+ return json .loads (text )
69+ except json .JSONDecodeError :
70+ return None
71+
72+
73+ def _calculate_gemini_cost (model_id : str , input_tok : int , output_tok : int ) -> float :
74+ """
75+ Calculate estimated cost for Gemini models (April 2026 pricing).
76+ """
77+ input_tok = int (input_tok or 0 )
78+ output_tok = int (output_tok or 0 )
79+ model_lower = (model_id or "" ).lower ()
80+
81+ # Pricing per 1M tokens
82+ if "3.1-pro" in model_lower :
83+ in_rate = 2.00
84+ out_rate = 12.00
85+ elif "3.1-flash" in model_lower :
86+ in_rate = 0.50
87+ out_rate = 3.00
88+ else :
89+ # Default to pro
90+ in_rate = 2.00
91+ out_rate = 12.00
92+
93+ return (input_tok / 1_000_000 * in_rate ) + (output_tok / 1_000_000 * out_rate )
94+
95+
def _extract_gemini_usage(parsed: dict) -> dict:
    """Aggregate token usage info from Gemini CLI's nested stats schema.

    Sums token counts and API latency across every model entry under
    ``stats.models`` (falling back to ``stats.model``), picks a "main"
    model for attribution, and returns a flat usage record.
    """
    stats = (parsed or {}).get("stats", {})
    per_model = stats.get("models") or stats.get("model") or {}

    # Running totals across all model entries.
    totals = {"input": 0, "candidates": 0, "cached": 0, "thoughts": 0}
    latency_ms = 0
    main_model = ""

    for model_id, entry in per_model.items():
        tokens = entry.get("tokens", {})
        for key in totals:
            totals[key] += int(tokens.get(key) or 0)

        latency_ms += int(entry.get("api", {}).get("totalLatencyMs") or 0)

        # Heuristic: the entry whose roles include "main" produced
        # the actual response.
        if "roles" in entry and "main" in entry["roles"]:
            main_model = model_id

    # No explicit "main" role — fall back to the first entry.
    if not main_model and per_model:
        main_model = next(iter(per_model))

    return {
        "model": main_model,
        "input_tokens": totals["input"],
        "output_tokens": totals["candidates"],
        "cache_read_tokens": totals["cached"],
        "cache_creation_tokens": 0,  # Gemini schema doesn't distinguish creation
        "cost_usd": _calculate_gemini_cost(
            main_model, totals["input"], totals["candidates"]
        ),
        "duration_api_ms": latency_ms,
    }
137+
138+
58139def _fmt_tok (n : int ) -> str :
59140 """Format a token count as compact human-readable (e.g. 12.3k, 1.2M)."""
60141 n = int (n or 0 )
@@ -485,16 +566,26 @@ def run_agent(self, agent_type: str, task: str, timeout: int = 1800,
485566 for attempt in range (1 , MAX_RETRIES + 1 ):
486567 try :
487568 cmd = []
488- # Strip CLAUDECODE env var to prevent nested-session detection
489- env = {k : v for k , v in os .environ .items () if k != "CLAUDECODE" }
569+ # Strip CLAUDECODE to prevent nested-session detection.
570+ # Strip GEMINI_API_KEY / GOOGLE_API_KEY so the Gemini CLI uses
571+ # OAuth credentials from ~/.gemini/oauth_creds.json rather than
572+ # the API key (which is only for Deep Research via Python API).
573+ _strip = {"CLAUDECODE" , "GEMINI_API_KEY" , "GOOGLE_API_KEY" }
574+ env = {k : v for k , v in os .environ .items () if k not in _strip }
490575 if self .model == "gemini" :
491576 boundary = self ._build_path_boundary ()
492577 cmd = [
493578 "gemini" ,
494- "-m " , "auto " ,
579+ "-p " , f"[SYSTEM RULE] { boundary } \n \n { full_prompt } " ,
495580 "--approval-mode" , "auto_edit" ,
496- f"[SYSTEM RULE] { boundary } \n \n { full_prompt } " ,
581+ "-o" , "json " ,
497582 ]
583+ # Respect model_variant if set
584+ ark_model = self ._get_ark_model ()
585+ if ark_model :
586+ cmd .extend (["-m" , ark_model ])
587+ else :
588+ cmd .extend (["-m" , "auto" ])
498589 elif self .model == "claude" :
499590 cmd = [
500591 "claude" , "-p" , full_prompt ,
@@ -518,6 +609,9 @@ def run_agent(self, agent_type: str, task: str, timeout: int = 1800,
518609 self .log (f"Unsupported model backend: { self .model } " , "ERROR" )
519610 return ""
520611
612+ ark_model = self ._get_ark_model ()
613+ self .log (f"Backend model: { self .model } | Model: { ark_model or 'default' } " , "INFO" )
614+
521615 process = subprocess .Popen (
522616 cmd ,
523617 stdin = subprocess .DEVNULL , # Don't hold terminal pty fd
@@ -552,6 +646,13 @@ def run_agent(self, agent_type: str, task: str, timeout: int = 1800,
552646 usage_record = _extract_usage (parsed )
553647 else :
554648 result = stdout
649+ elif self .model == "gemini" :
650+ parsed = _parse_gemini_json (stdout )
651+ if parsed is not None :
652+ result = parsed .get ("response" , "" ) or ""
653+ usage_record = _extract_gemini_usage (parsed )
654+ else :
655+ result = stdout
555656 else :
556657 result = stdout
557658
@@ -614,6 +715,13 @@ def run_agent(self, agent_type: str, task: str, timeout: int = 1800,
614715 usage_record = _extract_usage (parsed )
615716 else :
616717 result = stdout
718+ elif self .model == "gemini" :
719+ parsed = _parse_gemini_json (stdout )
720+ if parsed is not None :
721+ result = parsed .get ("response" , "" ) or ""
722+ usage_record = _extract_gemini_usage (parsed )
723+ else :
724+ result = stdout
617725 else :
618726 result = stdout
619727
0 commit comments