cytoscape: --layout flag with shared topological algorithm

jmchilton · claude · jmchilton · commit e576876e3212 · 2026-04-28T16:05:15.000-04:00
Adds `--layout <name>` to gxwf-viz, mirroring the TS port at
galaxy-tool-util-ts. Names match cytoscape.js layout vocabulary:

- preset (default) — today's behavior, byte-identical output
- topological — computed leveled layout, baked into each node's position
- dagre / breadthfirst / grid / cose / random — hint-only; positions
  dropped, runtime renderer (cytoscape.js) places nodes at view time

`topological` is a tiny longest-path layering (~30 LOC) with stride
constants pinned to a cross-language spec at
galaxy-tool-util-ts/docs/architecture/cytoscape-layout.md. Cross-language
parity verified end-to-end: TS and Python emit byte-identical positions
for the same workflow.

Default flat-list JSON shape preserved for back-compat. Non-default
layouts emit a {elements, layout} wrapper so consumers see the hint.

Template synced from TS (adds cytoscape-dagre + dagre CDN, $layout
substitution, falls back to preset if dagre unavailable).

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
diff --git a/gxformat2/cytoscape/__init__.py b/gxformat2/cytoscape/__init__.py
@@ -2,26 +2,42 @@
 
 from ._builder import cytoscape_elements
 from ._cli import main, to_cytoscape
+from ._layout import (
+    bakes_coordinates,
+    COL_STRIDE,
+    is_layout_name,
+    LAYOUT_NAMES,
+    ROW_STRIDE,
+    topological_positions,
+)
 from ._render import CYTOSCAPE_JS_TEMPLATE, render_html
 from .models import (
     CytoscapeEdge,
     CytoscapeEdgeData,
     CytoscapeElements,
+    CytoscapeLayout,
     CytoscapeNode,
     CytoscapeNodeData,
     CytoscapePosition,
 )
 
 __all__ = (
+    "COL_STRIDE",
     "CYTOSCAPE_JS_TEMPLATE",
     "CytoscapeEdge",
     "CytoscapeEdgeData",
     "CytoscapeElements",
+    "CytoscapeLayout",
     "CytoscapeNode",
     "CytoscapeNodeData",
     "CytoscapePosition",
+    "LAYOUT_NAMES",
+    "ROW_STRIDE",
+    "bakes_coordinates",
     "cytoscape_elements",
+    "is_layout_name",
     "main",
     "render_html",
     "to_cytoscape",
+    "topological_positions",
 )
diff --git a/gxformat2/cytoscape/_builder.py b/gxformat2/cytoscape/_builder.py
@@ -8,10 +8,12 @@
 from gxformat2.normalized import ensure_format2, NormalizedFormat2, NormalizedWorkflowStep
 from gxformat2.schema.gxformat2 import BaseInputParameter, GalaxyType, GalaxyWorkflow
 
+from ._layout import bakes_coordinates, is_layout_name, topological_positions
 from .models import (
     CytoscapeEdge,
     CytoscapeEdgeData,
     CytoscapeElements,
+    CytoscapeLayout,
     CytoscapeNode,
     CytoscapeNodeData,
     CytoscapePosition,
@@ -22,12 +24,22 @@
 
 def cytoscape_elements(
     workflow: dict[str, Any] | str | Path | GalaxyWorkflow | NormalizedFormat2,
+    *,
+    layout: str = "preset",
 ) -> CytoscapeElements:
     """Build Cytoscape visualization elements from a Galaxy workflow.
 
     Accepts anything ``normalized_format2()`` supports, plus an already
     normalized ``NormalizedFormat2`` instance.
+
+    ``layout`` selects the placement strategy (default ``preset``); see
+    ``_layout.py`` and the cross-language spec for details.
     """
+    if not is_layout_name(layout):
+        raise ValueError(
+            f'Unknown layout "{layout}". Valid values: ' "preset, topological, dagre, breadthfirst, grid, cose, random."
+        )
+
     if isinstance(workflow, NormalizedFormat2):
         nf2 = workflow
     else:
@@ -44,7 +56,25 @@ def cytoscape_elements(
         nodes.append(_step_node(step, i + inputs_offset))
         edges.extend(_step_edges(step, nf2))
 
-    return CytoscapeElements(nodes=nodes, edges=edges)
+    elements = CytoscapeElements(nodes=nodes, edges=edges)
+
+    if layout == "preset":
+        return elements
+
+    if bakes_coordinates(layout):
+        # Currently only ``topological`` reaches here.
+        positions = topological_positions(elements)
+        for node in nodes:
+            p = positions.get(node.data.id)
+            if p is not None:
+                node.position = p
+    else:
+        # Hint-only layout: drop coordinates; the runtime renderer places nodes.
+        for node in nodes:
+            node.position = None
+
+    elements.layout = CytoscapeLayout(name=layout)
+    return elements
 
 
 def _fallback_position(order_index: int) -> CytoscapePosition:
diff --git a/gxformat2/cytoscape/_cli.py b/gxformat2/cytoscape/_cli.py
@@ -5,6 +5,7 @@
 import sys
 
 from ._builder import cytoscape_elements
+from ._layout import LAYOUT_NAMES
 from ._render import render_html
 
 SCRIPT_DESCRIPTION = """
@@ -19,20 +20,23 @@
 """
 
 
-def to_cytoscape(workflow_path: str, output_path=None):
+def to_cytoscape(workflow_path: str, output_path=None, layout: str = "preset"):
     """Produce cytoscape output for supplied workflow path."""
     if output_path is None:
+        # No explicit output path: reuse the workflow path with its extension
+        # swapped for ``.html``.
         output_path, _ = os.path.splitext(workflow_path)
         output_path += ".html"
 
-    elements = cytoscape_elements(workflow_path)
+    elements = cytoscape_elements(workflow_path, layout=layout)
 
+    # Output format is chosen by extension: ``.html`` gets the rendered page,
+    # anything else gets JSON.
     if output_path.endswith(".html"):
         with open(output_path, "w") as f:
-            f.write(render_html(elements))
+            f.write(render_html(elements, layout=layout))
     else:
+        # Bare flat list for ``preset`` (back-compat); wrapped {elements, layout}
+        # otherwise so the layout hint travels with the JSON.
+        payload = elements.to_list() if layout == "preset" else elements.to_dict()
         with open(output_path, "w") as f:
-            json.dump(elements.to_list(), f)
+            json.dump(payload, f)
 
 
 def main(argv=None):
@@ -41,7 +45,7 @@ def main(argv=None):
         argv = sys.argv[1:]
 
     args = _parser().parse_args(argv)
-    to_cytoscape(args.input_path, args.output_path)
+    to_cytoscape(args.input_path, args.output_path, layout=args.layout)
 
 
 def _parser():
@@ -50,4 +54,14 @@ def _parser():
     parser = argparse.ArgumentParser(description=SCRIPT_DESCRIPTION)
     parser.add_argument("input_path", metavar="INPUT", type=str, help="input workflow path (.ga/gxwf.yml)")
     parser.add_argument("output_path", metavar="OUTPUT", type=str, nargs="?", help="output viz path (.json/.html)")
+    parser.add_argument(
+        "--layout",
+        type=str,
+        default="preset",
+        choices=list(LAYOUT_NAMES),
+        help=(
+            "Layout strategy: preset (default; honors workflow positions), "
+            "topological (computed leveled layout), dagre, breadthfirst, grid, cose, random"
+        ),
+    )
     return parser
diff --git a/gxformat2/cytoscape/_layout.py b/gxformat2/cytoscape/_layout.py
@@ -0,0 +1,117 @@
+"""Cross-language topological layout for Cytoscape elements.
+
+Mirror of the TypeScript port at
+``galaxy-tool-util-ts/packages/schema/src/workflow/cytoscape-layout.ts``.
+
+Both implementations MUST produce byte-identical (x, y) coordinates for a
+given input. The normative spec lives in the galaxy-tool-util-ts repo at
+``docs/architecture/cytoscape-layout.md``. Any change here is a breaking
+visual diff and must land in lockstep with that file.
+"""
+
+from __future__ import annotations
+
+from typing import get_args, Literal
+
+from .models import CytoscapeElements, CytoscapePosition
+
+# Stride constants for the ``topological`` layout: a node in column ``c`` and
+# row ``r`` is placed at ``(c * COL_STRIDE, r * ROW_STRIDE)``.
+COL_STRIDE = 220
+ROW_STRIDE = 100
+
+# Closed set of layout names accepted by this module.
+LayoutName = Literal[
+    "preset",
+    "topological",
+    "dagre",
+    "breadthfirst",
+    "grid",
+    "cose",
+    "random",
+]
+
+# Runtime tuple of the names above, derived from the ``Literal`` so the two
+# cannot drift apart.
+LAYOUT_NAMES: tuple[str, ...] = get_args(LayoutName)
+
+
+def is_layout_name(value: str) -> bool:
+    """Return ``True`` if ``value`` is one of the names in ``LAYOUT_NAMES``."""
+    return value in LAYOUT_NAMES
+
+
+def bakes_coordinates(layout: str) -> bool:
+    """Return ``True`` for layouts that bake coordinates into each node's ``position``.
+
+    Only ``preset`` and ``topological`` qualify. All other layouts are
+    hint-only and rely on the runtime renderer.
+    """
+    return layout in ("preset", "topological")
+
+
+def topological_positions(elements: CytoscapeElements) -> dict[str, CytoscapePosition]:
+    """Compute positions per the topological layering spec.
+
+    A node with no incoming edges sits in column ``0``; otherwise its column
+    is one more than the largest column among its sources. Nodes that are
+    never reached by the topological sort (cycle fallback) use their
+    declaration index as the column. Within a column, rows follow
+    declaration order. Edges whose source or target is not a known node are
+    ignored.
+
+    Returns a mapping keyed by node ``data.id``; each value is
+    ``CytoscapePosition(x=column * COL_STRIDE, y=row * ROW_STRIDE)``.
+    """
+    nodes = elements.nodes
+    node_ids = [n.data.id for n in nodes]
+    # Declaration index of each node id; drives the tie-breaks and the cycle
+    # fallback below.
+    index_by_id = {node_id: i for i, node_id in enumerate(node_ids)}
+
+    # Sources feeding each node, one entry per edge.
+    incoming: dict[str, list[str]] = {node_id: [] for node_id in node_ids}
+    for edge in elements.edges:
+        source = edge.data.source
+        target = edge.data.target
+        # Skip edges that reference ids not present in ``elements.nodes``.
+        if source not in index_by_id or target not in index_by_id:
+            continue
+        incoming[target].append(source)
+
+    in_degree: dict[str, int] = {node_id: len(srcs) for node_id, srcs in incoming.items()}
+
+    # Reverse adjacency: for each node, the targets it feeds.
+    dependents: dict[str, list[str]] = {node_id: [] for node_id in node_ids}
+    for target, sources in incoming.items():
+        for s in sources:
+            dependents[s].append(target)
+
+    column: dict[str, int] = {}
+    visited: set[str] = set()
+
+    # Kahn topo sort, declaration-index tie break.
+    queue: list[str] = [node_id for node_id in node_ids if in_degree[node_id] == 0]
+    queue.sort(key=lambda nid: index_by_id[nid])
+
+    while queue:
+        # Pop lowest declaration index.
+        # Dependents are appended in discovery order, so the minimum is
+        # re-selected by a linear scan on every pass.
+        best = 0
+        for i in range(1, len(queue)):
+            if index_by_id[queue[i]] < index_by_id[queue[best]]:
+                best = i
+        node_id = queue.pop(best)
+        visited.add(node_id)
+
+        sources = incoming[node_id]
+        if not sources:
+            column[node_id] = 0
+        else:
+            # Longest-path layering: one column past the furthest source.
+            max_col = 0
+            for s in sources:
+                c = column.get(s)
+                # A source without a column yet is ignored.
+                if c is not None and c + 1 > max_col:
+                    max_col = c + 1
+            column[node_id] = max_col
+
+        # A dependent becomes ready once every incoming edge is accounted for.
+        for dep in dependents[node_id]:
+            in_degree[dep] -= 1
+            if in_degree[dep] == 0:
+                queue.append(dep)
+
+    # Cycle fallback: any unvisited node gets column = declaration index.
+    for node_id in node_ids:
+        if node_id not in visited:
+            column[node_id] = index_by_id[node_id]
+
+    # Row assignment: per column, declaration order.
+    rows_by_column: dict[int, list[str]] = {}
+    for node_id in node_ids:
+        c = column[node_id]
+        rows_by_column.setdefault(c, []).append(node_id)
+
+    positions: dict[str, CytoscapePosition] = {}
+    for c, ids in rows_by_column.items():
+        for row, node_id in enumerate(ids):
+            positions[node_id] = CytoscapePosition(x=c * COL_STRIDE, y=row * ROW_STRIDE)
+    return positions
diff --git a/gxformat2/cytoscape/_render.py b/gxformat2/cytoscape/_render.py
@@ -9,12 +9,15 @@
 CYTOSCAPE_JS_TEMPLATE = os.path.join(os.path.dirname(__file__), "cytoscape.html")
 
 
-def render_html(elements: CytoscapeElements) -> str:
+def render_html(elements: CytoscapeElements, layout: str = "preset") -> str:
     """Return a standalone HTML page visualizing the workflow with Cytoscape.js.
 
     The returned string is a complete HTML document suitable for writing
     to a file or embedding in a Jupyter notebook.
     """
     with open(CYTOSCAPE_JS_TEMPLATE) as f:
         template = f.read()
-    return string.Template(template).safe_substitute(elements=json.dumps(elements.to_list()))
+    # Both values are JSON-encoded so they drop into the template's
+    # ``$elements`` and ``$layout`` placeholders as JavaScript literals.
+    return string.Template(template).safe_substitute(
+        elements=json.dumps(elements.to_list()),
+        layout=json.dumps(layout),
+    )
diff --git a/gxformat2/cytoscape/cytoscape.html b/gxformat2/cytoscape/cytoscape.html
@@ -5,18 +5,36 @@
 <head>
     <title>Galaxy Workflow</title>
     <script src="https://unpkg.com/cytoscape@3.33.2/dist/cytoscape.min.js"></script>
+    <script src="https://unpkg.com/dagre@0.8.5/dist/dagre.min.js"></script>
+    <script src="https://unpkg.com/cytoscape-dagre@2.5.0/cytoscape-dagre.js"></script>
     <script src="https://unpkg.com/@popperjs/core@2.11.8/dist/umd/popper.min.js"></script>
     <script src="https://unpkg.com/cytoscape-popper@2.0.0/cytoscape-popper.js"></script>
     <script src="https://unpkg.com/tippy.js@6.3.7/dist/tippy.umd.min.js"></script>
     <link rel="stylesheet" href="https://unpkg.com/tippy.js@6.3.7/dist/tippy.css" />
     <script>
 document.addEventListener("DOMContentLoaded", function() {
+    var requestedLayout = $layout;
+    var dagreReady = (typeof cytoscapeDagre !== 'undefined');
+    if (dagreReady && cytoscape.use) {
+        try { cytoscape.use(cytoscapeDagre); } catch (e) { /* already registered */ }
+    }
+    var layoutConfig = (function(name) {
+        if (name === 'dagre') {
+            return dagreReady
+                ? { name: 'dagre', rankDir: 'LR', nodeSep: 40, rankSep: 80 }
+                : { name: 'preset' };
+        }
+        if (name === 'breadthfirst') return { name: 'breadthfirst', directed: true, spacingFactor: 1.2 };
+        if (name === 'grid') return { name: 'grid' };
+        if (name === 'cose') return { name: 'cose' };
+        if (name === 'random') return { name: 'random' };
+        if (name === 'topological') return { name: 'preset' };
+        return { name: 'preset' };
+    })(requestedLayout);
     var cy = cytoscape({
         container: document.getElementById('cy'),
         elements: $elements,
-        layout: {
-            name: 'preset'
-        },
+        layout: layoutConfig,
         // so we can see the ids
         style: [
             {
@@ -46,6 +64,27 @@
                     shape: 'round-rectangle',
                     'background-color': '#2c3143'
                 }
+            },
+            {
+                selector: 'edge.mapover_1',
+                style: { width: 4, 'line-color': '#5a8' }
+            },
+            {
+                selector: 'edge.mapover_2',
+                style: { width: 6, 'line-color': '#5a8' }
+            },
+            {
+                selector: 'edge.mapover_3',
+                style: { width: 8, 'line-color': '#5a8' }
+            },
+            {
+                selector: 'edge.reduction',
+                style: {
+                    'line-style': 'dashed',
+                    'line-color': '#a55',
+                    'target-arrow-shape': 'tee',
+                    'target-arrow-color': '#a55'
+                }
             }
         ]
       });
@@ -83,6 +122,14 @@
             } else {
                 innerHTML += "Connected to input " + input;
             }
+            let mapDepth = ele.data("map_depth");
+            if (mapDepth) {
+                let mapping = ele.data("mapping");
+                innerHTML += "<p><i>Map depth:</i> " + mapDepth + (mapping ? " (" + mapping + ")" : "") + "</p>";
+            }
+            if (ele.data("reduction")) {
+                innerHTML += "<p><i>Reduction:</i> list → multi-data</p>";
+            }
         }
         content.innerHTML = innerHTML;
 
diff --git a/gxformat2/cytoscape/models.py b/gxformat2/cytoscape/models.py
diff --git a/tests/test_cytoscape_layout.py b/tests/test_cytoscape_layout.py
diff --git a/tests/test_cytoscape_layout_integration.py b/tests/test_cytoscape_layout_integration.py