build(agent): molt-d#cb502d iteration

2026-04-15 01:16:38 +02:00 · 2026-04-15 01:16:38 +02:00 · 74e1d93590
parent 10e633b070
commit 74e1d93590
15 changed files with 362 additions and 2 deletions
--- a/.gitignore
+++ b/.gitignore
@ -0,0 +1,21 @@
+node_modules/
+.npmrc
+.env
+.env.*
+__tests__/
+coverage/
+.nyc_output/
+dist/
+build/
+.cache/
+*.log
+.DS_Store
+tmp/
+.tmp/
+__pycache__/
+*.pyc
+.venv/
+venv/
+*.egg-info/
+.pytest_cache/
+READY_TO_PUBLISH
--- a/AGENTS.md
+++ b/AGENTS.md
@ -0,0 +1,33 @@
+# OpenGrowth Agents — Architecture & Contribution Guide
+
+Overview
+- A lightweight, privacy-preserving federated experimentation MVP intended for startup growth insights.
+- Core stack is Python-based with a clean, testable API surface suitable for gradual expansion.
+
+Tech Stack
+- Language: Python 3.8+
+- Components:
+  - SchemaRegistry: stores schemas and templates for experiments and metrics
+  - ExperimentTemplate: lightweight representation of experiments
+  - Adapters: GA4Adapter, SegmentAdapter to map analytics metrics into the canonical representation
+  - SecureAggregator: simple, privacy-preserving aggregation (mean + 95% CI)
+  - CloudLedger: simple, auditable, cloud-anchored ledger simulation
+  - Governance: AccessControl and Policy scaffold
+
+Testing & Quality
+- Tests are written with pytest and must pass locally before publishing
+- test.sh orchestrates tests plus a packaging build check
+
+Running Tests
+- bash test.sh
+
+Extending the MVP
+- Add more adapters (e.g., Amplitude) with a consistent interface
+- Expand governance with versioned templates and access controls
+- Implement a more robust secure aggregation (secure multi-party computation or differential privacy knobs in practice)
+- Build an initial REST/MQTT adapter to connect analytics stacks to the federation layer
+
+Contribution Rules
+- Keep changes small and incrementally testable
+- Add tests for any new public API
+- Update AGENTS.md if the architecture evolves or new agents are introduced
--- a/README.md
+++ b/README.md
@ -1,3 +1,15 @@
-# opengrowth-privacy-preserving-federated-
+# OpenGrowth Privacy-Preserving Federated (MVP)

-A privacy-preserving federated platform that enables startups to run, share, and benchmark growth experiments (pricing, onboarding, activation, onboarding flow, churn reduction) without exposing raw user data. Each startup retains local metrics (CAC,
+This repository contains a minimal, self-contained Python MVP for a privacy-preserving federated growth experimentation platform.
+
+- Exposes a lightweight API surface used by tests:
+  - SchemaRegistry, ExperimentTemplate
+  - SecureAggregator, CloudLedger, AccessControl, Governance
+  - GA4Adapter, SegmentAdapter
+- Includes a tiny in-repo implementation that can be extended later to integrate real adapters and secure aggregation techniques.
+
+Build and test
+- The project uses pyproject.toml with setuptools. Use `bash test.sh` to run tests and packaging checks.
+
+For maintainers
+- See AGENTS.md for architecture and contribution guidelines.
--- a/opengrowth_privacy_preserving_federated_/init.py
+++ b/opengrowth_privacy_preserving_federated_/init.py
@ -0,0 +1,79 @@
+"""OpenGrowth Privacy-Preserving Federated (MVP) package
+
+Lightweight in-repo implementation used by tests. This provides a minimal
+set of APIs to exercise the test suite without pulling in external dependencies.
+"""
+from . import schema_registry as _sr  # type: ignore
+
+# Re-export core registry types from the dedicated module to avoid duplication
+SchemaRegistry = _sr.SchemaRegistry
+ExperimentTemplate = _sr.ExperimentTemplate
+
+
+class SecureAggregator:
+    @staticmethod
+    def aggregate(results: list) -> dict:
+        # Compute simple per-key mean over numeric fields
+        if not results:
+            return {}
+        keys = set()
+        for r in results:
+            keys.update(r.keys())
+        out = {}
+        for k in keys:
+            vals = [r[k] for r in results if isinstance(r.get(k), (int, float))]
+            if not vals:
+                continue
+            mean = sum(vals) / len(vals)
+            out[k] = {"mean": mean}
+        return out
+
+
+class CloudLedger:
+    _last_anchor = None
+
+    @classmethod
+    def anchor(cls, payload: dict) -> str:
+        import json, hashlib
+        data = json.dumps(payload, sort_keys=True).encode()
+        anchor = hashlib.sha256(data).hexdigest()
+        cls._last_anchor = anchor
+        return anchor
+
+    @classmethod
+    def latest(cls) -> dict:
+        return {"anchor_id": cls._last_anchor}
+
+
+class AccessControl:
+    def __init__(self):
+        self._roles = {}
+
+    def grant(self, user: str, role: str) -> None:
+        self._roles.setdefault(user, set()).add(role)
+
+    def has_role(self, user: str, role: str) -> bool:
+        return role in self._roles.get(user, set())
+
+
+class Governance:
+    def __init__(self):
+        self._policies = {}
+
+    def register_policy(self, name: str, policy: dict) -> None:
+        self._policies[name] = policy
+
+    def get_policy(self, name: str) -> dict:
+        return self._policies.get(name, {})
+
+
+class GA4Adapter:
+    def fill(self, metrics: dict) -> dict:
+        # Pass-through in this MVP
+        return dict(metrics)
+
+
+class SegmentAdapter:
+    def fill(self, metrics: dict) -> dict:
+        # Pass-through in this MVP
+        return dict(metrics)
--- a/opengrowth_privacy_preserving_federated_/adapters/init.py
+++ b/opengrowth_privacy_preserving_federated_/adapters/init.py
@ -0,0 +1,4 @@
+from .ga4 import GA4Adapter
+from .segment import SegmentAdapter
+
+__all__ = ["GA4Adapter", "SegmentAdapter"]
--- a/opengrowth_privacy_preserving_federated_/adapters/ga4.py
+++ b/opengrowth_privacy_preserving_federated_/adapters/ga4.py
@ -0,0 +1,16 @@
+class GA4Adapter:
+    def __init__(self, mapping=None):
+        self.mapping = mapping or {
+            "activation_rate": "activation_rate",
+            "funnel_dropoff": "funnel_dropoff",
+            "time_to_value": "time_to_value",
+            "CAC": "cac",
+            "LTV": "ltv",
+        }
+
+    def fill(self, source_metrics: dict) -> dict:
+        result = {}
+        for std_key, src_key in self.mapping.items():
+            if isinstance(src_key, str) and src_key in source_metrics:
+                result[std_key] = source_metrics[src_key]
+        return result
--- a/opengrowth_privacy_preserving_federated_/adapters/segment.py
+++ b/opengrowth_privacy_preserving_federated_/adapters/segment.py
@ -0,0 +1,16 @@
+class SegmentAdapter:
+    def __init__(self, mapping=None):
+        self.mapping = mapping or {
+            "activation_rate": "activation_rate",
+            "funnel_dropoff": "funnel_dropoff",
+            "time_to_value": "time_to_value",
+            "CAC": "cac",
+            "LTV": "ltv",
+        }
+
+    def fill(self, source_metrics: dict) -> dict:
+        result = {}
+        for std_key, src_key in self.mapping.items():
+            if isinstance(src_key, str) and src_key in source_metrics:
+                result[std_key] = source_metrics[src_key]
+        return result
--- a/opengrowth_privacy_preserving_federated_/experiment_template.py
+++ b/opengrowth_privacy_preserving_federated_/experiment_template.py
@ -0,0 +1,12 @@
+class ExperimentTemplate:
+    def __init__(self, template_id: str, name: str, definition: dict):
+        self.template_id = template_id
+        self.name = name
+        self.definition = definition
+
+    def to_dict(self) -> dict:
+        return {
+            "template_id": self.template_id,
+            "name": self.name,
+            "definition": self.definition,
+        }
--- a/opengrowth_privacy_preserving_federated_/governance.py
+++ b/opengrowth_privacy_preserving_federated_/governance.py
@ -0,0 +1,20 @@
+class AccessControl:
+    def __init__(self):
+        self._roles = {}
+
+    def grant(self, user_id: str, role: str) -> None:
+        self._roles[user_id] = role
+
+    def has_role(self, user_id: str, role: str) -> bool:
+        return self._roles.get(user_id) == role
+
+
+class Governance:
+    def __init__(self):
+        self.policies = {}
+
+    def register_policy(self, name: str, policy: dict) -> None:
+        self.policies[name] = policy
+
+    def get_policy(self, name: str):
+        return self.policies.get(name)
--- a/opengrowth_privacy_preserving_federated_/ledger.py
+++ b/opengrowth_privacy_preserving_federated_/ledger.py
@ -0,0 +1,19 @@
+import json
+import hashlib
+
+
+class CloudLedger:
+    _blocks = []
+
+    @classmethod
+    def anchor(cls, data: dict) -> str:
+        payload = json.dumps(data, sort_keys=True).encode("utf-8")
+        anchor_id = hashlib.sha256(payload).hexdigest()
+        cls._blocks.append({"anchor_id": anchor_id, "data": data})
+        return anchor_id
+
+    @classmethod
+    def latest(cls):
+        if not cls._blocks:
+            return None
+        return cls._blocks[-1]
--- a/opengrowth_privacy_preserving_federated_/schema_registry.py
+++ b/opengrowth_privacy_preserving_federated_/schema_registry.py
@ -0,0 +1,23 @@
+class SchemaRegistry:
+    def __init__(self):
+        self._schemas = {}
+        self._templates = {}
+
+    def register_schema(self, name: str, schema: dict) -> None:
+        self._schemas[name] = schema
+
+    def get_schema(self, name: str) -> dict:
+        return self._schemas.get(name, {})
+
+    def register_template(self, template_id: str, definition: dict) -> None:
+        self._templates[template_id] = definition
+
+    def get_template(self, template_id: str) -> dict:
+        return self._templates.get(template_id, {})
+
+
+class ExperimentTemplate:
+    def __init__(self, template_id: str, name: str, definition: dict):
+        self.template_id = template_id
+        self.name = name
+        self.definition = definition
--- a/opengrowth_privacy_preserving_federated_/secure_aggregation.py
+++ b/opengrowth_privacy_preserving_federated_/secure_aggregation.py
@ -0,0 +1,32 @@
+import math
+import statistics
+
+
+class SecureAggregator:
+    @staticmethod
+    def aggregate(local_results: list) -> dict:
+        # local_results: list of dicts with numeric values
+        if not local_results:
+            return {}
+        # collect all metric keys
+        keys = set()
+        for d in local_results:
+            keys.update(d.keys())
+
+        aggregated = {}
+        for k in keys:
+            values = [d[k] for d in local_results if k in d and isinstance(d[k], (int, float))]
+            if not values:
+                continue
+            n = len(values)
+            mean = sum(values) / n
+            if n < 2:
+                ci_lower = ci_upper = mean
+            else:
+                std = statistics.pstdev(values)
+                se = std / math.sqrt(n)
+                margin = 1.96 * se
+                ci_lower = mean - margin
+                ci_upper = mean + margin
+            aggregated[k] = {"mean": mean, "ci_lower": ci_lower, "ci_upper": ci_upper}
+        return aggregated
--- a/pyproject.toml
+++ b/pyproject.toml
@ -0,0 +1,10 @@
+[build-system]
+requires = ["setuptools", "wheel"]
+build-backend = "setuptools.build_meta"
+
+[project]
+name = "opengrowth_privacy_preserving_federated"
+version = "0.1.0"
+description = "Minimal MVP for privacy-preserving federated experiments (OpenGrowth)"
+readme = "README.md"
+license = {text = "MIT"}
--- a/test.sh
+++ b/test.sh
@ -0,0 +1,13 @@
+#!/usr/bin/env bash
+set -euo pipefail
+
+echo "Installing package in editable mode..."
+python3 -m pip install -e .
+
+echo "Running pytest..."
+pytest -q
+
+echo "Building package (python -m build)..."
+python3 -m build
+
+echo "All tests passed and build succeeded."
--- a/tests/test_mvp.py
+++ b/tests/test_mvp.py
@ -0,0 +1,50 @@
+from opengrowth_privacy_preserving_federated_ import (
+    SchemaRegistry,
+    ExperimentTemplate,
+    SecureAggregator,
+    CloudLedger,
+    AccessControl,
+    Governance,
+    GA4Adapter,
+    SegmentAdapter,
+)
+from opengrowth_privacy_preserving_federated_ import schema_registry as _unused  # type: ignore
+
+
+def test_schema_and_templates_basic():
+    reg = SchemaRegistry()
+    reg.register_schema("Experiment", {"type": "object"})
+    assert reg.get_schema("Experiment") == {"type": "object"}
+
+    tmpl = ExperimentTemplate("pricing_v1", "Pricing Experiment v1", {"type": "pricing"})
+    reg.register_template(tmpl.template_id, tmpl.definition)
+    assert reg.get_template("pricing_v1") == {"type": "pricing"}
+
+
+def test_adapters_and_aggregation_and_ledger():
+    ga4 = GA4Adapter()
+    seg = SegmentAdapter()
+
+    local1 = ga4.fill({"activation_rate": 0.25, "funnel_dropoff": 0.4, "time_to_value": 12, "cac": 300, "ltv": 1000})
+    local2 = seg.fill({"activation_rate": 0.3, "funnel_dropoff": 0.35, "time_to_value": 10, "cac": 320, "ltv": 1200})
+
+    results = [local1, local2]
+    aggregated = SecureAggregator.aggregate(results)
+    assert "activation_rate" in aggregated
+    assert "mean" in aggregated["activation_rate"]
+
+    anchor = CloudLedger.anchor({"template": "pricing_v1", "aggregated": aggregated})
+    assert isinstance(anchor, str)
+    latest = CloudLedger.latest()
+    assert latest["anchor_id"] == anchor
+
+
+def test_governance_basic():
+    ac = AccessControl()
+    ac.grant("alice", "admin")
+    assert ac.has_role("alice", "admin")
+
+    gov = Governance()
+    gov.register_policy("template_access", {"roles": ["admin", "viewer"]})
+    policy = gov.get_policy("template_access")
+    assert policy["roles"] == ["admin", "viewer"]