refactor: move factcloud from hardcoded SSM to per-user DynamoDB oauth2_m2m connection

- Add oauth2_m2m auth type to mcp_loader.py (client_secret in record, not SSM) - Remove _get_factcloud_token(), FACTCLOUD_* config, factcloud_clients from main.py - Seed Daniel's factcloud connection into enrolled_services.mcp_connections - factcloud now loaded dynamically via mcp_loader at session start
feat: wire factcloud as direct MCP connection, drop knowledge_agent subagent
2026-05-16 09:49:28 -05:00 · 2026-05-16 09:25:55 -05:00 · 2026-05-16 07:11:39 -05:00 · 2026-05-16 07:07:46 -05:00 · 2026-05-15 23:32:23 -05:00 · 2026-05-15 20:35:02 -05:00
7 changed files with 396 additions and 3 deletions
--- a/agentclaw/app/agent_claw_main/config.py
+++ b/agentclaw/app/agent_claw_main/config.py
@@ -13,7 +13,7 @@ def _load():
    ssm = boto3.client('ssm', region_name='us-east-1')
    names = list(_DEFAULTS.keys())
    try:
-        resp = ssm.get_parameters(Names=names)
+        resp = ssm.get_parameters(Names=names, WithDecryption=True)
        found = {p['Name']: p['Value'] for p in resp['Parameters']}
    except Exception:
        found = {}
--- a/agentclaw/app/agent_claw_main/main.py
+++ b/agentclaw/app/agent_claw_main/main.py
@@ -4,6 +4,7 @@ agent-claw Runtime 1 — main assistant agent.
 Entrypoint for AgentCore CodeZip deployment.
 """
 import os
 import time
 from strands import Agent, tool
 from strands.models import BedrockModel
 from bedrock_agentcore.runtime import BedrockAgentCoreApp
@@ -90,6 +91,7 @@ except Exception as _e:
 # ── Subagent loading ──────────────────────────────────────────────────────
 TOOL_PRESETS = {
    "aws":       lambda: [MCPClient(lambda: aws_iam_streamablehttp_client(config.AWS_MCP_URL, aws_service="aws-mcp"))],
    "coding":    lambda: [MCPClient(lambda: aws_iam_streamablehttp_client(config.AWS_MCP_URL, aws_service="aws-mcp")), run_code],
@@ -425,6 +427,131 @@ def aws_describe_service(service: str, region: str = "us-east-1") -> str:
        return f"Service {service} not yet implemented. Try: lambda, s3, cloudformation, dynamodb, sqs"
 # ── Goal helpers ──────────────────────────────────────────────────────────
 from datetime import datetime as _dt
 from zoneinfo import ZoneInfo as _ZoneInfo
 def _now_iso() -> str:
    return _dt.now(_ZoneInfo('America/Chicago')).strftime('%Y-%m-%dT%H:%M:%S%z')
 def _read_goal() -> str | None:
    """Read GOAL.md from S3, return content or None."""
    try:
        return ws_tools.read_file('GOAL.md')
    except Exception:
        return None
 def _write_goal(content: str):
    ws_tools.write_file('GOAL.md', content)
    invalidate_prompt()
 def _delete_goal():
    try:
        _s3 = boto3.client('s3')
        _s3.delete_object(Bucket=ws_tools.get_bucket(), Key='GOAL.md')
        ws_tools._cache.pop('GOAL.md', None)
        invalidate_prompt()
    except Exception:
        pass
 def _parse_goal_status(content: str) -> str:
    """Extract Status field from GOAL.md content."""
    for line in content.splitlines():
        if line.startswith('**Status:**'):
            return line.split('**Status:**')[1].strip()
    return 'unknown'
 def _get_active_goal_context() -> dict | None:
    """Return goal context dict if active, else None."""
    content = _read_goal()
    if not content or _parse_goal_status(content) != 'active':
        return None
    objective = stopping = last_cp = ''
    for line in content.splitlines():
        if line.startswith('**Objective:**'):
            objective = line.split('**Objective:**')[1].strip()
        elif line.startswith('**Stopping condition:**'):
            stopping = line.split('**Stopping condition:**')[1].strip()
        elif line.startswith('- ['):
            last_cp = line  # last checkpoint line wins
    return {'objective': objective, 'stopping_condition': stopping, 'last_checkpoint': last_cp}
 def _handle_goal_command(prompt: str) -> str | None:
    """Handle /goal commands. Returns reply string or None if not a goal command."""
    parts = prompt.split(None, 2)  # ['/goal', subcommand?, rest?]
    cmd = parts[1] if len(parts) > 1 else 'status'
    rest = parts[2] if len(parts) > 2 else ''
    if cmd == 'set':
        if not rest:
            return '❌ Usage: `/goal set <objective>` or `/goal set <objective> | <stopping condition>`'
        if '|' in rest:
            objective, stopping = [s.strip() for s in rest.split('|', 1)]
        else:
            objective, stopping = rest.strip(), 'not specified'
        content = (
            f'# Goal\n\n'
            f'**Objective:** {objective}\n'
            f'**Stopping condition:** {stopping}\n'
            f'**Status:** active\n'
            f'**Set at:** {_now_iso()}\n\n'
            f'## Checkpoint log\n'
        )
        _write_goal(content)
        return f'✅ Goal set: {objective}\nStopping condition: {stopping}'
    elif cmd in ('status', '/goal'):
        content = _read_goal()
        if not content:
            return '📋 No active goal. Use `/goal set <objective>` to set one.'
        return content
    elif cmd == 'checkpoint':
        if not rest:
            return '❌ Usage: `/goal checkpoint <note>`'
        content = _read_goal()
        if not content:
            return '❌ No active goal to checkpoint.'
        entry = f'- [{_now_iso()}] {rest}\n'
        content = content.rstrip() + '\n' + entry
        _write_goal(content)
        return f'✅ Checkpoint added: {rest}'
    elif cmd == 'pause':
        content = _read_goal()
        if not content:
            return '❌ No active goal to pause.'
        content = content.replace('**Status:** active', '**Status:** paused')
        _write_goal(content)
        return '⏸️ Goal paused.'
    elif cmd == 'resume':
        content = _read_goal()
        if not content:
            return '❌ No goal to resume.'
        content = content.replace('**Status:** paused', '**Status:** active')
        _write_goal(content)
        return '▶️ Goal resumed.'
    elif cmd == 'clear':
        _delete_goal()
        return '🗑️ Goal cleared.'
    else:
        # Not a recognized subcommand — treat the whole thing as status check
        content = _read_goal()
        if not content:
            return '📋 No active goal. Use `/goal set <objective>` to set one.'
        return content
 # ── Entrypoint ────────────────────────────────────────────────────────────
 # Module-level actor_id for tool closures (set per-invocation)
@@ -528,7 +655,7 @@ async def main(payload: dict, context):
        system_prompt = system_prompt + '\n\n---\n\n' + ltm_block
    system_prompt += '\nAWS tools available: call_aws (any AWS API via AWS MCP Server), aws_list_lambda_functions, aws_get_cost_and_usage, aws_describe_service. Use call_aws directly for AWS API calls — do NOT say you lack AWS access.'
-    system_prompt += '\n\nSubagents available — use them aggressively to save cost and improve quality:\n- aws_agent: all AWS infrastructure, cost, resource, IAM, CloudWatch queries\n- coding_agent: code writing, builds, deployments, CodeBuild/AppRunner/ECR\n- document_agent: summarize URLs, extract data from documents, process long text\nDefault to delegating; only answer directly for simple conversational responses or tasks that don\'t fit a subagent.'
+    system_prompt += '\n\nSubagents available — use them aggressively to save cost and improve quality:\n- aws_agent: all AWS infrastructure, cost, resource, IAM, CloudWatch queries\n- coding_agent: code writing, builds, deployments, CodeBuild/AppRunner/ECR\n- document_agent: summarize URLs, extract data from documents, process long text\nYou also have direct access to factcloud MCP tools (your personal knowledge graph) loaded from your MCP connections — use them directly for any factbase, factcloud, or knowledge base queries. Do NOT say you lack access to factcloud.\nDefault to delegating to subagents; only answer directly for simple conversational responses or tasks that don\'t fit a subagent.'
    # Model: claude-sonnet-4-6 via cross-region inference
    # NOTE: extended thinking disabled — causes retry/duplicate issues with streaming
@@ -563,9 +690,42 @@ async def main(payload: dict, context):
        tools=all_tools,
    )
    # Intercept /goal commands — handle directly without LLM
    prompt = payload.get('prompt', '')
    if prompt.strip().startswith('/goal'):
        goal_reply = _handle_goal_command(prompt.strip())
        if goal_reply is not None:
            yield {'data': goal_reply}
            _typing_active = False
            session_manager.close()
            mcp_loader.close_mcp_clients(_mcp_to_close)
            return
    # Intercept heartbeat: replace bare [HEARTBEAT] with a strict-format instruction.
    # Agent-runner suppresses replies that start with HEARTBEAT_OK, so only real alerts reach Telegram.
    if prompt.strip() == '[HEARTBEAT]':
        # Inject goal context into heartbeat if active
        goal_ctx = _get_active_goal_context()
        goal_heartbeat = ''
        if goal_ctx:
            goal_heartbeat = (
                f' You have an active goal: "{goal_ctx["objective"]}". '
                f'Stopping condition: "{goal_ctx["stopping_condition"]}". '
                f'Last checkpoint: "{goal_ctx["last_checkpoint"]}". '
                f'Make progress toward this goal or report blockers.'
            )
        prompt = (
            'HEARTBEAT CHECK: Silently check for anything urgent Daniel should know about '
            '(calendar events starting within 2 hours, unread urgent emails, overdue reminders). '
            'Do NOT narrate your checking process. '
            'If nothing is urgent: reply with the single word HEARTBEAT_OK and nothing else. '
            'If something IS urgent: reply with 2-3 lines max summarising only the urgent items.'
            + goal_heartbeat
        )
    final_message = None
    try:
-        async for event in agent.stream_async(payload.get('prompt', '')):
+        async for event in agent.stream_async(prompt):
            if 'result' in event:
                final_message = event['result'].message
            yield event
--- a/agentclaw/app/agent_claw_main/mcp_loader.py
+++ b/agentclaw/app/agent_claw_main/mcp_loader.py
@@ -45,12 +45,40 @@ def _get_oauth_token(conn: dict, actor_id: str) -> str:
    return token
 def _get_m2m_token(conn: dict, actor_id: str) -> str:
    """Fetch OAuth token for oauth2_m2m (secret stored directly in record)."""
    cache_key = f"{actor_id}:{conn['name']}"
    cached = _token_cache.get(cache_key)
    if cached and cached['expires_at'] > time.time() + 60:
        return cached['token']
    data = urllib.parse.urlencode({
        'grant_type': 'client_credentials',
        'client_id': conn['client_id'],
        'client_secret': conn['client_secret'],
        'scope': conn.get('scopes', conn.get('scope', '')),
    }).encode()
    req = urllib.request.Request(conn['token_url'], data=data,
                                headers={'Content-Type': 'application/x-www-form-urlencoded'})
    with urllib.request.urlopen(req, timeout=10) as resp:
        body = json.loads(resp.read())
    token = body['access_token']
    expires_in = body.get('expires_in', 3600)
    _token_cache[cache_key] = {'token': token, 'expires_at': time.time() + expires_in}
    return token
 def _resolve_auth_headers(conn: dict, actor_id: str) -> dict:
    """Resolve auth headers for a connection."""
    auth_type = conn.get('auth_type', 'none')
    if auth_type == 'oauth_client_credentials':
        token = _get_oauth_token(conn, actor_id)
        return {'Authorization': f'Bearer {token}'}
    elif auth_type == 'oauth2_m2m':
        token = _get_m2m_token(conn, actor_id)
        return {'Authorization': f'Bearer {token}'}
    elif auth_type == 'bearer':
        token = _get_ssm_value(conn['token_ssm'])
        return {'Authorization': f'Bearer {token}'}
--- a/agentclaw/app/agent_claw_main/prompt_builder.py
+++ b/agentclaw/app/agent_claw_main/prompt_builder.py
@@ -46,6 +46,16 @@ def _get_base_prompt(actor_id: str = '') -> str:
    s3 = boto3.client('s3')
    parts = []
    # Inject active goal at the top of context
    try:
        obj = s3.get_object(Bucket=bucket, Key='GOAL.md')
        goal_content = obj['Body'].read().decode('utf-8')
        if '**Status:** active' in goal_content:
            parts.append(f'## Active Goal\n{goal_content}')
            print(f'[prompt_builder] Injected GOAL.md ({len(goal_content)} bytes)')
    except Exception:
        pass
    for fname in ['SOUL.md', 'STATUS.md']:
        try:
            obj = s3.get_object(Bucket=bucket, Key=fname)
--- a/cdk/bin/agent-claw.ts
+++ b/cdk/bin/agent-claw.ts
@@ -5,6 +5,11 @@ import { AgentClawStack } from '../lib/agent-claw-stack';
 const app = new cdk.App();
 // Billing tags applied to all resources in the stack
 cdk.Tags.of(app).add('project', 'agent-claw');
 cdk.Tags.of(app).add('env', 'prod');
 cdk.Tags.of(app).add('owner', 'daniel');
 new AgentClawStack(app, 'AgentClawStack', {
  env: {
    account: process.env.CDK_DEFAULT_ACCOUNT,
--- a/scripts/create-inference-profiles.py
+++ b/scripts/create-inference-profiles.py
@@ -0,0 +1,155 @@
 #!/usr/bin/env python3
 """
 Create Bedrock Application Inference Profiles for agent-claw and update SSM.
 Run after: aws sso login --profile ai1
 Usage:
    python3 scripts/create-inference-profiles.py [--dry-run]
 Creates:
    agent-claw-opus    — main agent
    agent-claw-sonnet  — aws_agent + coding_agent
    agent-claw-haiku   — document_agent
 Then updates SSM:
    /agent-claw/model-id        → agent-claw-opus ARN
    /agent-claw/subagents       → inline model_id fields replaced with profile ARNs
 """
 import argparse
 import json
 import sys
 import boto3
 from botocore.exceptions import ClientError
 PROFILE = 'ai1'
 REGION  = 'us-east-1'
 BILLING_TAGS = [
    {'key': 'project', 'value': 'agent-claw'},
    {'key': 'env',     'value': 'prod'},
    {'key': 'owner',   'value': 'daniel'},
 ]
 # Map: profile name → cross-region model ID to copy from
 PROFILES_TO_CREATE = {
    'agent-claw-opus':   'us.anthropic.claude-opus-4-6-v1:0',
    'agent-claw-sonnet': 'us.anthropic.claude-sonnet-4-6-20251001-v1:0',
    'agent-claw-haiku':  'us.anthropic.claude-haiku-4-5-20251001-v1:0',
 }
 # SSM subagent model_id values → which profile ARN to swap in
 SUBAGENT_MODEL_MAP = {
    'us.anthropic.claude-sonnet-4-6':              'agent-claw-sonnet',
    'us.anthropic.claude-sonnet-4-6-20251001-v1:0':'agent-claw-sonnet',
    'us.anthropic.claude-haiku-4-5-20251001-v1:0': 'agent-claw-haiku',
 }
 def get_system_inference_profile_arn(bedrock, model_id: str) -> str:
    """Find the system inference profile ARN for a given cross-region model ID."""
    paginator = bedrock.get_paginator('list_inference_profiles')
    for page in paginator.paginate(typeEquals='SYSTEM_DEFINED'):
        for p in page.get('inferenceProfileSummaries', []):
            if p.get('inferenceProfileId', '') == model_id or \
               any(m.get('modelArn', '').endswith(model_id) for m in p.get('models', [])):
                return p['inferenceProfileArn']
    # Fallback: construct ARN directly (works for cross-region profiles)
    return f'arn:aws:bedrock:{REGION}::foundation-model/{model_id}'
 def get_existing_profile(bedrock, name: str) -> dict | None:
    """Return existing application profile by name, or None."""
    paginator = bedrock.get_paginator('list_inference_profiles')
    for page in paginator.paginate(typeEquals='APPLICATION'):
        for p in page.get('inferenceProfileSummaries', []):
            if p.get('inferenceProfileName') == name:
                return p
    return None
 def create_or_get_profile(bedrock, name: str, model_id: str, dry_run: bool) -> str:
    """Create application inference profile (idempotent). Returns ARN."""
    existing = get_existing_profile(bedrock, name)
    if existing:
        arn = existing['inferenceProfileArn']
        print(f'  [exists] {name} → {arn}')
        return arn
    source_arn = get_system_inference_profile_arn(bedrock, model_id)
    print(f'  [create] {name}')
    print(f'           source: {source_arn}')
    if dry_run:
        print(f'           [dry-run] skipping create')
        return f'arn:aws:bedrock:{REGION}:{{}account}}:application-inference-profile/{name}-DRY-RUN'
    resp = bedrock.create_inference_profile(
        inferenceProfileName=name,
        description=f'agent-claw {name.split("-")[-1]} model with billing tags',
        modelSource={'copyFrom': source_arn},
        tags=BILLING_TAGS,
    )
    arn = resp['inferenceProfileArn']
    print(f'           → {arn}')
    return arn
 def update_ssm(ssm, param: str, value: str, dry_run: bool):
    print(f'  [ssm] {param} = {value[:80]}...' if len(value) > 80 else f'  [ssm] {param} = {value}')
    if not dry_run:
        ssm.put_parameter(Name=param, Value=value, Type='String', Overwrite=True)
 def main():
    parser = argparse.ArgumentParser()
    parser.add_argument('--dry-run', action='store_true')
    args = parser.parse_args()
    session = boto3.Session(profile_name=PROFILE, region_name=REGION)
    bedrock = session.client('bedrock')
    ssm     = session.client('ssm')
    print('=== Creating inference profiles ===')
    arns = {}
    for name, model_id in PROFILES_TO_CREATE.items():
        arns[name] = create_or_get_profile(bedrock, name, model_id, args.dry_run)
    print('\n=== Updating SSM ===')
    # Main agent model
    update_ssm(ssm, '/agent-claw/model-id', arns['agent-claw-opus'], args.dry_run)
    # Subagents JSON — swap model_id fields
    try:
        resp = ssm.get_parameter(Name='/agent-claw/subagents')
        defs = json.loads(resp['Parameter']['Value'])
    except ClientError as e:
        print(f'  [error] Could not read /agent-claw/subagents: {e}')
        sys.exit(1)
    changed = False
    for agent in defs:
        mid = agent.get('model_id', '')
        profile_name = SUBAGENT_MODEL_MAP.get(mid)
        if profile_name:
            new_arn = arns[profile_name]
            print(f'  [subagent] {agent["name"]}: {mid} → {profile_name}')
            agent['model_id'] = new_arn
            changed = True
        else:
            print(f'  [subagent] {agent["name"]}: {mid} (no mapping, left as-is)')
    if changed:
        update_ssm(ssm, '/agent-claw/subagents', json.dumps(defs, indent=2), args.dry_run)
    print('\n=== Done ===')
    print('Profiles created and SSM updated.')
    print('Redeploy not required — agent reads model IDs from SSM at startup.')
    if args.dry_run:
        print('\n[dry-run mode — no AWS changes were made]')
 if __name__ == '__main__':
    main()
--- a/scripts/seed_factcloud.py
+++ b/scripts/seed_factcloud.py
@@ -0,0 +1,35 @@
 #!/usr/bin/env python3
 """Seed Daniel's factcloud MCP connection into DynamoDB."""
 import boto3
 ACTOR_ID = 'telegram:8537376738'
 TABLE_NAME = 'agent-claw-users'
 conn = {
    'name': 'factcloud',
    'url': 'https://factbase-cloud-gateway-2czetaoh3u.gateway.bedrock-agentcore.us-east-1.amazonaws.com/mcp',
    'auth_type': 'oauth2_m2m',
    'client_id': '5fo2q4fb452j3aekd55g3190i4',
    'client_secret': '1e0bqs8r4jk90sbeivh96mn893mgmv96h2olvcq7m3o5gjpjc56p',
    'token_url': 'https://factbase-cloud.auth.us-east-1.amazoncognito.com/oauth2/token',
    'scopes': 'factbase-cloud/read factbase-cloud/write',
    'enabled': True,
 }
 session = boto3.Session(profile_name='ai1', region_name='us-east-1')
 ddb = session.resource('dynamodb')
 table = ddb.Table(TABLE_NAME)
 # Get existing connections, upsert factcloud
 resp = table.get_item(Key={'actor_id': ACTOR_ID})
 services = resp.get('Item', {}).get('enrolled_services', {})
 connections = services.get('mcp_connections', [])
 connections = [c for c in connections if c['name'] != 'factcloud']
 connections.append(conn)
 table.update_item(
    Key={'actor_id': ACTOR_ID},
    UpdateExpression='SET enrolled_services.mcp_connections = :conns',
    ExpressionAttributeValues={':conns': connections},
 )
 print(f'Seeded factcloud connection for {ACTOR_ID}')
Author	SHA1	Message	Date
daniel	4ca5fee2c0	refactor: move factcloud from hardcoded SSM to per-user DynamoDB oauth2_m2m connection - Add oauth2_m2m auth type to mcp_loader.py (client_secret in record, not SSM) - Remove _get_factcloud_token(), FACTCLOUD_* config, factcloud_clients from main.py - Seed Daniel's factcloud connection into enrolled_services.mcp_connections - factcloud now loaded dynamically via mcp_loader at session start	2026-05-16 09:49:28 -05:00
daniel	e77417b6cd	feat: wire factcloud as direct MCP connection, drop knowledge_agent subagent - Rename FACTBASE_CLOUD_* -> FACTCLOUD_* in config.py + SSM paths - factcloud MCPClient added directly to main agent tool set - knowledge_agent subagent removed (SSM + TOOL_PRESETS) - System prompt updated: factcloud tools are direct, not via subagent	2026-05-16 09:25:55 -05:00
daniel	ef5734101e	fix: add knowledge_agent to system prompt subagent list	2026-05-16 07:11:39 -05:00
daniel	8c28797bca	feat: add /goal command for durable multi-turn objectives - /goal set\|status\|checkpoint\|pause\|resume\|clear intercept in main.py - GOAL.md injected into system prompt when active (prompt_builder.py) - Goal context added to heartbeat for autonomous progress	2026-05-16 07:07:46 -05:00
daniel	42dbdcde9e	feat: factbase-cloud integration — knowledge_agent subagent with M2M auth	2026-05-15 23:32:23 -05:00
daniel	ed6577ccf9	feat: billing tags on CDK stack + inference profile creation script	2026-05-15 20:35:02 -05:00
daniel	4f17bbd2c3	fix: intercept [HEARTBEAT] prompt, suppress chatty non-urgent responses	2026-05-15 18:34:14 -05:00