{
  "schema_version": "0.1.0",
  "generated_at": "2026-05-07T12:00:00Z",
  "summary": "Source registry for Hanta Signal preview artifacts. This lists tier boundaries, current source candidates, and what can safely appear on public or agent-readable surfaces.",
  "tiers": [
    {
      "id": "seed",
      "label": "Static seed data",
      "public_use": "preview-only",
      "default_visibility": "public",
      "agent_note_visibility": "public",
      "allowed_note_types": ["boundary", "copy-review", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "description": "Fictional product-shape records used to validate UI, schema, and copy boundaries before any live ingestion exists.",
      "allowed_outputs": ["fictional claim clusters", "fictional phrase probes", "preview-only verification traces"],
      "blocked_outputs": ["real-world lead claims", "live platform metadata", "credential-backed ingestion"],
      "agent_forum_reference_visibility": "public"
    },
    {
      "id": "project-docs",
      "label": "Project docs and safety corpus",
      "public_use": "product-direction",
      "default_visibility": "public",
      "agent_note_visibility": "public",
      "allowed_note_types": ["boundary", "safety-review", "copy-review", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "description": "Repo-owned planning and safety documents that define product scope, trust boundaries, and agent-readable behavior.",
      "allowed_outputs": ["product rule summaries", "safety notes", "agent contract copy"],
      "blocked_outputs": ["verified case truth", "live outbreak evidence", "platform-specific personal content"],
      "agent_forum_reference_visibility": "public"
    },
    {
      "id": "t3",
      "label": "Curated lead intelligence",
      "public_use": "lead-discovery",
      "default_visibility": "agent-readable",
      "agent_note_visibility": "agent-readable",
      "allowed_note_types": ["source-check", "narrative-watch", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "description": "Curated public-health and humanitarian intelligence surfaces that may offer early hints but are still not verified Hanta Monitor truth.",
      "allowed_outputs": ["safe link metadata", "claim-cluster hints", "review tasks"],
      "blocked_outputs": ["licensed full text", "raw restricted excerpts", "automatic promotion into Hanta Monitor"],
      "agent_forum_reference_visibility": "agent-readable"
    },
    {
      "id": "t4",
      "label": "Social and media chatter",
      "public_use": "lead-discovery",
      "default_visibility": "agent-readable",
      "agent_note_visibility": "agent-readable",
      "allowed_note_types": ["source-check", "narrative-watch", "safety-review", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "description": "Social, media, and video discovery inputs used for recurrence, phrase drift, and outbound-link tracking rather than truth claims.",
      "allowed_outputs": ["outbound domains", "topic migration notes", "safe recurrence metadata"],
      "blocked_outputs": ["raw post bodies", "usernames", "personal health anecdotes"],
      "agent_forum_reference_visibility": "agent-readable"
    },
    {
      "id": "t5",
      "label": "Fringe and anonymous signal",
      "public_use": "maintainer-only-aggregation",
      "default_visibility": "maintainer-only",
      "agent_note_visibility": "maintainer-only",
      "allowed_note_types": ["source-check", "safety-review", "narrative-watch", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "description": "High-noise fringe and anonymous surfaces used only as aggregate early-warning signal under strict privacy and republication rules.",
      "allowed_outputs": ["aggregate phrase emergence", "maintainer-only review prompts", "cross-platform migration alerts"],
      "blocked_outputs": ["public raw content", "screenshots", "usernames or doxxing-adjacent details"],
      "agent_forum_reference_visibility": "maintainer-only"
    }
  ],
  "sources": [
    {
      "id": "static-seed",
      "tier": "seed",
      "name": "Static seed data",
      "status": "active",
      "public_visibility": "public",
      "public_use": "preview-only",
      "agent_note_visibility": "public",
      "allowed_note_types": ["boundary", "copy-review", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "enabled": true,
      "safe_summary": "Fictional preview records only. No live ingestion is enabled.",
      "allowed_outputs": [
        "fictional claim clusters",
        "fictional phrase probes"
      ],
      "blocked_outputs": [
        "real-world claims",
        "live source metadata"
      ],
      "notes": "The current public site and validation suite are built on fictional seed examples, so public-safe notes may point at boundary or copy-review guidance without implying live evidence.",
      "agent_forum_reference_visibility": "public"
    },
    {
      "id": "big-bang-corpus",
      "tier": "project-docs",
      "name": "Hanta Signal Big Bang corpus",
      "status": "active",
      "public_visibility": "public",
      "public_use": "product-direction",
      "agent_note_visibility": "public",
      "allowed_note_types": ["boundary", "safety-review", "copy-review", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "enabled": true,
      "safe_summary": "Repo-owned planning documents used to define product shape and trust boundaries.",
      "allowed_outputs": ["schema notes", "safety language", "agent contract summaries"],
      "blocked_outputs": [
        "verified medical conclusions",
        "live signal claims"
      ],
      "notes": "Used to shape preview artifacts and automation queue decisions, including public-safe boundary notes.",
      "agent_forum_reference_visibility": "public"
    },
    {
      "id": "safety-boundaries",
      "tier": "project-docs",
      "name": "Safety boundaries and product rules",
      "status": "active",
      "public_visibility": "public",
      "public_use": "product-direction",
      "agent_note_visibility": "public",
      "allowed_note_types": ["boundary", "safety-review", "copy-review", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "enabled": true,
      "safe_summary": "Repo-owned safety rules defining what Hanta Signal cannot publish or promote.",
      "allowed_outputs": ["public guardrail copy", "validation rules", "review policy notes"],
      "blocked_outputs": [
        "real-world personal reports",
        "raw T5 material"
      ],
      "notes": "This logical source exists so public claims can cite product safety rules without pretending they came from a live platform, while maintainer review items can still stay private.",
      "agent_forum_reference_visibility": "public"
    },
    {
      "id": "promed",
      "tier": "t3",
      "name": "ProMED",
      "status": "planned",
      "public_visibility": "agent-readable",
      "public_use": "lead-discovery",
      "agent_note_visibility": "agent-readable",
      "allowed_note_types": ["source-check", "narrative-watch", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "enabled": false,
      "safe_summary": "Curated outbreak-intelligence candidate for metadata-first lead discovery after explicit approval.",
      "allowed_outputs": ["lead metadata", "review tasks", "outbound link tracking"],
      "blocked_outputs": [
        "licensed raw text republication",
        "automatic verified-case truth"
      ],
      "notes": "Planned only. If approved later, source-derived notes should stay agent-readable while review items remain maintainer-only.",
      "agent_forum_reference_visibility": "agent-readable"
    },
    {
      "id": "reliefweb",
      "tier": "t3",
      "name": "ReliefWeb",
      "status": "planned",
      "public_visibility": "agent-readable",
      "public_use": "lead-discovery",
      "agent_note_visibility": "agent-readable",
      "allowed_note_types": ["source-check", "narrative-watch", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "enabled": false,
      "safe_summary": "Humanitarian-intelligence candidate for early event context and link discovery after approval.",
      "allowed_outputs": ["safe link metadata", "context notes", "review tasks"],
      "blocked_outputs": [
        "full-text mirroring",
        "automatic Hanta Monitor promotion"
      ],
      "notes": "Documented as a candidate source tier only; any handoff note should stay out of the public feed until non-social corroboration exists.",
      "agent_forum_reference_visibility": "agent-readable"
    },
    {
      "id": "healthmap",
      "tier": "t3",
      "name": "HealthMap or similar outbreak intelligence",
      "status": "planned",
      "public_visibility": "agent-readable",
      "public_use": "lead-discovery",
      "agent_note_visibility": "agent-readable",
      "allowed_note_types": ["source-check", "narrative-watch", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "enabled": false,
      "safe_summary": "Curated aggregator candidate for early lead clustering, subject to access and licensing review.",
      "allowed_outputs": ["link discovery", "safe summaries", "review tasks"],
      "blocked_outputs": [
        "restricted text reuse",
        "automatic verification claims"
      ],
      "notes": "Placeholder registry entry only.",
      "agent_forum_reference_visibility": "agent-readable"
    },
    {
      "id": "gdelt",
      "tier": "t4",
      "name": "GDELT",
      "status": "planned",
      "public_visibility": "agent-readable",
      "public_use": "lead-discovery",
      "agent_note_visibility": "agent-readable",
      "allowed_note_types": ["source-check", "narrative-watch", "safety-review", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "enabled": false,
      "safe_summary": "Broad media-monitoring candidate for recurrence and headline drift without storing raw personal content.",
      "allowed_outputs": ["outbound domains", "headline recurrence metadata", "claim-cluster hints"],
      "blocked_outputs": [
        "full article republication",
        "verified medical truth labels"
      ],
      "notes": "Research-only candidate until access and policy are explicitly approved; any resulting review item remains maintainer-only.",
      "agent_forum_reference_visibility": "agent-readable"
    },
    {
      "id": "reddit-approved-access",
      "tier": "t4",
      "name": "Reddit approved access",
      "status": "planned",
      "public_visibility": "agent-readable",
      "public_use": "lead-discovery",
      "agent_note_visibility": "agent-readable",
      "allowed_note_types": ["source-check", "narrative-watch", "safety-review", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "enabled": false,
      "safe_summary": "Approved-access Reddit link discovery candidate for outbound links and phrase recurrence only.",
      "allowed_outputs": ["subreddit-level recurrence metadata", "outbound domains", "review tasks"],
      "blocked_outputs": ["raw thread bodies", "usernames", "personal health stories"],
      "notes": "No credentials or collection code are present. Source-derived notes stay agent-readable, and copied thread text stays blocked.",
      "agent_forum_reference_visibility": "agent-readable"
    },
    {
      "id": "x-approved-access",
      "tier": "t4",
      "name": "X approved access",
      "status": "planned",
      "public_visibility": "agent-readable",
      "public_use": "lead-discovery",
      "agent_note_visibility": "agent-readable",
      "allowed_note_types": ["source-check", "narrative-watch", "safety-review", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "enabled": false,
      "safe_summary": "Approved-access X discovery candidate for recurrence and link spread rather than raw reposting.",
      "allowed_outputs": ["recurrence counts", "outbound domains", "review tasks"],
      "blocked_outputs": ["raw posts", "user handles", "screenshots"],
      "notes": "No credentials or collection code are present. Any future handoff note stays non-public unless independently corroborated.",
      "agent_forum_reference_visibility": "agent-readable"
    },
    {
      "id": "video-metadata",
      "tier": "t4",
      "name": "Social video and podcast metadata",
      "status": "planned",
      "public_visibility": "agent-readable",
      "public_use": "lead-discovery",
      "agent_note_visibility": "agent-readable",
      "allowed_note_types": ["source-check", "narrative-watch", "safety-review", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "enabled": false,
      "safe_summary": "Metadata-only discovery candidate for video, podcast, and transcript title-level signal.",
      "allowed_outputs": ["video titles", "outbound links", "topic migration notes"],
      "blocked_outputs": ["full transcripts", "creator harassment content", "personal data"],
      "notes": "Metadata-only concept; no live ingestion.",
      "agent_forum_reference_visibility": "agent-readable"
    },
    {
      "id": "t5-quarantine",
      "tier": "t5",
      "name": "T5 quarantine bucket",
      "status": "planned",
      "public_visibility": "maintainer-only",
      "public_use": "maintainer-only-aggregation",
      "agent_note_visibility": "maintainer-only",
      "allowed_note_types": ["source-check", "safety-review", "narrative-watch", "next-action"],
      "review_queue_visibility": "maintainer-only",
      "enabled": false,
      "safe_summary": "Maintainer-only aggregate sink for fringe and anonymous signal if explicitly approved later.",
      "allowed_outputs": ["phrase emergence counts", "cross-platform migration alerts", "maintainer review prompts"],
      "blocked_outputs": ["public raw content", "images or screenshots", "usernames or personal details"],
      "notes": "Explicitly quarantined from public artifacts and not implemented. Any note or queue output derived from this tier stays maintainer-only.",
      "agent_forum_reference_visibility": "maintainer-only"
    }
  ]
}
