{
  "report_format_version": "pepfold-report-v1",
  "generated_at": "2026-06-19T00:33:07.333Z",
  "specimen": {
    "number": 35,
    "sequence": "HAEGTFTSDVSSYLEGQAAKEFIAWLVKGRG",
    "sequence_length": 31,
    "status": "complete",
    "wallet": "6F4J6AdT5iQx4ExeN7JFE7EEM6fJ1XJ3DRUHT56gMfWF",
    "amount_sol": 0,
    "tx_hash": "5KUmm2Je1MUWY9Yhgbpog7SNbPUhUmpXvnKQLqpYWQLhmmZPHZPeBENhuHWPTykWvY5gPdQiqGCUYib4BoWRwoqb",
    "created_at": "2026-06-16T04:03:24.326506+00:00",
    "completed_at": "2026-06-16T04:16:23.985095+00:00"
  },
  "structure": {
    "pdb_url": "https://mrzziawbddodlpywncfy.supabase.co/storage/v1/object/public/pdb-files/2bc6d981-d222-47f7-934e-057903bb0417.pdb",
    "helix_pct": 0,
    "sheet_pct": 0,
    "loop_pct": 100
  },
  "triage": {
    "models": {
      "fold_model": {
        "name": "ESMFold",
        "version": "esmatlas-esmfold-v1"
      },
      "triage_model": {
        "name": "PEPFOLD heuristic triage",
        "version": "pepfold-triage-v1"
      },
      "comment_model": {
        "name": "Claude",
        "version": "claude-opus-4-7"
      }
    },
    "run_id": "run_11c5a667e6f64d6187a829ed14e19ed3",
    "metrics": [
      {
        "id": "fold_confidence",
        "label": "fold confidence",
        "value": 0.61,
        "source": {
          "model": "ESMFold",
          "version": "esmatlas-esmfold-v1"
        },
        "confidence": 0.52,
        "evidence_note": "derived from mean pLDDT on CA atoms",
        "confidence_band": [
          0.49,
          0.73
        ],
        "not_enough_confidence": true
      },
      {
        "id": "disorder_estimate",
        "label": "disorder estimate",
        "value": 0.677,
        "source": {
          "model": "PEPFOLD structure heuristic",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.52,
        "evidence_note": "estimated from loop proportion and low-confidence structure regions",
        "confidence_band": [
          0.557,
          0.797
        ],
        "not_enough_confidence": true
      },
      {
        "id": "aggregation_risk",
        "label": "aggregation risk",
        "value": 0.342,
        "source": {
          "model": "PEPFOLD developability heuristic",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.56,
        "evidence_note": "hydrophobic burden, aromatic burden, charge, and long hydrophobic runs",
        "confidence_band": [
          0.232,
          0.452
        ],
        "not_enough_confidence": false
      },
      {
        "id": "hydrophobic_burden",
        "label": "hydrophobic burden",
        "value": 0.419,
        "source": {
          "model": "PEPFOLD sequence analyzer",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.84,
        "evidence_note": "fraction of hydrophobic residues in sequence",
        "confidence_band": [
          0.379,
          0.459
        ],
        "not_enough_confidence": false
      },
      {
        "id": "charge_distribution_risk",
        "label": "charge distribution risk",
        "value": 0.032,
        "source": {
          "model": "PEPFOLD sequence analyzer",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.84,
        "evidence_note": "absolute net charge normalized by sequence length",
        "confidence_band": [
          0,
          0.072
        ],
        "not_enough_confidence": false
      },
      {
        "id": "solubility_risk",
        "label": "solubility risk",
        "value": 0.297,
        "source": {
          "model": "PEPFOLD developability heuristic",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.56,
        "evidence_note": "composite of aggregation risk, hydrophobic burden, and charge",
        "confidence_band": [
          0.187,
          0.407
        ],
        "not_enough_confidence": false
      },
      {
        "id": "developability_risk",
        "label": "developability risk",
        "value": 0.389,
        "source": {
          "model": "PEPFOLD developability heuristic",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.56,
        "evidence_note": "composite developability indicator used for triage",
        "confidence_band": [
          0.279,
          0.499
        ],
        "not_enough_confidence": false
      }
    ],
    "generated_at": "2026-06-16T04:15:05.025666+00:00",
    "report_version": "phase-a.v1",
    "sequence_length": 31,
    "synthesis_hints": [],
    "motif_liabilities": [
      "long hydrophobic run may increase aggregation risk"
    ],
    "developability_flags": [
      {
        "flag": "high_disorder_estimate",
        "reason": "predicted disorder is elevated",
        "severity": "medium"
      }
    ],
    "low_confidence_reasons": [
      "DSSP unavailable; secondary structure uses pLDDT fallback."
    ]
  },
  "audit": {
    "input": {
      "sequence_length": 31,
      "sequence_sha256": "7eac900d189747fcc34fe30e332a690bcf6123cf3280bd014641a3b5a619ab77"
    },
    "output": {
      "report_sha256": "a12b286fabcfc78af54dd3bbdf09b20f4857d7efc566866a0eae2d8b30cc20a8"
    },
    "run_id": "run_11c5a667e6f64d6187a829ed14e19ed3",
    "timestamp": "2026-06-16T04:15:05.025759+00:00",
    "pipeline_versions": {
      "pep_model_version": "claude-opus-4-7",
      "fold_model_version": "esmatlas-esmfold-v1",
      "triage_model_version": "pepfold-triage-v1",
      "secondary_structure_source": "plddt_fallback"
    }
  },
  "attestation": null,
  "next_experiments": {
    "engine": "pepfold-recs-v1",
    "recommendations": [
      {
        "id": "liability_redesign",
        "technique": "LIABILITY REDESIGN ROUND",
        "rationale": "redesign to remove the flagged motif(s) before going wet-lab: long hydrophobic run may increase aggregation risk. minimal substitutions usually suffice (e.g. N→Q for deamidation hotspots, M→L for met oxidation).",
        "evidence": "1 motif liability flag(s) in the sequence",
        "turnaround_days": [
          0,
          1
        ],
        "tier": "in_silico_only"
      },
      {
        "id": "nmr_hsqc",
        "technique": "1H-15N HSQC",
        "rationale": "if disorder is real, peaks will collapse into a narrow proton dispersion. if the peptide is actually folded, peaks will spread out. cheapest way to distinguish IDP from misfold.",
        "evidence": "disorder_estimate 68% (high)",
        "turnaround_days": [
          2,
          5
        ],
        "tier": "biophysical_validation"
      }
    ]
  },
  "comment": "that's semaglutide's backbone, more or less. fully unstructured on its own, which tracks. glp-1 analogs only fold when they find their receptor, otherwise they just dangle there waiting.",
  "tweet": {
    "id": "2066736623312871535",
    "url": "https://x.com/pepfoldagent/status/2066736623312871535"
  }
}