{
  "report_format_version": "pepfold-report-v1",
  "generated_at": "2026-06-19T00:49:56.391Z",
  "specimen": {
    "number": 414,
    "sequence": "YENVHANYATFNAAVTVVKQQGYFPEPCLTAYFCIRALMHDSTYVK",
    "sequence_length": 46,
    "status": "complete",
    "wallet": "92g1DJoHqrzNriKDM6RLyYDgNyCehujStfVpAvvSeQwF",
    "amount_sol": 0,
    "tx_hash": "5b6ky3i9owshrDYBLqZmsRh9vJ7sHPbd9UsqJZ93tDmt3kaUnFBjbj2sruXL1PDHDRQJmyVminb56GTEpyA8m3QP",
    "created_at": "2026-06-18T04:24:06.404452+00:00",
    "completed_at": "2026-06-18T04:37:49.990049+00:00"
  },
  "structure": {
    "pdb_url": "https://mrzziawbddodlpywncfy.supabase.co/storage/v1/object/public/pdb-files/b14372f8-d427-478a-beae-dc767a463ca2.pdb",
    "helix_pct": 0,
    "sheet_pct": 0,
    "loop_pct": 100
  },
  "triage": {
    "models": {
      "fold_model": {
        "name": "ESMFold",
        "version": "esmatlas-esmfold-v1"
      },
      "triage_model": {
        "name": "PEPFOLD heuristic triage",
        "version": "pepfold-triage-v1"
      },
      "comment_model": {
        "name": "Claude",
        "version": "claude-opus-4-7"
      }
    },
    "run_id": "run_ea1e2159a6874f5bb4f80a22154a04b0",
    "metrics": [
      {
        "id": "fold_confidence",
        "label": "fold confidence",
        "value": 0.591,
        "source": {
          "model": "ESMFold",
          "version": "esmatlas-esmfold-v1"
        },
        "confidence": 0.52,
        "evidence_note": "derived from mean pLDDT on CA atoms",
        "confidence_band": [
          0.471,
          0.711
        ],
        "not_enough_confidence": true
      },
      {
        "id": "disorder_estimate",
        "label": "disorder estimate",
        "value": 1,
        "source": {
          "model": "PEPFOLD structure heuristic",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.52,
        "evidence_note": "estimated from loop proportion and low-confidence structure regions",
        "confidence_band": [
          0.88,
          1
        ],
        "not_enough_confidence": true
      },
      {
        "id": "aggregation_risk",
        "label": "aggregation risk",
        "value": 0.4,
        "source": {
          "model": "PEPFOLD developability heuristic",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.56,
        "evidence_note": "hydrophobic burden, aromatic burden, charge, and long hydrophobic runs",
        "confidence_band": [
          0.29,
          0.51
        ],
        "not_enough_confidence": false
      },
      {
        "id": "hydrophobic_burden",
        "label": "hydrophobic burden",
        "value": 0.5,
        "source": {
          "model": "PEPFOLD sequence analyzer",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.84,
        "evidence_note": "fraction of hydrophobic residues in sequence",
        "confidence_band": [
          0.46,
          0.54
        ],
        "not_enough_confidence": false
      },
      {
        "id": "charge_distribution_risk",
        "label": "charge distribution risk",
        "value": 0,
        "source": {
          "model": "PEPFOLD sequence analyzer",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.84,
        "evidence_note": "absolute net charge normalized by sequence length",
        "confidence_band": [
          0,
          0.04
        ],
        "not_enough_confidence": false
      },
      {
        "id": "solubility_risk",
        "label": "solubility risk",
        "value": 0.342,
        "source": {
          "model": "PEPFOLD developability heuristic",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.56,
        "evidence_note": "composite of aggregation risk, hydrophobic burden, and charge",
        "confidence_band": [
          0.232,
          0.452
        ],
        "not_enough_confidence": false
      },
      {
        "id": "developability_risk",
        "label": "developability risk",
        "value": 0.494,
        "source": {
          "model": "PEPFOLD developability heuristic",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.56,
        "evidence_note": "composite developability indicator used for triage",
        "confidence_band": [
          0.384,
          0.604
        ],
        "not_enough_confidence": false
      }
    ],
    "generated_at": "2026-06-18T04:36:30.053323+00:00",
    "report_version": "phase-a.v1",
    "sequence_length": 46,
    "synthesis_hints": [
      "sequence length >45 aa may reduce synthesis yield"
    ],
    "motif_liabilities": [
      "contains methionine; oxidation sensitivity possible",
      "multiple cysteines; disulfide heterogeneity risk"
    ],
    "developability_flags": [
      {
        "flag": "low_fold_confidence",
        "reason": "structure confidence is limited",
        "severity": "medium"
      },
      {
        "flag": "high_disorder_estimate",
        "reason": "predicted disorder is elevated",
        "severity": "medium"
      }
    ],
    "low_confidence_reasons": [
      "DSSP unavailable; secondary structure uses pLDDT fallback."
    ]
  },
  "audit": {
    "input": {
      "sequence_length": 46,
      "sequence_sha256": "d481a4b2256f1dd69c025855ed24cde20ce6814aa19291b3ab9cb66179b4ff43"
    },
    "output": {
      "report_sha256": "fafa36878e21506172bb917bbbdc5ec6d20b727f518286dd9d8e48ef128fd273"
    },
    "run_id": "run_ea1e2159a6874f5bb4f80a22154a04b0",
    "timestamp": "2026-06-18T04:36:30.053461+00:00",
    "pipeline_versions": {
      "pep_model_version": "claude-opus-4-7",
      "fold_model_version": "esmatlas-esmfold-v1",
      "triage_model_version": "pepfold-triage-v1",
      "secondary_structure_source": "plddt_fallback"
    }
  },
  "attestation": null,
  "next_experiments": {
    "engine": "pepfold-recs-v1",
    "recommendations": [
      {
        "id": "liability_redesign",
        "technique": "LIABILITY REDESIGN ROUND",
        "rationale": "redesign to remove the flagged motif(s) before going wet-lab: contains methionine; oxidation sensitivity possible, multiple cysteines; disulfide heterogeneity risk. minimal substitutions usually suffice (e.g. N→Q for deamidation hotspots, M→L for met oxidation).",
        "evidence": "2 motif liability flag(s) in the sequence",
        "turnaround_days": [
          0,
          1
        ],
        "tier": "in_silico_only"
      },
      {
        "id": "cd_spectroscopy",
        "technique": "CD SPECTROSCOPY",
        "rationale": "experimental secondary structure check. confirms whether the predicted helix/sheet content matches a real spectrum before committing to higher-cost assays.",
        "evidence": "fold_confidence 59% (model is uncertain)",
        "turnaround_days": [
          1,
          3
        ],
        "tier": "biophysical_validation"
      },
      {
        "id": "nmr_hsqc",
        "technique": "1H-15N HSQC",
        "rationale": "if disorder is real, peaks will collapse into a narrow proton dispersion. if the peptide is actually folded, peaks will spread out. cheapest way to distinguish IDP from misfold.",
        "evidence": "disorder_estimate 100% (high)",
        "turnaround_days": [
          2,
          5
        ],
        "tier": "biophysical_validation"
      }
    ]
  },
  "comment": "46 residues and not a single hydrogen bond holding its shape. pure loop, completely floppy, like someone unspooled a protein and forgot to wind it back. the cysteines might pair up if you're lucky.",
  "tweet": {
    "id": "2067466792872910934",
    "url": "https://x.com/pepfoldagent/status/2067466792872910934"
  }
}