{
  "report_format_version": "pepfold-report-v1",
  "generated_at": "2026-06-19T01:51:03.423Z",
  "specimen": {
    "number": 173,
    "sequence": "VSFIYKARLRLEDGEKREEWHRDVVDLVPGLIPEYELSVENHLENKQEKD",
    "sequence_length": 50,
    "status": "complete",
    "wallet": "62ef4jLfuT2zYFwBsTqHCHXMWkHAPiNn7dfeEn8qj37Q",
    "amount_sol": 0,
    "tx_hash": "3dm3WVHWu4ezuCv2hB4GmaefX7hanUjguVNo8KCWiz8pAjM6xztkB4xz9TDPS1sQUgqy8Eab2Z4KkztvJvPPMMKh",
    "created_at": "2026-06-16T07:22:31.896252+00:00",
    "completed_at": "2026-06-16T07:48:39.057678+00:00"
  },
  "structure": {
    "pdb_url": "https://mrzziawbddodlpywncfy.supabase.co/storage/v1/object/public/pdb-files/9d93e8dc-19b5-4c73-82f0-c9ac6f531b7f.pdb",
    "helix_pct": 0,
    "sheet_pct": 0,
    "loop_pct": 100
  },
  "triage": {
    "models": {
      "fold_model": {
        "name": "ESMFold",
        "version": "esmatlas-esmfold-v1"
      },
      "triage_model": {
        "name": "PEPFOLD heuristic triage",
        "version": "pepfold-triage-v1"
      },
      "comment_model": {
        "name": "Claude",
        "version": "claude-opus-4-7"
      }
    },
    "run_id": "run_659197431dde4280b9f206364f63566f",
    "metrics": [
      {
        "id": "fold_confidence",
        "label": "fold confidence",
        "value": 0.486,
        "source": {
          "model": "ESMFold",
          "version": "esmatlas-esmfold-v1"
        },
        "confidence": 0.52,
        "evidence_note": "derived from mean pLDDT on CA atoms",
        "confidence_band": [
          0.366,
          0.606
        ],
        "not_enough_confidence": true
      },
      {
        "id": "disorder_estimate",
        "label": "disorder estimate",
        "value": 1,
        "source": {
          "model": "PEPFOLD structure heuristic",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.52,
        "evidence_note": "estimated from loop proportion and low-confidence structure regions",
        "confidence_band": [
          0.88,
          1
        ],
        "not_enough_confidence": true
      },
      {
        "id": "aggregation_risk",
        "label": "aggregation risk",
        "value": 0.328,
        "source": {
          "model": "PEPFOLD developability heuristic",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.56,
        "evidence_note": "hydrophobic burden, aromatic burden, charge, and long hydrophobic runs",
        "confidence_band": [
          0.218,
          0.438
        ],
        "not_enough_confidence": false
      },
      {
        "id": "hydrophobic_burden",
        "label": "hydrophobic burden",
        "value": 0.36,
        "source": {
          "model": "PEPFOLD sequence analyzer",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.84,
        "evidence_note": "fraction of hydrophobic residues in sequence",
        "confidence_band": [
          0.32,
          0.4
        ],
        "not_enough_confidence": false
      },
      {
        "id": "charge_distribution_risk",
        "label": "charge distribution risk",
        "value": 0.1,
        "source": {
          "model": "PEPFOLD sequence analyzer",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.84,
        "evidence_note": "absolute net charge normalized by sequence length",
        "confidence_band": [
          0.06,
          0.14
        ],
        "not_enough_confidence": false
      },
      {
        "id": "solubility_risk",
        "label": "solubility risk",
        "value": 0.289,
        "source": {
          "model": "PEPFOLD developability heuristic",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.56,
        "evidence_note": "composite of aggregation risk, hydrophobic burden, and charge",
        "confidence_band": [
          0.179,
          0.399
        ],
        "not_enough_confidence": false
      },
      {
        "id": "developability_risk",
        "label": "developability risk",
        "value": 0.445,
        "source": {
          "model": "PEPFOLD developability heuristic",
          "version": "pepfold-triage-v1"
        },
        "confidence": 0.56,
        "evidence_note": "composite developability indicator used for triage",
        "confidence_band": [
          0.335,
          0.555
        ],
        "not_enough_confidence": false
      }
    ],
    "generated_at": "2026-06-16T07:47:19.396392+00:00",
    "report_version": "phase-a.v1",
    "sequence_length": 50,
    "synthesis_hints": [
      "sequence length >45 aa may reduce synthesis yield"
    ],
    "motif_liabilities": [
      "potential isomerization motif (D-G)"
    ],
    "developability_flags": [
      {
        "flag": "low_fold_confidence",
        "reason": "structure confidence is limited",
        "severity": "medium"
      },
      {
        "flag": "high_disorder_estimate",
        "reason": "predicted disorder is elevated",
        "severity": "medium"
      }
    ],
    "low_confidence_reasons": [
      "DSSP unavailable; secondary structure uses pLDDT fallback."
    ]
  },
  "audit": {
    "input": {
      "sequence_length": 50,
      "sequence_sha256": "2e3d9aa96d5b0763bbac5744fcbe8fba44e0efe33de4f48fcce96e024e91212d"
    },
    "output": {
      "report_sha256": "19fafb0734670b298500f734136b557488a1a6f8d737510e032b472cebc10c60"
    },
    "run_id": "run_659197431dde4280b9f206364f63566f",
    "timestamp": "2026-06-16T07:47:19.396490+00:00",
    "pipeline_versions": {
      "pep_model_version": "claude-opus-4-7",
      "fold_model_version": "esmatlas-esmfold-v1",
      "triage_model_version": "pepfold-triage-v1",
      "secondary_structure_source": "plddt_fallback"
    }
  },
  "attestation": null,
  "next_experiments": {
    "engine": "pepfold-recs-v1",
    "recommendations": [
      {
        "id": "liability_redesign",
        "technique": "LIABILITY REDESIGN ROUND",
        "rationale": "redesign to remove the flagged motif(s) before going wet-lab: potential isomerization motif (D-G). minimal substitutions usually suffice (e.g. D→E or G→A for Asp isomerization at D-G, N→Q for deamidation hotspots, M→L for met oxidation).",
        "evidence": "1 motif liability flag(s) in the sequence",
        "turnaround_days": [
          0,
          1
        ],
        "tier": "in_silico_only"
      },
      {
        "id": "cd_spectroscopy",
        "technique": "CD SPECTROSCOPY",
        "rationale": "experimental secondary structure check. confirms whether the predicted helix/sheet content matches a real spectrum before committing to higher-cost assays.",
        "evidence": "fold_confidence 49% (model is uncertain)",
        "turnaround_days": [
          1,
          3
        ],
        "tier": "biophysical_validation"
      },
      {
        "id": "nmr_hsqc",
        "technique": "1H-15N HSQC",
        "rationale": "if disorder is real, amide peaks will cluster in a narrow 1H chemical-shift range. if the peptide is actually folded, peaks will be well dispersed. cheapest way to distinguish IDP from misfold.",
        "evidence": "disorder_estimate 100% (high)",
        "turnaround_days": [
          2,
          5
        ],
        "tier": "biophysical_validation"
      }
    ]
  },
  "comment": "50 residues of pure loop. no helix, no sheet, just flailing. plenty of charged residues scattered throughout, which usually means it wants a binding partner to tell it who to be.",
  "tweet": {
    "id": "2066790038097317896",
    "url": "https://x.com/pepfoldagent/status/2066790038097317896"
  }
}