{
  "access": {
    "embargo": {
      "active": false,
      "reason": null
    },
    "files": "public",
    "record": "public",
    "status": "open"
  },
  "created": "2026-05-29T00:37:04.249268+00:00",
  "custom_fields": {
    "code:codeRepository": "https://github.com/synthiumjp/metacog-engineering",
    "code:developmentStatus": {
      "id": "active",
      "title": {
        "en": "Active"
      }
    },
    "code:programmingLanguage": [
      {
        "id": "python",
        "title": {
          "en": "Python"
        }
      }
    ]
  },
  "deletion_status": {
    "is_deleted": false,
    "status": "P"
  },
  "files": {
    "count": 1,
    "enabled": true,
    "entries": {
      "ptcsft_arxiv.pdf": {
        "access": {
          "hidden": false
        },
        "checksum": "md5:e8bcdaebe8011bb81123524a8292956c",
        "ext": "pdf",
        "id": "b8354af7-f229-4811-8c87-9521d99c1608",
        "key": "ptcsft_arxiv.pdf",
        "links": {
          "content": "https://zenodo.org/api/records/20436841/files/ptcsft_arxiv.pdf/content",
          "iiif_api": "https://zenodo.org/api/iiif/record:20436841:ptcsft_arxiv.pdf/full/full/0/default.png",
          "iiif_base": "https://zenodo.org/api/iiif/record:20436841:ptcsft_arxiv.pdf",
          "iiif_canvas": "https://zenodo.org/api/iiif/record:20436841/canvas/ptcsft_arxiv.pdf",
          "iiif_info": "https://zenodo.org/api/iiif/record:20436841:ptcsft_arxiv.pdf/info.json",
          "self": "https://zenodo.org/api/records/20436841/files/ptcsft_arxiv.pdf"
        },
        "metadata": {
          "height": 842,
          "width": 595
        },
        "mimetype": "application/pdf",
        "size": 620353,
        "storage_class": "L"
      }
    },
    "order": [],
    "total_bytes": 620353
  },
  "id": "20436841",
  "is_draft": false,
  "is_published": true,
  "links": {
    "access": "https://zenodo.org/api/records/20436841/access",
    "access_grants": "https://zenodo.org/api/records/20436841/access/grants",
    "access_links": "https://zenodo.org/api/records/20436841/access/links",
    "access_request": "https://zenodo.org/api/records/20436841/access/request",
    "access_users": "https://zenodo.org/api/records/20436841/access/users",
    "archive": "https://zenodo.org/api/records/20436841/files-archive",
    "archive_media": "https://zenodo.org/api/records/20436841/media-files-archive",
    "communities": "https://zenodo.org/api/records/20436841/communities",
    "communities-suggestions": "https://zenodo.org/api/records/20436841/communities-suggestions",
    "doi": "https://doi.org/10.5281/zenodo.20436841",
    "draft": "https://zenodo.org/api/records/20436841/draft",
    "file_modification": "https://zenodo.org/api/records/20436841/file-modification",
    "files": "https://zenodo.org/api/records/20436841/files",
    "latest": "https://zenodo.org/api/records/20436841/versions/latest",
    "latest_html": "https://zenodo.org/records/20436841/latest",
    "media_files": "https://zenodo.org/api/records/20436841/media-files",
    "parent": "https://zenodo.org/api/records/20436840",
    "parent_doi": "https://doi.org/10.5281/zenodo.20436840",
    "parent_doi_html": "https://zenodo.org/doi/10.5281/zenodo.20436840",
    "parent_html": "https://zenodo.org/records/20436840",
    "preview_html": "https://zenodo.org/records/20436841?preview=1",
    "quota_increase": "https://zenodo.org/api/records/20436841/quota-increase",
    "request_deletion": "https://zenodo.org/api/records/20436841/request-deletion",
    "requests": "https://zenodo.org/api/records/20436841/requests",
    "reserve_doi": "https://zenodo.org/api/records/20436841/draft/pids/doi",
    "self": "https://zenodo.org/api/records/20436841",
    "self_doi": "https://doi.org/10.5281/zenodo.20436841",
    "self_doi_html": "https://zenodo.org/doi/10.5281/zenodo.20436841",
    "self_html": "https://zenodo.org/records/20436841",
    "self_iiif_manifest": "https://zenodo.org/api/iiif/record:20436841/manifest",
    "self_iiif_sequence": "https://zenodo.org/api/iiif/record:20436841/sequence/default",
    "thumbnails": {
      "10": "https://zenodo.org/api/iiif/record:20436841:ptcsft_arxiv.pdf/full/%5E10,/0/default.jpg",
      "100": "https://zenodo.org/api/iiif/record:20436841:ptcsft_arxiv.pdf/full/%5E100,/0/default.jpg",
      "1200": "https://zenodo.org/api/iiif/record:20436841:ptcsft_arxiv.pdf/full/%5E1200,/0/default.jpg",
      "250": "https://zenodo.org/api/iiif/record:20436841:ptcsft_arxiv.pdf/full/%5E250,/0/default.jpg",
      "50": "https://zenodo.org/api/iiif/record:20436841:ptcsft_arxiv.pdf/full/%5E50,/0/default.jpg",
      "750": "https://zenodo.org/api/iiif/record:20436841:ptcsft_arxiv.pdf/full/%5E750,/0/default.jpg"
    },
    "versions": "https://zenodo.org/api/records/20436841/versions"
  },
  "media_files": {
    "count": 1,
    "enabled": true,
    "entries": {
      "ptcsft_arxiv.pdf.ptif": {
        "access": {
          "hidden": true
        },
        "ext": "ptif",
        "id": "57c35bdf-2b7c-4ffc-b9c2-3865ae5a23e4",
        "key": "ptcsft_arxiv.pdf.ptif",
        "links": {
          "content": "https://zenodo.org/api/records/20436841/files/ptcsft_arxiv.pdf.ptif/content",
          "self": "https://zenodo.org/api/records/20436841/files/ptcsft_arxiv.pdf.ptif"
        },
        "metadata": null,
        "mimetype": "application/octet-stream",
        "processor": {
          "source_file_id": "b8354af7-f229-4811-8c87-9521d99c1608",
          "status": "finished",
          "type": "image-tiles"
        },
        "size": 0,
        "storage_class": "L"
      }
    },
    "order": [],
    "total_bytes": 0
  },
  "metadata": {
    "creators": [
      {
        "person_or_org": {
          "family_name": "Cacioli",
          "given_name": "Jon-Paul",
          "identifiers": [
            {
              "identifier": "0009-0000-7054-2014",
              "scheme": "orcid"
            }
          ],
          "name": "Cacioli, Jon-Paul",
          "type": "personal"
        },
        "role": {
          "id": "contactperson",
          "title": {
            "de": "Kontaktperson",
            "en": "Contact person"
          }
        }
      }
    ],
    "dates": [
      {
        "date": "2026",
        "type": {
          "id": "available",
          "title": {
            "de": "Verf\u00fcgbar",
            "en": "Available"
          }
        }
      }
    ],
    "description": "<p class=\"font-claude-response-body break-words whitespace-normal leading-[1.7]\">Background: Verbal confidence in instruct-tuned large language models fails because the readout pathway from internal correctness representations to the confidence-token position transmits little of the available signal. Linear probes on hidden states discriminate correct from incorrect responses at AUROC2 = 0.76&ndash;0.88 across seven of eight models spanning four families and three scales (the exception, Qwen 72B, is a probe outlier), yet verbal confidence saturates near ceiling (mean ~95&ndash;99%).</p>\n<p class=\"font-claude-response-body break-words whitespace-normal leading-[1.7]\">Objectives: We introduce probe-targeted confidence-calibrated supervised fine-tuning (PT-CSFT), which uses a linear probe on a model's own hidden states to generate continuous confidence targets for LoRA fine-tuning. We evaluate whether this method closes the metacognitive gap across model families, scales, and cognitive domains.</p>\n<p class=\"font-claude-response-body break-words whitespace-normal leading-[1.7]\">Methods: PT-CSFT modifies attention key and output projections and the three MLP projections via LoRA while leaving queries, values, and the language model head unchanged. We evaluate on eight models (7B&ndash;72B, four families) across TriviaQA, GSM8K, and ARC-Challenge. A two-stage curriculum addresses the 70B regime. The logit readout reads softmax distributions over confidence tokens as a continuous signal. \nPre-registration: OSF Phase 1 (<a class=\"underline underline underline-offset-2 decoration-1 decoration-current/40 hover:decoration-current focus:decoration-current\" href=\"https://osf.io/ngkwc/\">https://osf.io/ngkwc/</a>), Phase 0 (<a class=\"underline underline underline-offset-2 decoration-1 decoration-current/40 hover:decoration-current focus:decoration-current\" href=\"https://osf.io/mpcr5\">https://osf.io/mpcr5</a>).</p>\n<p class=\"font-claude-response-body break-words whitespace-normal leading-[1.7]\">Results: PT-CSFT recovers 91&ndash;115% of probe discrimination in verbal confidence at 7&ndash;32B. At 70B, a two-stage curriculum closes 66% of the gap on the logit channel (AUROC2 = 0.797), the first VRS-Valid confidence signal at 70B. On GSM8K, the logit readout achieves AUROC2 = 0.862 &plusmn; 0.013 across 10 seeds, exceeding the probe. Post-hoc Platt scaling yields ECE = 0.042. The signal transfers out-of-distribution (NQ: 0.757, PopQA: 0.834) and enables confidence-gated retrieval (2.17x accuracy differential).</p>\n<p class=\"font-claude-response-body break-words whitespace-normal leading-[1.7]\">Conclusions: Controlled activation patching at the confidence-token position supports the interpretation that verbal confidence failure is a routing problem. The intervention is position-specific (mid-question control: chance), bidirectional (91% forward, 89% reverse), selective (83% of answers unchanged), and follows a near-monotonic layer-depth gradient (Spearman rho = 0.976, p &lt; 1e-4). These observations are consistent with PT-CSFT repairing a position-specific pathway for confidence without disrupting answer computation, though they do not trace the effect to specific model components. Multi-seed replication across three model families confirms stability (Llama 8B: 0.836 &plusmn; 0.011; Qwen 7B: 0.801 &plusmn; 0.022; Mistral 7B: 0.771 &plusmn; 0.017; 6 seeds each). The logit readout universally rescues where text confidence fails.</p>",
    "languages": [
      {
        "id": "eng",
        "title": {
          "en": "English"
        }
      }
    ],
    "publication_date": "2026-05-29",
    "publisher": "Zenodo",
    "related_identifiers": [
      {
        "identifier": "https://osf.io/ngkwc/",
        "relation_type": {
          "id": "issupplementedby",
          "title": {
            "de": "Wird erg\u00e4nzt durch",
            "en": "Is supplemented by"
          }
        },
        "resource_type": {
          "id": "other",
          "title": {
            "de": "Sonstige",
            "en": "Other"
          }
        },
        "scheme": "url"
      },
      {
        "identifier": "https://osf.io/mpcr5",
        "relation_type": {
          "id": "issupplementedby",
          "title": {
            "de": "Wird erg\u00e4nzt durch",
            "en": "Is supplemented by"
          }
        },
        "resource_type": {
          "id": "other",
          "title": {
            "de": "Sonstige",
            "en": "Other"
          }
        },
        "scheme": "url"
      },
      {
        "identifier": "https://github.com/synthiumjp/metacog-engineering",
        "relation_type": {
          "id": "issupplementedby",
          "title": {
            "de": "Wird erg\u00e4nzt durch",
            "en": "Is supplemented by"
          }
        },
        "resource_type": {
          "id": "software",
          "title": {
            "de": "Software",
            "en": "Software"
          }
        },
        "scheme": "url"
      }
    ],
    "resource_type": {
      "id": "publication-preprint",
      "title": {
        "de": "Preprint",
        "en": "Preprint"
      }
    },
    "rights": [
      {
        "description": {
          "en": "The Creative Commons Attribution license allows re-distribution and re-use of a licensed work on the condition that the creator is appropriately credited."
        },
        "icon": "cc-by-icon",
        "id": "cc-by-4.0",
        "props": {
          "scheme": "spdx",
          "url": "https://creativecommons.org/licenses/by/4.0/legalcode"
        },
        "title": {
          "en": "Creative Commons Attribution 4.0 International"
        }
      }
    ],
    "subjects": [
      {
        "subject": "large language models"
      },
      {
        "subject": "LLM calibration"
      },
      {
        "subject": "verbal confidence"
      },
      {
        "subject": "metacognition"
      },
      {
        "subject": "LoRA fine-tuning"
      },
      {
        "subject": "activation patching"
      },
      {
        "subject": "mechanistic interpretability"
      },
      {
        "subject": "signal detection theory"
      }
    ],
    "title": "Making LLMs Say What They Know: Probe-Targeted Fine-Tuning for Verbal Confidence Calibration",
    "version": "1"
  },
  "parent": {
    "access": {
      "owned_by": {
        "user": "1662781"
      },
      "settings": {
        "accept_conditions_text": null,
        "allow_guest_requests": false,
        "allow_user_requests": false,
        "secret_link_expiration": 0
      }
    },
    "communities": {},
    "id": "20436840",
    "pids": {
      "doi": {
        "client": "datacite",
        "identifier": "10.5281/zenodo.20436840",
        "provider": "datacite"
      }
    }
  },
  "pids": {
    "doi": {
      "client": "datacite",
      "identifier": "10.5281/zenodo.20436841",
      "provider": "datacite"
    },
    "oai": {
      "identifier": "oai:zenodo.org:20436841",
      "provider": "oai"
    }
  },
  "revision_id": 3,
  "stats": {
    "all_versions": {
      "data_volume": 49628240.0,
      "downloads": 80,
      "unique_downloads": 68,
      "unique_views": 206,
      "views": 227
    },
    "this_version": {
      "data_volume": 49628240.0,
      "downloads": 80,
      "unique_downloads": 68,
      "unique_views": 206,
      "views": 227
    }
  },
  "status": "published",
  "swh": {},
  "updated": "2026-05-29T00:37:04.628466+00:00",
  "versions": {
    "index": 1,
    "is_latest": true
  }
}