{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2022:C4QEOHJDVNTSCLOI5OGDXHMACH","short_pith_number":"pith:C4QEOHJD","schema_version":"1.0","canonical_sha256":"1720471d23ab67212dc8eb8c3b9d8011d619894cb9641af24252a602ed11d3c5","source":{"kind":"arxiv","id":"2201.01283","version":1},"attestation_state":"computed","paper":{"title":"Self-supervised Learning from 100 Million Medical Images","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Awais Mansoor, Bogdan Georgescu, Dominik Neumann, Dorin Comaniciu, Florin C. Ghesu, James M. Balter, Pragneshkumar Patel, R.S. Vishwanath, Sasa Grbic, Youngjin Yoo, Yue Cao","submitted_at":"2022-01-04T18:27:04Z","abstract_excerpt":"Building accurate and robust artificial intelligence systems for medical image assessment requires not only the research and design of advanced deep learning models but also the creation of large and curated sets of annotated training examples. Constructing such datasets, however, is often very costly -- due to the complex nature of annotation tasks and the high level of expertise required for the interpretation of medical images (e.g., expert radiologists). To counter this limitation, we propose a method for self-supervised learning of rich image features based on contrastive learning and onl"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2201.01283","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2022-01-04T18:27:04Z","cross_cats_sorted":[],"title_canon_sha256":"3f0096d5219c6344082654949e50e60e5e56cea4d2aa16adca6df849c17bc286","abstract_canon_sha256":"980c4851a7fb05041686dc7c8e9736aa8dbe9d3f77c24183687fba9c769d4575"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T03:45:59.468711Z","signature_b64":"924mZV+/ITmXitLXhLZXWTYixyPm3hkX+A4zYAcB/bUPk416h+2VPQQ6oWdomC83/NwEMAdJ7inj6iaU7l1ADw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"1720471d23ab67212dc8eb8c3b9d8011d619894cb9641af24252a602ed11d3c5","last_reissued_at":"2026-07-05T03:45:59.468174Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T03:45:59.468174Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Self-supervised Learning from 100 Million Medical Images","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Awais Mansoor, Bogdan Georgescu, Dominik Neumann, Dorin Comaniciu, Florin C. Ghesu, James M. Balter, Pragneshkumar Patel, R.S. Vishwanath, Sasa Grbic, Youngjin Yoo, Yue Cao","submitted_at":"2022-01-04T18:27:04Z","abstract_excerpt":"Building accurate and robust artificial intelligence systems for medical image assessment requires not only the research and design of advanced deep learning models but also the creation of large and curated sets of annotated training examples. Constructing such datasets, however, is often very costly -- due to the complex nature of annotation tasks and the high level of expertise required for the interpretation of medical images (e.g., expert radiologists). To counter this limitation, we propose a method for self-supervised learning of rich image features based on contrastive learning and onl"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2201.01283","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2201.01283/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2201.01283","created_at":"2026-07-05T03:45:59.468242+00:00"},{"alias_kind":"arxiv_version","alias_value":"2201.01283v1","created_at":"2026-07-05T03:45:59.468242+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2201.01283","created_at":"2026-07-05T03:45:59.468242+00:00"},{"alias_kind":"pith_short_12","alias_value":"C4QEOHJDVNTS","created_at":"2026-07-05T03:45:59.468242+00:00"},{"alias_kind":"pith_short_16","alias_value":"C4QEOHJDVNTSCLOI","created_at":"2026-07-05T03:45:59.468242+00:00"},{"alias_kind":"pith_short_8","alias_value":"C4QEOHJD","created_at":"2026-07-05T03:45:59.468242+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":1,"internal_anchor_count":0,"sample":[{"citing_arxiv_id":"2605.08819","citing_title":"From pre-training to downstream performance: Does domain-specific pre-training make sense?","ref_index":11,"is_internal_anchor":false}]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/C4QEOHJDVNTSCLOI5OGDXHMACH","json":"https://pith.science/pith/C4QEOHJDVNTSCLOI5OGDXHMACH.json","graph_json":"https://pith.science/api/pith-number/C4QEOHJDVNTSCLOI5OGDXHMACH/graph.json","events_json":"https://pith.science/api/pith-number/C4QEOHJDVNTSCLOI5OGDXHMACH/events.json","paper":"https://pith.science/paper/C4QEOHJD"},"agent_actions":{"view_html":"https://pith.science/pith/C4QEOHJDVNTSCLOI5OGDXHMACH","download_json":"https://pith.science/pith/C4QEOHJDVNTSCLOI5OGDXHMACH.json","view_paper":"https://pith.science/paper/C4QEOHJD","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2201.01283&json=true","fetch_graph":"https://pith.science/api/pith-number/C4QEOHJDVNTSCLOI5OGDXHMACH/graph.json","fetch_events":"https://pith.science/api/pith-number/C4QEOHJDVNTSCLOI5OGDXHMACH/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/C4QEOHJDVNTSCLOI5OGDXHMACH/action/timestamp_anchor","attest_storage":"https://pith.science/pith/C4QEOHJDVNTSCLOI5OGDXHMACH/action/storage_attestation","attest_author":"https://pith.science/pith/C4QEOHJDVNTSCLOI5OGDXHMACH/action/author_attestation","sign_citation":"https://pith.science/pith/C4QEOHJDVNTSCLOI5OGDXHMACH/action/citation_signature","submit_replication":"https://pith.science/pith/C4QEOHJDVNTSCLOI5OGDXHMACH/action/replication_record"}},"created_at":"2026-07-05T03:45:59.468242+00:00","updated_at":"2026-07-05T03:45:59.468242+00:00"}