{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2018:UTFNWVWDIOD6KJXUPLEBJIMUJC","short_pith_number":"pith:UTFNWVWD","schema_version":"1.0","canonical_sha256":"a4cadb56c34387e526f47ac814a1944895fb1e9c500d5e455abfff825857a63a","source":{"kind":"arxiv","id":"1801.10269","version":1},"attestation_state":"computed","paper":{"title":"The Impact of Class Rebalancing Techniques on the Performance and Interpretation of Defect Prediction Models","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.SE","authors_text":"Ahmed E. Hassan, Chakkrit Tantithamthavorn, Kenichi Matsumoto","submitted_at":"2018-01-31T01:32:58Z","abstract_excerpt":"Defect prediction models that are trained on class imbalanced datasets (i.e., the proportion of defective and clean modules is not equally represented) are highly susceptible to produce inaccurate prediction models. Prior research compares the impact of class rebalancing techniques on the performance of defect prediction models. Prior research efforts arrive at contradictory conclusions due to the use of different choice of datasets, classification techniques, and performance measures. Such contradictory conclusions make it hard to derive practical guidelines for whether class rebalancing tech"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1801.10269","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2018-01-31T01:32:58Z","cross_cats_sorted":[],"title_canon_sha256":"10b76c40a8c267a2776a5d953805e2beab266f8bbe95691447c09b2f0d23a466","abstract_canon_sha256":"b160785414c4ff9050fc9adba6fa77fa14281280e60d08699c941e5f64834fb3"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:24:41.299736Z","signature_b64":"aB2OBjBhGU9YGhjNeNbnF/o88Kj3/dIODe9AoFqw5jymoZnAW5OB04gwu7XWvGjo61MDB9NZBljkELsYrSFBBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a4cadb56c34387e526f47ac814a1944895fb1e9c500d5e455abfff825857a63a","last_reissued_at":"2026-05-18T00:24:41.299069Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:24:41.299069Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"The Impact of Class Rebalancing Techniques on the Performance and Interpretation of Defect Prediction Models","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.SE","authors_text":"Ahmed E. Hassan, Chakkrit Tantithamthavorn, Kenichi Matsumoto","submitted_at":"2018-01-31T01:32:58Z","abstract_excerpt":"Defect prediction models that are trained on class imbalanced datasets (i.e., the proportion of defective and clean modules is not equally represented) are highly susceptible to produce inaccurate prediction models. Prior research compares the impact of class rebalancing techniques on the performance of defect prediction models. Prior research efforts arrive at contradictory conclusions due to the use of different choice of datasets, classification techniques, and performance measures. Such contradictory conclusions make it hard to derive practical guidelines for whether class rebalancing tech"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1801.10269","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1801.10269","created_at":"2026-05-18T00:24:41.299170+00:00"},{"alias_kind":"arxiv_version","alias_value":"1801.10269v1","created_at":"2026-05-18T00:24:41.299170+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1801.10269","created_at":"2026-05-18T00:24:41.299170+00:00"},{"alias_kind":"pith_short_12","alias_value":"UTFNWVWDIOD6","created_at":"2026-05-18T12:32:56.356000+00:00"},{"alias_kind":"pith_short_16","alias_value":"UTFNWVWDIOD6KJXU","created_at":"2026-05-18T12:32:56.356000+00:00"},{"alias_kind":"pith_short_8","alias_value":"UTFNWVWD","created_at":"2026-05-18T12:32:56.356000+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/UTFNWVWDIOD6KJXUPLEBJIMUJC","json":"https://pith.science/pith/UTFNWVWDIOD6KJXUPLEBJIMUJC.json","graph_json":"https://pith.science/api/pith-number/UTFNWVWDIOD6KJXUPLEBJIMUJC/graph.json","events_json":"https://pith.science/api/pith-number/UTFNWVWDIOD6KJXUPLEBJIMUJC/events.json","paper":"https://pith.science/paper/UTFNWVWD"},"agent_actions":{"view_html":"https://pith.science/pith/UTFNWVWDIOD6KJXUPLEBJIMUJC","download_json":"https://pith.science/pith/UTFNWVWDIOD6KJXUPLEBJIMUJC.json","view_paper":"https://pith.science/paper/UTFNWVWD","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1801.10269&json=true","fetch_graph":"https://pith.science/api/pith-number/UTFNWVWDIOD6KJXUPLEBJIMUJC/graph.json","fetch_events":"https://pith.science/api/pith-number/UTFNWVWDIOD6KJXUPLEBJIMUJC/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/UTFNWVWDIOD6KJXUPLEBJIMUJC/action/timestamp_anchor","attest_storage":"https://pith.science/pith/UTFNWVWDIOD6KJXUPLEBJIMUJC/action/storage_attestation","attest_author":"https://pith.science/pith/UTFNWVWDIOD6KJXUPLEBJIMUJC/action/author_attestation","sign_citation":"https://pith.science/pith/UTFNWVWDIOD6KJXUPLEBJIMUJC/action/citation_signature","submit_replication":"https://pith.science/pith/UTFNWVWDIOD6KJXUPLEBJIMUJC/action/replication_record"}},"created_at":"2026-05-18T00:24:41.299170+00:00","updated_at":"2026-05-18T00:24:41.299170+00:00"}