{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:XMOT5WPAZF33U4FKEHNEAMPL5R","short_pith_number":"pith:XMOT5WPA","canonical_record":{"source":{"id":"2506.01486","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-06-02T09:46:08Z","cross_cats_sorted":[],"title_canon_sha256":"10dfb8ce7385feaaaaf9c152da6a3a060f62414662dcc2ae9ff7f990d6e7f56e","abstract_canon_sha256":"246b580ef6ae66ce75ce9493053c36fb77d9f9038f9a1717fe509b3592a6eb39"},"schema_version":"1.0"},"canonical_sha256":"bb1d3ed9e0c977ba70aa21da4031ebec6d43cdb7f1812d73f5e57bc3afe941d6","source":{"kind":"arxiv","id":"2506.01486","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2506.01486","created_at":"2026-06-25T01:17:44Z"},{"alias_kind":"arxiv_version","alias_value":"2506.01486v2","created_at":"2026-06-25T01:17:44Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2506.01486","created_at":"2026-06-25T01:17:44Z"},{"alias_kind":"pith_short_12","alias_value":"XMOT5WPAZF33","created_at":"2026-06-25T01:17:44Z"},{"alias_kind":"pith_short_16","alias_value":"XMOT5WPAZF33U4FK","created_at":"2026-06-25T01:17:44Z"},{"alias_kind":"pith_short_8","alias_value":"XMOT5WPA","created_at":"2026-06-25T01:17:44Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:XMOT5WPAZF33U4FKEHNEAMPL5R","target":"record","payload":{"canonical_record":{"source":{"id":"2506.01486","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-06-02T09:46:08Z","cross_cats_sorted":[],"title_canon_sha256":"10dfb8ce7385feaaaaf9c152da6a3a060f62414662dcc2ae9ff7f990d6e7f56e","abstract_canon_sha256":"246b580ef6ae66ce75ce9493053c36fb77d9f9038f9a1717fe509b3592a6eb39"},"schema_version":"1.0"},"canonical_sha256":"bb1d3ed9e0c977ba70aa21da4031ebec6d43cdb7f1812d73f5e57bc3afe941d6","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-25T01:17:44.825176Z","signature_b64":"/EdlfCieTKxDxtpbfeIk6ag0PAurc+ez4h/VCRfTn5btTjy9ELd9Sp4sPfEgJA8zExQAvvx/eVCXcxGlUw6WCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"bb1d3ed9e0c977ba70aa21da4031ebec6d43cdb7f1812d73f5e57bc3afe941d6","last_reissued_at":"2026-06-25T01:17:44.824677Z","signature_status":"signed_v1","first_computed_at":"2026-06-25T01:17:44.824677Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2506.01486","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-25T01:17:44Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"SZ+9l+NFdb7F3hRHjDsTy0K9msfC3K6cTEi+uXlHqsgdov8w4H+pfLpBO2jiryzb4E29Co6TifOcfBc29hxXBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-25T11:09:26.291914Z"},"content_sha256":"8b9c546bbda95758892e2f63ce32ca492816949bfcfd8577be7d379617758cb2","schema_version":"1.0","event_id":"sha256:8b9c546bbda95758892e2f63ce32ca492816949bfcfd8577be7d379617758cb2"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:XMOT5WPAZF33U4FKEHNEAMPL5R","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Model-agnostic Mitigation Strategies of Data Imbalance for Regression","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Andreas Rauh, Jelke Wibbeke, Sebastian Rohjans","submitted_at":"2025-06-02T09:46:08Z","abstract_excerpt":"Data imbalance persists as a pervasive challenge in regression tasks, introducing bias in model performance and undermining predictive reliability. This is particularly detrimental in applications aimed at predicting rare events that fall outside of the domain of the bulk of the training data. In this study, we review the current state-of-the-art regarding sampling-based methods and cost-sensitive learning. Additionally, we propose novel approaches to mitigate model bias. To better assess the importance of data, we introduce the density-distance and density-ratio relevance functions, which eff"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2506.01486","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2506.01486/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-25T01:17:44Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"aIqp2E/vZ/Jl5shcjaIxohLBMWr7bRDbLIDT2DGliEEGbLAxE2hHATabVNP9adNRB8O0Ln3X91RszK0vxIVtDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-25T11:09:26.292285Z"},"content_sha256":"f817d32ed67693a6bc3449d617d67718e0bdfc459cffa10d316787e9e79499ae","schema_version":"1.0","event_id":"sha256:f817d32ed67693a6bc3449d617d67718e0bdfc459cffa10d316787e9e79499ae"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/XMOT5WPAZF33U4FKEHNEAMPL5R/bundle.json","state_url":"https://pith.science/pith/XMOT5WPAZF33U4FKEHNEAMPL5R/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/XMOT5WPAZF33U4FKEHNEAMPL5R/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-25T11:09:26Z","links":{"resolver":"https://pith.science/pith/XMOT5WPAZF33U4FKEHNEAMPL5R","bundle":"https://pith.science/pith/XMOT5WPAZF33U4FKEHNEAMPL5R/bundle.json","state":"https://pith.science/pith/XMOT5WPAZF33U4FKEHNEAMPL5R/state.json","well_known_bundle":"https://pith.science/.well-known/pith/XMOT5WPAZF33U4FKEHNEAMPL5R/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:XMOT5WPAZF33U4FKEHNEAMPL5R","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"246b580ef6ae66ce75ce9493053c36fb77d9f9038f9a1717fe509b3592a6eb39","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-06-02T09:46:08Z","title_canon_sha256":"10dfb8ce7385feaaaaf9c152da6a3a060f62414662dcc2ae9ff7f990d6e7f56e"},"schema_version":"1.0","source":{"id":"2506.01486","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2506.01486","created_at":"2026-06-25T01:17:44Z"},{"alias_kind":"arxiv_version","alias_value":"2506.01486v2","created_at":"2026-06-25T01:17:44Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2506.01486","created_at":"2026-06-25T01:17:44Z"},{"alias_kind":"pith_short_12","alias_value":"XMOT5WPAZF33","created_at":"2026-06-25T01:17:44Z"},{"alias_kind":"pith_short_16","alias_value":"XMOT5WPAZF33U4FK","created_at":"2026-06-25T01:17:44Z"},{"alias_kind":"pith_short_8","alias_value":"XMOT5WPA","created_at":"2026-06-25T01:17:44Z"}],"graph_snapshots":[{"event_id":"sha256:f817d32ed67693a6bc3449d617d67718e0bdfc459cffa10d316787e9e79499ae","target":"graph","created_at":"2026-06-25T01:17:44Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2506.01486/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Data imbalance persists as a pervasive challenge in regression tasks, introducing bias in model performance and undermining predictive reliability. This is particularly detrimental in applications aimed at predicting rare events that fall outside of the domain of the bulk of the training data. In this study, we review the current state-of-the-art regarding sampling-based methods and cost-sensitive learning. Additionally, we propose novel approaches to mitigate model bias. To better assess the importance of data, we introduce the density-distance and density-ratio relevance functions, which eff","authors_text":"Andreas Rauh, Jelke Wibbeke, Sebastian Rohjans","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-06-02T09:46:08Z","title":"Model-agnostic Mitigation Strategies of Data Imbalance for Regression"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2506.01486","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8b9c546bbda95758892e2f63ce32ca492816949bfcfd8577be7d379617758cb2","target":"record","created_at":"2026-06-25T01:17:44Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"246b580ef6ae66ce75ce9493053c36fb77d9f9038f9a1717fe509b3592a6eb39","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2025-06-02T09:46:08Z","title_canon_sha256":"10dfb8ce7385feaaaaf9c152da6a3a060f62414662dcc2ae9ff7f990d6e7f56e"},"schema_version":"1.0","source":{"id":"2506.01486","kind":"arxiv","version":2}},"canonical_sha256":"bb1d3ed9e0c977ba70aa21da4031ebec6d43cdb7f1812d73f5e57bc3afe941d6","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"bb1d3ed9e0c977ba70aa21da4031ebec6d43cdb7f1812d73f5e57bc3afe941d6","first_computed_at":"2026-06-25T01:17:44.824677Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-25T01:17:44.824677Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"/EdlfCieTKxDxtpbfeIk6ag0PAurc+ez4h/VCRfTn5btTjy9ELd9Sp4sPfEgJA8zExQAvvx/eVCXcxGlUw6WCg==","signature_status":"signed_v1","signed_at":"2026-06-25T01:17:44.825176Z","signed_message":"canonical_sha256_bytes"},"source_id":"2506.01486","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8b9c546bbda95758892e2f63ce32ca492816949bfcfd8577be7d379617758cb2","sha256:f817d32ed67693a6bc3449d617d67718e0bdfc459cffa10d316787e9e79499ae"],"state_sha256":"8106766142d12ce75f7a37e95f1c8d15d8d4f3ea5e7eca3c48be30672ac815c3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6fwvN4n6Up2OqxKeKWPWk6fZKhK1bVnWFtuH78CzahHGKldrpYQ9i/GnKvIqd9PoIYkPC7OJwL/sLUzAVYnpDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-25T11:09:26.294478Z","bundle_sha256":"414e180cc5b6e906ecc384f79af22fab2ba3edba0510f45fd0bb8843e6b6d1dc"}}