{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:XS5PEADDJXOSTASMPOOMXNMYAG","short_pith_number":"pith:XS5PEADD","canonical_record":{"source":{"id":"1501.02031","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2015-01-09T03:59:36Z","cross_cats_sorted":[],"title_canon_sha256":"41fd9da223c5ebb352f790b12ae4266459eca7b87e5913feb889c09b91a180fe","abstract_canon_sha256":"41661712acf66919de32554538f805e928d76dcdf02238166fdbb5a9e54a61ee"},"schema_version":"1.0"},"canonical_sha256":"bcbaf200634ddd29824c7b9ccbb59801bb53e3523d1df067e13620e55dbc2966","source":{"kind":"arxiv","id":"1501.02031","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1501.02031","created_at":"2026-05-18T02:29:45Z"},{"alias_kind":"arxiv_version","alias_value":"1501.02031v1","created_at":"2026-05-18T02:29:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1501.02031","created_at":"2026-05-18T02:29:45Z"},{"alias_kind":"pith_short_12","alias_value":"XS5PEADDJXOS","created_at":"2026-05-18T12:29:50Z"},{"alias_kind":"pith_short_16","alias_value":"XS5PEADDJXOSTASM","created_at":"2026-05-18T12:29:50Z"},{"alias_kind":"pith_short_8","alias_value":"XS5PEADD","created_at":"2026-05-18T12:29:50Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:XS5PEADDJXOSTASMPOOMXNMYAG","target":"record","payload":{"canonical_record":{"source":{"id":"1501.02031","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2015-01-09T03:59:36Z","cross_cats_sorted":[],"title_canon_sha256":"41fd9da223c5ebb352f790b12ae4266459eca7b87e5913feb889c09b91a180fe","abstract_canon_sha256":"41661712acf66919de32554538f805e928d76dcdf02238166fdbb5a9e54a61ee"},"schema_version":"1.0"},"canonical_sha256":"bcbaf200634ddd29824c7b9ccbb59801bb53e3523d1df067e13620e55dbc2966","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:29:45.000574Z","signature_b64":"YdgZjy/xFZhpMA2QCq+CmSdIX9ni+LufbSCCDJFahJLICjMJgS1fFwWcMuh6WILl1sg9zO231ynF4FdpAwF6BQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"bcbaf200634ddd29824c7b9ccbb59801bb53e3523d1df067e13620e55dbc2966","last_reissued_at":"2026-05-18T02:29:45.000152Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:29:45.000152Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1501.02031","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:29:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"mX0e+MeYXejA0aXOdMymjDmBZTjdWNsWLQMWXfCJfxMAtL9Zq8JGMGSYxYqoEOI1V/9vjr4L42OOrMnW/zgLDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-23T17:58:37.284372Z"},"content_sha256":"52a65eb297ac548dce9e3fae23ab0af683a239c8bce003bbacddd877417335bc","schema_version":"1.0","event_id":"sha256:52a65eb297ac548dce9e3fae23ab0af683a239c8bce003bbacddd877417335bc"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:XS5PEADDJXOSTASMPOOMXNMYAG","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Web Template Extraction Based on Hyperlink Analysis","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.IR","authors_text":"David Insa (Universitat Polit\\`ecnica de Val\\`encia), Josep Silva (Universitat Polit\\`ecnica de Val\\`encia), Juli\\'an Alarte (Universitat Polit\\`ecnica de Val\\`encia), Salvador Tamarit (Universidad Polit\\'ecnica de Madrid)","submitted_at":"2015-01-09T03:59:36Z","abstract_excerpt":"Web templates are one of the main development resources for website engineers.  Templates allow them to increase productivity by plugin content into already formatted and prepared pagelets. For the final user templates are also useful, because they provide uniformity and a common look and feel for all webpages.    However, from the point of view of crawlers and indexers, templates are an important problem, because templates usually contain irrelevant information such as advertisements, menus, and banners. Processing and storing this information is likely to lead to a waste of resources (storag"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1501.02031","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:29:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"IsZ05olxzu0sAJYJ5fKbHCKs0q54N4H4+7FvM8Nxoyl9FbPkOqlGwMQ1fnYkr8OuJhIsqZ/5nKeV8SrshqJFAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-23T17:58:37.284734Z"},"content_sha256":"9b2048593ba76b01b7caa8c2f759976d679fe2a576b03dc7fdb7d56fc177a85d","schema_version":"1.0","event_id":"sha256:9b2048593ba76b01b7caa8c2f759976d679fe2a576b03dc7fdb7d56fc177a85d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/XS5PEADDJXOSTASMPOOMXNMYAG/bundle.json","state_url":"https://pith.science/pith/XS5PEADDJXOSTASMPOOMXNMYAG/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/XS5PEADDJXOSTASMPOOMXNMYAG/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-23T17:58:37Z","links":{"resolver":"https://pith.science/pith/XS5PEADDJXOSTASMPOOMXNMYAG","bundle":"https://pith.science/pith/XS5PEADDJXOSTASMPOOMXNMYAG/bundle.json","state":"https://pith.science/pith/XS5PEADDJXOSTASMPOOMXNMYAG/state.json","well_known_bundle":"https://pith.science/.well-known/pith/XS5PEADDJXOSTASMPOOMXNMYAG/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:XS5PEADDJXOSTASMPOOMXNMYAG","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"41661712acf66919de32554538f805e928d76dcdf02238166fdbb5a9e54a61ee","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2015-01-09T03:59:36Z","title_canon_sha256":"41fd9da223c5ebb352f790b12ae4266459eca7b87e5913feb889c09b91a180fe"},"schema_version":"1.0","source":{"id":"1501.02031","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1501.02031","created_at":"2026-05-18T02:29:45Z"},{"alias_kind":"arxiv_version","alias_value":"1501.02031v1","created_at":"2026-05-18T02:29:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1501.02031","created_at":"2026-05-18T02:29:45Z"},{"alias_kind":"pith_short_12","alias_value":"XS5PEADDJXOS","created_at":"2026-05-18T12:29:50Z"},{"alias_kind":"pith_short_16","alias_value":"XS5PEADDJXOSTASM","created_at":"2026-05-18T12:29:50Z"},{"alias_kind":"pith_short_8","alias_value":"XS5PEADD","created_at":"2026-05-18T12:29:50Z"}],"graph_snapshots":[{"event_id":"sha256:9b2048593ba76b01b7caa8c2f759976d679fe2a576b03dc7fdb7d56fc177a85d","target":"graph","created_at":"2026-05-18T02:29:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Web templates are one of the main development resources for website engineers.  Templates allow them to increase productivity by plugin content into already formatted and prepared pagelets. For the final user templates are also useful, because they provide uniformity and a common look and feel for all webpages.    However, from the point of view of crawlers and indexers, templates are an important problem, because templates usually contain irrelevant information such as advertisements, menus, and banners. Processing and storing this information is likely to lead to a waste of resources (storag","authors_text":"David Insa (Universitat Polit\\`ecnica de Val\\`encia), Josep Silva (Universitat Polit\\`ecnica de Val\\`encia), Juli\\'an Alarte (Universitat Polit\\`ecnica de Val\\`encia), Salvador Tamarit (Universidad Polit\\'ecnica de Madrid)","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2015-01-09T03:59:36Z","title":"Web Template Extraction Based on Hyperlink Analysis"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1501.02031","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:52a65eb297ac548dce9e3fae23ab0af683a239c8bce003bbacddd877417335bc","target":"record","created_at":"2026-05-18T02:29:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"41661712acf66919de32554538f805e928d76dcdf02238166fdbb5a9e54a61ee","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2015-01-09T03:59:36Z","title_canon_sha256":"41fd9da223c5ebb352f790b12ae4266459eca7b87e5913feb889c09b91a180fe"},"schema_version":"1.0","source":{"id":"1501.02031","kind":"arxiv","version":1}},"canonical_sha256":"bcbaf200634ddd29824c7b9ccbb59801bb53e3523d1df067e13620e55dbc2966","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"bcbaf200634ddd29824c7b9ccbb59801bb53e3523d1df067e13620e55dbc2966","first_computed_at":"2026-05-18T02:29:45.000152Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:29:45.000152Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"YdgZjy/xFZhpMA2QCq+CmSdIX9ni+LufbSCCDJFahJLICjMJgS1fFwWcMuh6WILl1sg9zO231ynF4FdpAwF6BQ==","signature_status":"signed_v1","signed_at":"2026-05-18T02:29:45.000574Z","signed_message":"canonical_sha256_bytes"},"source_id":"1501.02031","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:52a65eb297ac548dce9e3fae23ab0af683a239c8bce003bbacddd877417335bc","sha256:9b2048593ba76b01b7caa8c2f759976d679fe2a576b03dc7fdb7d56fc177a85d"],"state_sha256":"236b0d2f46f04496a666006d77200626f200fddfeef1df9aa27e4c0209302310"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ibMEcxfv862IMY0YeNCK4NdLr30mIPHFz4tp75tjoom7f2+ZPg9Rh/y7xCnTlsjSq8EWK+QuMt/HYySDhFf7BA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-23T17:58:37.286715Z","bundle_sha256":"e624d24e256fcbd76105b65fca92f3961bfb57ac42d7ca59de71a1e2eb4caf52"}}