{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:EK3V5POC6QU4XR3JXTSAE2KKR2","short_pith_number":"pith:EK3V5POC","schema_version":"1.0","canonical_sha256":"22b75ebdc2f429cbc769bce402694a8ebc2cbb8edc2b77927a5e35ba113271b8","source":{"kind":"arxiv","id":"2606.08867","version":1},"attestation_state":"computed","paper":{"title":"Building Customer Support AI Agents at 100M-User Scale: An Evaluation-Driven Framework","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Aman Gupta, Carolina Baptista de Lima, Daniel Silva, Edesio Alcoba\\c{c}a, Herbert Fei, Jose Chrystian Lima Pacheco, Kevin Rossell, Luis Moneda, Luiz Paulo Rabachini, Rohan Ramanath, Shao Tang","submitted_at":"2026-06-07T22:44:00Z","abstract_excerpt":"The rapid rise in LLM capabilities has made AI agents increasingly viable across a broad range of tasks. Among the most promising applications is building production-ready customer-facing agents, a challenge that demands coordinated excellence in evaluation methodology, context engineering, training, and online measurement. Yet these critical pillars are typically developed in isolation, creating blind spots that only surface after deployment.\n  In this paper, we present a unified framework that bridges offline development with online impact for customer support AI agents at Nubank, a company "},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2606.08867","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2026-06-07T22:44:00Z","cross_cats_sorted":[],"title_canon_sha256":"06b461d196f1ccce2c74643ffce9b5583ce06c4c29b2f19b229175132133a23e","abstract_canon_sha256":"d0f47b80655ea67b711133e27960e19273c13ba5198d7f1755934afa1f0b1517"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-09T02:07:43.855735Z","signature_b64":"IFMUJbZvdDr0+mtFlJqko0m1pK26A21pYip3un9c9ep+JuUr/NXFHg/hD/l8sPQhkkDVojsLTuWpFPu5ui0xDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"22b75ebdc2f429cbc769bce402694a8ebc2cbb8edc2b77927a5e35ba113271b8","last_reissued_at":"2026-06-09T02:07:43.854743Z","signature_status":"signed_v1","first_computed_at":"2026-06-09T02:07:43.854743Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Building Customer Support AI Agents at 100M-User Scale: An Evaluation-Driven Framework","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Aman Gupta, Carolina Baptista de Lima, Daniel Silva, Edesio Alcoba\\c{c}a, Herbert Fei, Jose Chrystian Lima Pacheco, Kevin Rossell, Luis Moneda, Luiz Paulo Rabachini, Rohan Ramanath, Shao Tang","submitted_at":"2026-06-07T22:44:00Z","abstract_excerpt":"The rapid rise in LLM capabilities has made AI agents increasingly viable across a broad range of tasks. Among the most promising applications is building production-ready customer-facing agents, a challenge that demands coordinated excellence in evaluation methodology, context engineering, training, and online measurement. Yet these critical pillars are typically developed in isolation, creating blind spots that only surface after deployment.\n  In this paper, we present a unified framework that bridges offline development with online impact for customer support AI agents at Nubank, a company "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.08867","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.08867/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2606.08867","created_at":"2026-06-09T02:07:43.854913+00:00"},{"alias_kind":"arxiv_version","alias_value":"2606.08867v1","created_at":"2026-06-09T02:07:43.854913+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.08867","created_at":"2026-06-09T02:07:43.854913+00:00"},{"alias_kind":"pith_short_12","alias_value":"EK3V5POC6QU4","created_at":"2026-06-09T02:07:43.854913+00:00"},{"alias_kind":"pith_short_16","alias_value":"EK3V5POC6QU4XR3J","created_at":"2026-06-09T02:07:43.854913+00:00"},{"alias_kind":"pith_short_8","alias_value":"EK3V5POC","created_at":"2026-06-09T02:07:43.854913+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/EK3V5POC6QU4XR3JXTSAE2KKR2","json":"https://pith.science/pith/EK3V5POC6QU4XR3JXTSAE2KKR2.json","graph_json":"https://pith.science/api/pith-number/EK3V5POC6QU4XR3JXTSAE2KKR2/graph.json","events_json":"https://pith.science/api/pith-number/EK3V5POC6QU4XR3JXTSAE2KKR2/events.json","paper":"https://pith.science/paper/EK3V5POC"},"agent_actions":{"view_html":"https://pith.science/pith/EK3V5POC6QU4XR3JXTSAE2KKR2","download_json":"https://pith.science/pith/EK3V5POC6QU4XR3JXTSAE2KKR2.json","view_paper":"https://pith.science/paper/EK3V5POC","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2606.08867&json=true","fetch_graph":"https://pith.science/api/pith-number/EK3V5POC6QU4XR3JXTSAE2KKR2/graph.json","fetch_events":"https://pith.science/api/pith-number/EK3V5POC6QU4XR3JXTSAE2KKR2/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/EK3V5POC6QU4XR3JXTSAE2KKR2/action/timestamp_anchor","attest_storage":"https://pith.science/pith/EK3V5POC6QU4XR3JXTSAE2KKR2/action/storage_attestation","attest_author":"https://pith.science/pith/EK3V5POC6QU4XR3JXTSAE2KKR2/action/author_attestation","sign_citation":"https://pith.science/pith/EK3V5POC6QU4XR3JXTSAE2KKR2/action/citation_signature","submit_replication":"https://pith.science/pith/EK3V5POC6QU4XR3JXTSAE2KKR2/action/replication_record"}},"created_at":"2026-06-09T02:07:43.854913+00:00","updated_at":"2026-06-09T02:07:43.854913+00:00"}