{"count": 308, "next": null, "previous": null, "results": [{"id": 3792, "uid": "9bf31c7ff062936a96d3c8bd1f8f2ff3", "name": "EarthSight: A Distributed Framework for Low-Latency Satellite Intelligence", "authors": [{"id": 27599, "fullname": "Ansel Erol", "url": "http://mlsys.org/api/miniconf/users/27599?format=json", "institution": "Georgia Institute of Technology"}, {"id": 28491, "fullname": "Seungjun Lee", "url": "http://mlsys.org/api/miniconf/users/28491?format=json", "institution": "Korea Advanced Institute of Science &amp; Technology"}, {"id": 27358, "fullname": "Divya Mahajan", "url": "http://mlsys.org/api/miniconf/users/27358?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Efficient ML", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3792", "url": "https://github.com/scai-tech/earthsight", "sourceid": -15, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T14:00:00-07:00", "endtime": "2026-05-21T14:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3710?format=json", "parent_id": 3710, "eventmedia": [{"id": 1226, "modified": "2026-05-20T08:46:49.165562-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3792_EM9rZRX.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3569?format=json"], "related_events_ids": [3569]}, {"id": 3734, "uid": "d1fe173d08e959397adf34b1d77e88d7", "name": "Machine Learning Fleet Efficiency: Improving TPU Systems at Scale with ML Productivity Goodput", "authors": [{"id": 27181, "fullname": "Arissa Wongpanich", "url": "http://mlsys.org/api/miniconf/users/27181?format=json", "institution": "Google"}, {"id": 11197, "fullname": "Tayo Oguntebi", "url": "http://mlsys.org/api/miniconf/users/11197?format=json", "institution": "Google LLC"}, {"id": 27182, "fullname": "Jose Baiocchi Paredes", "url": "http://mlsys.org/api/miniconf/users/27182?format=json", "institution": "Google"}, {"id": 11105, "fullname": "Yu Wang", "url": "http://mlsys.org/api/miniconf/users/11105?format=json", "institution": "Harvard University"}, {"id": 27183, "fullname": "Phitchaya Phothilimthana", "url": "http://mlsys.org/api/miniconf/users/27183?format=json", "institution": "OpenAI"}, {"id": 27184, "fullname": "Ritwika Mitra", "url": "http://mlsys.org/api/miniconf/users/27184?format=json", "institution": "Google"}, {"id": 27185, "fullname": "Zongwei Zhou", "url": "http://mlsys.org/api/miniconf/users/27185?format=json", "institution": null}, {"id": 11194, "fullname": "Naveen Kumar", "url": "http://mlsys.org/api/miniconf/users/11194?format=json", "institution": "Google"}, {"id": 10754, "fullname": "Vijay Janapa Reddi", "url": "http://mlsys.org/api/miniconf/users/10754?format=json", "institution": "Harvard University"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Benchmarks and Evaluation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3734", "url": null, "sourceid": -79, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T17:45:00-07:00", "endtime": "2026-05-21T18:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3717?format=json", "parent_id": 3717, "eventmedia": [{"id": 1140, "modified": "2026-05-25T21:58:49.633917-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3734_MKeQyls.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3511?format=json"], "related_events_ids": [3511]}, {"id": 3783, "uid": "7f1de29e6da19d22b51c68001e7e0e54", "name": "Learning from Less: Measuring the Effectiveness of RLVR in Low Data and Compute Regimes", "authors": [{"id": 27558, "fullname": "Justin Bauer", "url": "http://mlsys.org/api/miniconf/users/27558?format=json", "institution": "Snorkel AI"}, {"id": 27559, "fullname": "Thomas Walshe", "url": "http://mlsys.org/api/miniconf/users/27559?format=json", "institution": "Reflection AI"}, {"id": 27560, "fullname": "Derek Pham", "url": "http://mlsys.org/api/miniconf/users/27560?format=json", "institution": "Snorkel AI"}, {"id": 27561, "fullname": "Harit Vishwakarma", "url": "http://mlsys.org/api/miniconf/users/27561?format=json", "institution": "University of Wisconsin, Madison"}, {"id": 27562, "fullname": "Armin Parchami", "url": "http://mlsys.org/api/miniconf/users/27562?format=json", "institution": "Snorkel AI"}, {"id": 27563, "fullname": "Frederic Sala", "url": "http://mlsys.org/api/miniconf/users/27563?format=json", "institution": "University of Wisconsin, Madison"}, {"id": 27564, "fullname": "Paroma Varma", "url": "http://mlsys.org/api/miniconf/users/27564?format=json", "institution": "Snorkel AI"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3783", "url": null, "sourceid": -135, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T16:00:00-07:00", "endtime": "2026-05-20T16:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3692?format=json", "parent_id": 3692, "eventmedia": [{"id": 1092, "modified": "2026-05-15T12:19:03.072214-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3783.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3560?format=json"], "related_events_ids": [3560]}, {"id": 3574, "uid": "a87ff679a2f3e71d9181a67b7542122c", "name": "Spira: Exploiting Voxel Data Structural Properties for Efficient Sparse Convolution in Point Cloud Networks", "authors": [{"id": 28464, "fullname": "Dionysios Adamopoulos", "url": "http://mlsys.org/api/miniconf/users/28464?format=json", "institution": "National Technical University of Athens"}, {"id": 27614, "fullname": "Anastasia Poulopoulou", "url": "http://mlsys.org/api/miniconf/users/27614?format=json", "institution": ""}, {"id": 27615, "fullname": "Georgios Goumas", "url": "http://mlsys.org/api/miniconf/users/27615?format=json", "institution": "National Technical University of Athens"}, {"id": 16879, "fullname": "Christina Giannoula", "url": "http://mlsys.org/api/miniconf/users/16879?format=json", "institution": "Max Planck Institute for Software Systems (MPI-SWS)"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3574", "url": "https://github.com/SPIN-Research-Group/Spira", "sourceid": 4, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=YQMilw805Q", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 868, "modified": "2026-03-23T21:52:45.845629-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=YQMilw805Q", "resourcetype": "UriEventmedia"}, {"id": 967, "file": "/media/PosterPDFs/MLSys%202026/3574.png", "modified": "2026-05-05T04:19:18.887828-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 968, "file": "/media/PosterPDFs/MLSys%202026/3574-thumb.png", "modified": "2026-05-05T04:19:18.988531-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "46", "related_events": ["http://mlsys.org/api/miniconf/events/3797?format=json"], "related_events_ids": [3797]}, {"id": 3825, "uid": "7f39f8317fbdb1988ef4c628eba02591", "name": "HetRL: Efficient Reinforcement Learning for LLMs in Heterogeneous Environments", "authors": [{"id": 26252, "fullname": "Yongjun He", "url": "http://mlsys.org/api/miniconf/users/26252?format=json", "institution": "ETH Zurich"}, {"id": 12135, "fullname": "Shuai Zhang", "url": "http://mlsys.org/api/miniconf/users/12135?format=json", "institution": "Amazon Web Services"}, {"id": 28961, "fullname": "Jiading Gai", "url": "http://mlsys.org/api/miniconf/users/28961?format=json", "institution": "Amazon"}, {"id": 27748, "fullname": "Xiyuan Zhang", "url": "http://mlsys.org/api/miniconf/users/27748?format=json", "institution": "AWS"}, {"id": 27749, "fullname": "Boran Han", "url": "http://mlsys.org/api/miniconf/users/27749?format=json", "institution": "Amazon/AWS"}, {"id": 27750, "fullname": "Bernie Wang", "url": "http://mlsys.org/api/miniconf/users/27750?format=json", "institution": "Amazon"}, {"id": 28496, "fullname": "Huzefa Rangwala", "url": "http://mlsys.org/api/miniconf/users/28496?format=json", "institution": "Siemens Corporate Research"}, {"id": 27637, "fullname": "George Karypis", "url": "http://mlsys.org/api/miniconf/users/27637?format=json", "institution": "University of Minnesota, Minneapolis"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3825", "url": null, "sourceid": -61, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T15:30:00-07:00", "endtime": "2026-05-20T15:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3692?format=json", "parent_id": 3692, "eventmedia": [{"id": 1156, "modified": "2026-05-17T21:19:00.961928-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3825_dNuKxpR.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3602?format=json"], "related_events_ids": [3602]}, {"id": 3543, "uid": "f899139df5e1059396431415e770c6dd", "name": "Beat the long tail: Distribution-Aware Speculative Decoding for RL Training", "authors": [{"id": 21038, "fullname": "Zelei Shao", "url": "http://mlsys.org/api/miniconf/users/21038?format=json", "institution": "Together AI"}, {"id": 27361, "fullname": "Vikranth Srivatsa", "url": "http://mlsys.org/api/miniconf/users/27361?format=json", "institution": "University of California, San Diego"}, {"id": 27362, "fullname": "Sanjana Srivastava", "url": "http://mlsys.org/api/miniconf/users/27362?format=json", "institution": null}, {"id": 25635, "fullname": "Qingyang Wu", "url": "http://mlsys.org/api/miniconf/users/25635?format=json", "institution": "Together AI"}, {"id": 27254, "fullname": "Alpay Ariyak", "url": "http://mlsys.org/api/miniconf/users/27254?format=json", "institution": null}, {"id": 23865, "fullname": "Xiaoxia Wu", "url": "http://mlsys.org/api/miniconf/users/23865?format=json", "institution": "TogtherAI"}, {"id": 18639, "fullname": "Ameen Patel", "url": "http://mlsys.org/api/miniconf/users/18639?format=json", "institution": "Together.ai"}, {"id": 27251, "fullname": "Jue Wang", "url": "http://mlsys.org/api/miniconf/users/27251?format=json", "institution": "Together AI"}, {"id": 27363, "fullname": "Percy Liang", "url": "http://mlsys.org/api/miniconf/users/27363?format=json", "institution": "Stanford University"}, {"id": 18765, "fullname": "Tri Dao", "url": "http://mlsys.org/api/miniconf/users/18765?format=json", "institution": "Princeton University, Together AI"}, {"id": 18868, "fullname": "Ce Zhang", "url": "http://mlsys.org/api/miniconf/users/18868?format=json", "institution": null}, {"id": 26292, "fullname": "Yiying Zhang", "url": "http://mlsys.org/api/miniconf/users/26292?format=json", "institution": "UCSD and GenseeAI"}, {"id": 18231, "fullname": "Ben Athiwaratkun", "url": "http://mlsys.org/api/miniconf/users/18231?format=json", "institution": null}, {"id": 24298, "fullname": "Chenfeng Xu", "url": "http://mlsys.org/api/miniconf/users/24298?format=json", "institution": "Together AI/UT Austin"}, {"id": 27250, "fullname": "Junxiong Wang", "url": "http://mlsys.org/api/miniconf/users/27250?format=json", "institution": "TogetherAI"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3543", "url": null, "sourceid": 100, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=kMeqqPBjSl", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 837, "modified": "2026-03-23T21:52:44.534495-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=kMeqqPBjSl", "resourcetype": "UriEventmedia"}, {"id": 1227, "file": "/media/PosterPDFs/MLSys%202026/3543.png", "modified": "2026-05-19T13:15:23.214150-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1228, "file": "/media/PosterPDFs/MLSys%202026/3543-thumb.png", "modified": "2026-05-19T13:15:23.319405-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "35", "related_events": ["http://mlsys.org/api/miniconf/events/3766?format=json"], "related_events_ids": [3766]}, {"id": 3853, "uid": "c0c7c76d30bd3dcaefc96f40275bdc0a", "name": "ADR: AN AGENTIC DETECTION SYSTEMFORENTERPRISE AGENTIC AI SECURITY", "authors": [{"id": 27880, "fullname": "Chenning Li", "url": "http://mlsys.org/api/miniconf/users/27880?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 17735, "fullname": "Pan Hu", "url": "http://mlsys.org/api/miniconf/users/17735?format=json", "institution": "Uber"}, {"id": 28472, "fullname": "Justin Xu", "url": "http://mlsys.org/api/miniconf/users/28472?format=json", "institution": "University of Oxford"}, {"id": 27882, "fullname": "Baris Ozbas", "url": "http://mlsys.org/api/miniconf/users/27882?format=json", "institution": "Uber"}, {"id": 27883, "fullname": "Olivia Liu", "url": "http://mlsys.org/api/miniconf/users/27883?format=json", "institution": ""}, {"id": 25578, "fullname": "Caroline Van", "url": "http://mlsys.org/api/miniconf/users/25578?format=json", "institution": "Uber Technologies"}, {"id": 27884, "fullname": "Manxue Li", "url": "http://mlsys.org/api/miniconf/users/27884?format=json", "institution": null}, {"id": 27885, "fullname": "Wei Zhou", "url": "http://mlsys.org/api/miniconf/users/27885?format=json", "institution": "Uber"}, {"id": 12450, "fullname": "Mohammad Alizadeh", "url": "http://mlsys.org/api/miniconf/users/12450?format=json", "institution": "MIT CSAIL"}, {"id": 27886, "fullname": "Pengyu Zhang", "url": "http://mlsys.org/api/miniconf/users/27886?format=json", "institution": "Uber"}, {"id": 28966, "fullname": "KK Sriramadhesikan", "url": "http://mlsys.org/api/miniconf/users/28966?format=json", "institution": null}, {"id": 28967, "fullname": "Ming Zhang", "url": "http://mlsys.org/api/miniconf/users/28967?format=json", "institution": null}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Agentic AI/MLSys", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3853", "url": null, "sourceid": -50, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T08:30:00-07:00", "endtime": "2026-05-21T08:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3700?format=json", "parent_id": 3700, "eventmedia": [{"id": 1246, "modified": "2026-05-21T13:48:12.291138-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3853_k9cXWDE.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3630?format=json"], "related_events_ids": [3630]}, {"id": 3781, "uid": "7f6ffaa6bb0b408017b62254211691b5", "name": "AIRS: Scaling Live Inference in Resource Constrained Environments", "authors": [{"id": 27552, "fullname": "Nilesh Jagnik", "url": "http://mlsys.org/api/miniconf/users/27552?format=json", "institution": "Google"}, {"id": 27553, "fullname": "Xiaohao Yang", "url": "http://mlsys.org/api/miniconf/users/27553?format=json", "institution": null}, {"id": 27554, "fullname": "Tuan Do", "url": "http://mlsys.org/api/miniconf/users/27554?format=json", "institution": null}, {"id": 27555, "fullname": "Chelsea Chen", "url": "http://mlsys.org/api/miniconf/users/27555?format=json", "institution": null}, {"id": 27556, "fullname": "Harshvardhan GM", "url": "http://mlsys.org/api/miniconf/users/27556?format=json", "institution": "Google LLC"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Benchmarks and Evaluation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3781", "url": null, "sourceid": -112, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T16:45:00-07:00", "endtime": "2026-05-21T17:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3717?format=json", "parent_id": 3717, "eventmedia": [{"id": 1247, "modified": "2026-05-21T17:10:37.128443-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3781.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3558?format=json"], "related_events_ids": [3558]}, {"id": 3823, "uid": "54229abfcfa5649e7003b83dd4755294", "name": "Optimizing PyTorch Inference with LLM-Based Multi-Agent Systems", "authors": [{"id": 27737, "fullname": "Kirill Nagaitsev", "url": "http://mlsys.org/api/miniconf/users/27737?format=json", "institution": "Northwestern University"}, {"id": 27738, "fullname": "Luka Grbcic", "url": "http://mlsys.org/api/miniconf/users/27738?format=json", "institution": "Lawrence Berkeley National Laboratory"}, {"id": 27739, "fullname": "Samuel Williams", "url": "http://mlsys.org/api/miniconf/users/27739?format=json", "institution": "Lawrence Berkeley National Lab"}, {"id": 27740, "fullname": "Costin Iancu", "url": "http://mlsys.org/api/miniconf/users/27740?format=json", "institution": "Ambassador University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Agentic AI 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3823", "url": null, "sourceid": -91, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T13:45:00-07:00", "endtime": "2026-05-19T14:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3668?format=json", "parent_id": 3668, "eventmedia": [{"id": 1096, "modified": "2026-05-15T13:08:20.950344-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3823.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3600?format=json"], "related_events_ids": [3600]}, {"id": 3816, "uid": "fc490ca45c00b1249bbe3554a4fdf6fb", "name": "MorphServe: Efficient and Workload-Aware LLM Serving via Runtime Quantized Layer Swapping and KV Cache Resizing", "authors": [{"id": 27401, "fullname": "Zhaoyuan Su", "url": "http://mlsys.org/api/miniconf/users/27401?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27679, "fullname": "Zeyu Zhang", "url": "http://mlsys.org/api/miniconf/users/27679?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27403, "fullname": "Tingfeng Lan", "url": "http://mlsys.org/api/miniconf/users/27403?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27405, "fullname": "Zirui Wang", "url": "http://mlsys.org/api/miniconf/users/27405?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27680, "fullname": "Haiying Shen", "url": "http://mlsys.org/api/miniconf/users/27680?format=json", "institution": null}, {"id": 27681, "fullname": "Juncheng Yang", "url": "http://mlsys.org/api/miniconf/users/27681?format=json", "institution": "Harvard University"}, {"id": 27406, "fullname": "Yue Cheng", "url": "http://mlsys.org/api/miniconf/users/27406?format=json", "institution": "University of Virginia, Charlottesville"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3816", "url": null, "sourceid": -65, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T08:45:00-07:00", "endtime": "2026-05-20T09:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3678?format=json", "parent_id": 3678, "eventmedia": [{"id": 1078, "modified": "2026-05-21T21:23:14.249281-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3816_X9jZeWW.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3593?format=json"], "related_events_ids": [3593]}, {"id": 3556, "uid": "c9e1074f5b3f9fc8ea15d152add07294", "name": "Attribution-based Sparse Activation in Large Language Models", "authors": [{"id": 27495, "fullname": "Jifeng Song", "url": "http://mlsys.org/api/miniconf/users/27495?format=json", "institution": "University of Pittsburgh"}, {"id": 27496, "fullname": "Xiangyu Yin", "url": "http://mlsys.org/api/miniconf/users/27496?format=json", "institution": "University of Pittsburgh"}, {"id": 27497, "fullname": "Boyuan Yang", "url": "http://mlsys.org/api/miniconf/users/27497?format=json", "institution": "University of Pittsburgh"}, {"id": 27498, "fullname": "Kai Huang", "url": "http://mlsys.org/api/miniconf/users/27498?format=json", "institution": "University of Pittsburgh"}, {"id": 27499, "fullname": "Weichen Liu", "url": "http://mlsys.org/api/miniconf/users/27499?format=json", "institution": "University of Pittsburgh"}, {"id": 27500, "fullname": "Wei Gao", "url": "http://mlsys.org/api/miniconf/users/27500?format=json", "institution": "University of Pittsburgh"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3556", "url": null, "sourceid": 104, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=gJFigZeb5D", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 850, "modified": "2026-03-23T21:52:45.078334-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=gJFigZeb5D", "resourcetype": "UriEventmedia"}, {"id": 1109, "file": "/media/PosterPDFs/MLSys%202026/3556.png", "modified": "2026-05-15T14:40:41.538291-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1110, "file": "/media/PosterPDFs/MLSys%202026/3556-thumb.png", "modified": "2026-05-15T14:40:41.628052-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "48", "related_events": ["http://mlsys.org/api/miniconf/events/3779?format=json"], "related_events_ids": [3779]}, {"id": 3808, "uid": "19ca14e7ea6328a42e0eb13d585e4c22", "name": "AccelOpt: A Self-Improving LLM Agentic System for AI Accelerator Kernel Optimization", "authors": [{"id": 18114, "fullname": "Genghan Zhang", "url": "http://mlsys.org/api/miniconf/users/18114?format=json", "institution": "Stanford University"}, {"id": 27646, "fullname": "Shaowei Zhu", "url": "http://mlsys.org/api/miniconf/users/27646?format=json", "institution": "Amazon"}, {"id": 27647, "fullname": "Anjiang Wei", "url": "http://mlsys.org/api/miniconf/users/27647?format=json", "institution": null}, {"id": 27171, "fullname": "Zhenyu Song", "url": "http://mlsys.org/api/miniconf/users/27171?format=json", "institution": null}, {"id": 27648, "fullname": "Allen Nie", "url": "http://mlsys.org/api/miniconf/users/27648?format=json", "institution": "Google DeepMind"}, {"id": 15476, "fullname": "Zhen Jia", "url": "http://mlsys.org/api/miniconf/users/15476?format=json", "institution": "Amazon"}, {"id": 17626, "fullname": "Nandita Vijaykumar", "url": "http://mlsys.org/api/miniconf/users/17626?format=json", "institution": "Department of Computer Science, University of Toronto"}, {"id": 11990, "fullname": "Yida Wang", "url": "http://mlsys.org/api/miniconf/users/11990?format=json", "institution": "Amazon"}, {"id": 15013, "fullname": "Kunle Olukotun", "url": "http://mlsys.org/api/miniconf/users/15013?format=json", "institution": "Stanford"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Compilers and Kernels", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3808", "url": "https://ppl.stanford.edu/accelopt.html", "sourceid": -36, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T17:00:00-07:00", "endtime": "2026-05-21T17:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3718?format=json", "parent_id": 3718, "eventmedia": [{"id": 1248, "modified": "2026-05-21T23:27:39.250012-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3808.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3585?format=json"], "related_events_ids": [3585]}, {"id": 3862, "uid": "a684eceee76fc522773286a895bc8436", "name": "Sparing Strategies to Minimize Reliability Impact On Large Training Jobs", "authors": [{"id": 27967, "fullname": "Kevin Quirk", "url": "http://mlsys.org/api/miniconf/users/27967?format=json", "institution": null}, {"id": 27968, "fullname": "Matthew Lennie", "url": "http://mlsys.org/api/miniconf/users/27968?format=json", "institution": null}, {"id": 27969, "fullname": "Ehsan K. Ardestani", "url": "http://mlsys.org/api/miniconf/users/27969?format=json", "institution": "Meta"}, {"id": 27970, "fullname": "Satyajeet Ahuja", "url": "http://mlsys.org/api/miniconf/users/27970?format=json", "institution": null}, {"id": 27971, "fullname": "Matthew Bergeron", "url": "http://mlsys.org/api/miniconf/users/27971?format=json", "institution": null}, {"id": 27972, "fullname": "Andrew Grier", "url": "http://mlsys.org/api/miniconf/users/27972?format=json", "institution": null}, {"id": 27973, "fullname": "Zhaodong Wang", "url": "http://mlsys.org/api/miniconf/users/27973?format=json", "institution": "Facebook"}, {"id": 27974, "fullname": "Mustafa Ozdal", "url": "http://mlsys.org/api/miniconf/users/27974?format=json", "institution": null}, {"id": 27975, "fullname": "Xu Zhang", "url": "http://mlsys.org/api/miniconf/users/27975?format=json", "institution": "Meta Platforms"}, {"id": 27976, "fullname": "Abhinav Triguna", "url": "http://mlsys.org/api/miniconf/users/27976?format=json", "institution": null}, {"id": 27977, "fullname": "Ying Zhang", "url": "http://mlsys.org/api/miniconf/users/27977?format=json", "institution": "University of Michigan - Ann Arbor"}, {"id": 28524, "fullname": "Mathew Oldham", "url": "http://mlsys.org/api/miniconf/users/28524?format=json", "institution": null}, {"id": 28959, "fullname": "Chunqiang Tang", "url": "http://mlsys.org/api/miniconf/users/28959?format=json", "institution": "Facebook"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: LLM Training 4", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3862", "url": null, "sourceid": -54, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T14:45:00-07:00", "endtime": "2026-05-21T15:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3713?format=json", "parent_id": 3713, "eventmedia": [{"id": 1104, "modified": "2026-05-22T08:55:58.209544-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3862_xkbT8SW.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3639?format=json"], "related_events_ids": [3639]}, {"id": 3568, "uid": "3def184ad8f4755ff269862ea77393dd", "name": "PARROT: Persuasion and Agreement Robustness Rating of Output Truth \u2014 A Sycophancy Robustness Benchmark for LLMs", "authors": [{"id": 28463, "fullname": "\u00d6zay Ezerceli", "url": "http://mlsys.org/api/miniconf/users/28463?format=json", "institution": "Isik University"}, {"id": 27598, "fullname": "Mahmoud ElHussieni", "url": "http://mlsys.org/api/miniconf/users/27598?format=json", "institution": "Istanbul Medipol University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3568", "url": "https://github.com/YusufCelebii/parrot-revision", "sourceid": 125, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=cU2wiOnfm5", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 862, "modified": "2026-03-23T21:52:45.595554-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=cU2wiOnfm5", "resourcetype": "UriEventmedia"}, {"id": 1251, "file": "/media/PosterPDFs/MLSys%202026/3568.png", "modified": "2026-06-09T04:24:51.982785-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "31", "related_events": ["http://mlsys.org/api/miniconf/events/3791?format=json"], "related_events_ids": [3791]}, {"id": 3598, "uid": "2838023a778dfaecdc212708f721b788", "name": "FreeScale: Distributed Training for Sequence Recommendation Models with Minimal Scaling Cost", "authors": [{"id": 27718, "fullname": "Chenhao Feng", "url": "http://mlsys.org/api/miniconf/users/27718?format=json", "institution": ""}, {"id": 25617, "fullname": "Haoli Zhang", "url": "http://mlsys.org/api/miniconf/users/25617?format=json", "institution": "Meta"}, {"id": 27158, "fullname": "Shakhzod Ali-zade", "url": "http://mlsys.org/api/miniconf/users/27158?format=json", "institution": "Meta Platforms, Inc."}, {"id": 15737, "fullname": "Yanli Zhao", "url": "http://mlsys.org/api/miniconf/users/15737?format=json", "institution": null}, {"id": 11119, "fullname": "Liang Luo", "url": "http://mlsys.org/api/miniconf/users/11119?format=json", "institution": "Meta"}, {"id": 27719, "fullname": "Jennifer Cao", "url": "http://mlsys.org/api/miniconf/users/27719?format=json", "institution": "Facebook"}, {"id": 27720, "fullname": "Lisen Deng", "url": "http://mlsys.org/api/miniconf/users/27720?format=json", "institution": "Meta"}, {"id": 27721, "fullname": "Siqiao Chen", "url": "http://mlsys.org/api/miniconf/users/27721?format=json", "institution": null}, {"id": 27722, "fullname": "Chenyu Zhao", "url": "http://mlsys.org/api/miniconf/users/27722?format=json", "institution": "Facebook"}, {"id": 27723, "fullname": "Tristan Rice", "url": "http://mlsys.org/api/miniconf/users/27723?format=json", "institution": "Meta, PyTorch Distributed"}, {"id": 27724, "fullname": "Daniel Johnson", "url": "http://mlsys.org/api/miniconf/users/27724?format=json", "institution": null}, {"id": 27725, "fullname": "Min Si", "url": "http://mlsys.org/api/miniconf/users/27725?format=json", "institution": null}, {"id": 27726, "fullname": "Tiantu Xu", "url": "http://mlsys.org/api/miniconf/users/27726?format=json", "institution": "Meta"}, {"id": 27727, "fullname": "Yi Zhang", "url": "http://mlsys.org/api/miniconf/users/27727?format=json", "institution": "Facebook"}, {"id": 27728, "fullname": "Evgenii Kolpakov", "url": "http://mlsys.org/api/miniconf/users/27728?format=json", "institution": ""}, {"id": 27729, "fullname": "Siqi Yan", "url": "http://mlsys.org/api/miniconf/users/27729?format=json", "institution": "Facebook"}, {"id": 23924, "fullname": "Chuanhao Zhuge", "url": "http://mlsys.org/api/miniconf/users/23924?format=json", "institution": "Meta"}, {"id": 27730, "fullname": "Min Ni", "url": "http://mlsys.org/api/miniconf/users/27730?format=json", "institution": "Northwestern University"}, {"id": 27731, "fullname": "Bi Xue", "url": "http://mlsys.org/api/miniconf/users/27731?format=json", "institution": "Thinking Machines Lab"}, {"id": 27732, "fullname": "Qunshu Zhang", "url": "http://mlsys.org/api/miniconf/users/27732?format=json", "institution": "Facebook"}, {"id": 16149, "fullname": "Shen Li", "url": "http://mlsys.org/api/miniconf/users/16149?format=json", "institution": "Meta"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3598", "url": null, "sourceid": 51, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=MY0BIdK4hn", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 892, "modified": "2026-03-23T21:52:46.752798-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=MY0BIdK4hn", "resourcetype": "UriEventmedia"}, {"id": 1112, "file": "/media/PosterPDFs/MLSys%202026/3598.png", "modified": "2026-05-15T14:48:56.169711-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1113, "file": "/media/PosterPDFs/MLSys%202026/3598-thumb.png", "modified": "2026-05-15T15:01:52.231022-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "32", "related_events": ["http://mlsys.org/api/miniconf/events/3821?format=json"], "related_events_ids": [3821]}, {"id": 3821, "uid": "2838023a778dfaecdc212708f721b788", "name": "FreeScale: Distributed Training for Sequence Recommendation Models with Minimal Scaling Cost", "authors": [{"id": 27718, "fullname": "Chenhao Feng", "url": "http://mlsys.org/api/miniconf/users/27718?format=json", "institution": ""}, {"id": 25617, "fullname": "Haoli Zhang", "url": "http://mlsys.org/api/miniconf/users/25617?format=json", "institution": "Meta"}, {"id": 27158, "fullname": "Shakhzod Ali-zade", "url": "http://mlsys.org/api/miniconf/users/27158?format=json", "institution": "Meta Platforms, Inc."}, {"id": 15737, "fullname": "Yanli Zhao", "url": "http://mlsys.org/api/miniconf/users/15737?format=json", "institution": null}, {"id": 11119, "fullname": "Liang Luo", "url": "http://mlsys.org/api/miniconf/users/11119?format=json", "institution": "Meta"}, {"id": 27719, "fullname": "Jennifer Cao", "url": "http://mlsys.org/api/miniconf/users/27719?format=json", "institution": "Facebook"}, {"id": 27720, "fullname": "Lisen Deng", "url": "http://mlsys.org/api/miniconf/users/27720?format=json", "institution": "Meta"}, {"id": 27721, "fullname": "Siqiao Chen", "url": "http://mlsys.org/api/miniconf/users/27721?format=json", "institution": null}, {"id": 27722, "fullname": "Chenyu Zhao", "url": "http://mlsys.org/api/miniconf/users/27722?format=json", "institution": "Facebook"}, {"id": 27723, "fullname": "Tristan Rice", "url": "http://mlsys.org/api/miniconf/users/27723?format=json", "institution": "Meta, PyTorch Distributed"}, {"id": 27724, "fullname": "Daniel Johnson", "url": "http://mlsys.org/api/miniconf/users/27724?format=json", "institution": null}, {"id": 27725, "fullname": "Min Si", "url": "http://mlsys.org/api/miniconf/users/27725?format=json", "institution": null}, {"id": 27726, "fullname": "Tiantu Xu", "url": "http://mlsys.org/api/miniconf/users/27726?format=json", "institution": "Meta"}, {"id": 27727, "fullname": "Yi Zhang", "url": "http://mlsys.org/api/miniconf/users/27727?format=json", "institution": "Facebook"}, {"id": 27728, "fullname": "Evgenii Kolpakov", "url": "http://mlsys.org/api/miniconf/users/27728?format=json", "institution": ""}, {"id": 27729, "fullname": "Siqi Yan", "url": "http://mlsys.org/api/miniconf/users/27729?format=json", "institution": "Facebook"}, {"id": 23924, "fullname": "Chuanhao Zhuge", "url": "http://mlsys.org/api/miniconf/users/23924?format=json", "institution": "Meta"}, {"id": 27730, "fullname": "Min Ni", "url": "http://mlsys.org/api/miniconf/users/27730?format=json", "institution": "Northwestern University"}, {"id": 27731, "fullname": "Bi Xue", "url": "http://mlsys.org/api/miniconf/users/27731?format=json", "institution": "Thinking Machines Lab"}, {"id": 27732, "fullname": "Qunshu Zhang", "url": "http://mlsys.org/api/miniconf/users/27732?format=json", "institution": "Facebook"}, {"id": 16149, "fullname": "Shen Li", "url": "http://mlsys.org/api/miniconf/users/16149?format=json", "institution": "Meta"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: LLM Training 4", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3821", "url": null, "sourceid": -51, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T16:00:00-07:00", "endtime": "2026-05-21T16:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3713?format=json", "parent_id": 3713, "eventmedia": [{"id": 1097, "modified": "2026-05-15T14:17:13.785962-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3821_gs6415h.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3598?format=json"], "related_events_ids": [3598]}, {"id": 3813, "uid": "d2ddea18f00665ce8623e36bd4e3c7c5", "name": "PLayer-FL: A Principled Approach to Personalized Layer-wise Cross-Silo Federated Learning", "authors": [{"id": 27662, "fullname": "Ahmed Elhussein", "url": "http://mlsys.org/api/miniconf/users/27662?format=json", "institution": "Columbia University"}, {"id": 25923, "fullname": "Florent Pollet", "url": "http://mlsys.org/api/miniconf/users/25923?format=json", "institution": "Columbia University"}, {"id": 28492, "fullname": "Gamze Gursoy", "url": "http://mlsys.org/api/miniconf/users/28492?format=json", "institution": "University of Cambridge"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Federated Learning", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3813", "url": "https://github.com/G2Lab/PLayer-FL", "sourceid": -73, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T17:30:00-07:00", "endtime": "2026-05-19T17:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3672?format=json", "parent_id": 3672, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3590?format=json"], "related_events_ids": [3590]}, {"id": 3555, "uid": "68d30a9594728bc39aa24be94b319d21", "name": "Wave: A Symbolic Python DSL And Compiler for High-Performance Machine Learning", "authors": [{"id": 18549, "fullname": "Harsh Menon", "url": "http://mlsys.org/api/miniconf/users/18549?format=json", "institution": "AMD"}, {"id": 28460, "fullname": "Oleksandr Zinenko", "url": "http://mlsys.org/api/miniconf/users/28460?format=json", "institution": "Advanced Micro Devices"}, {"id": 25620, "fullname": "Gaurav Verma", "url": "http://mlsys.org/api/miniconf/users/25620?format=json", "institution": "Advanced Micro Devices, Inc. (AMD) and Stony Brook University, NY"}, {"id": 27188, "fullname": "Stanley Winata", "url": "http://mlsys.org/api/miniconf/users/27188?format=json", "institution": null}, {"id": 27487, "fullname": "Ivan Butygin", "url": "http://mlsys.org/api/miniconf/users/27487?format=json", "institution": null}, {"id": 27488, "fullname": "Nithin Meganathan", "url": "http://mlsys.org/api/miniconf/users/27488?format=json", "institution": "AMD"}, {"id": 27147, "fullname": "Sanket Pandit", "url": "http://mlsys.org/api/miniconf/users/27147?format=json", "institution": "Advanced Micro Devices"}, {"id": 27489, "fullname": "William Gallard Hatch", "url": "http://mlsys.org/api/miniconf/users/27489?format=json", "institution": "AMD"}, {"id": 27490, "fullname": "Surya Jasper", "url": "http://mlsys.org/api/miniconf/users/27490?format=json", "institution": null}, {"id": 27491, "fullname": "Megan Kuo", "url": "http://mlsys.org/api/miniconf/users/27491?format=json", "institution": null}, {"id": 27492, "fullname": "Sahil FAIZAL", "url": "http://mlsys.org/api/miniconf/users/27492?format=json", "institution": "AMD"}, {"id": 27493, "fullname": "Ashay Rane", "url": "http://mlsys.org/api/miniconf/users/27493?format=json", "institution": null}, {"id": 27494, "fullname": "Aurore De Spirlet", "url": "http://mlsys.org/api/miniconf/users/27494?format=json", "institution": null}, {"id": 26125, "fullname": "Martin P. L\u00fccke", "url": "http://mlsys.org/api/miniconf/users/26125?format=json", "institution": "AMD"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3555", "url": null, "sourceid": 84, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=gcXV1E8HRH", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 849, "modified": "2026-03-23T21:52:45.042858-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=gcXV1E8HRH", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "49", "related_events": ["http://mlsys.org/api/miniconf/events/3778?format=json"], "related_events_ids": [3778]}, {"id": 3529, "uid": "8613985ec49eb8f757ae6439e879bb2a", "name": "Meeting SLOs, Slashing Hours: Automated Enterprise LLM Optimization with OptiKIT", "authors": [{"id": 25907, "fullname": "Nicholas Santavas", "url": "http://mlsys.org/api/miniconf/users/25907?format=json", "institution": "eBay"}, {"id": 27293, "fullname": "Kareem Eissa", "url": "http://mlsys.org/api/miniconf/users/27293?format=json", "institution": "Siemens Healthineers"}, {"id": 27294, "fullname": "Patrycja Cieplicka", "url": "http://mlsys.org/api/miniconf/users/27294?format=json", "institution": null}, {"id": 27295, "fullname": "Piotr Florek", "url": "http://mlsys.org/api/miniconf/users/27295?format=json", "institution": ""}, {"id": 27296, "fullname": "Matteo Nulli", "url": "http://mlsys.org/api/miniconf/users/27296?format=json", "institution": "eBay Inc."}, {"id": 27297, "fullname": "Stefan Vasilev", "url": "http://mlsys.org/api/miniconf/users/27297?format=json", "institution": "eBay Inc."}, {"id": 27298, "fullname": "Seyyed Hashemi", "url": "http://mlsys.org/api/miniconf/users/27298?format=json", "institution": "eBay Inc."}, {"id": 27299, "fullname": "Antonios Gasteratos", "url": "http://mlsys.org/api/miniconf/users/27299?format=json", "institution": "Dimocritus University of Thrace"}, {"id": 27300, "fullname": "Shahram Khadivi", "url": "http://mlsys.org/api/miniconf/users/27300?format=json", "institution": "eBay Inc."}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3529", "url": null, "sourceid": 90, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=om4H7AI2hc", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 823, "modified": "2026-03-23T21:52:43.982129-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=om4H7AI2hc", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "20", "related_events": ["http://mlsys.org/api/miniconf/events/3752?format=json"], "related_events_ids": [3752]}, {"id": 3752, "uid": "8613985ec49eb8f757ae6439e879bb2a", "name": "Meeting SLOs, Slashing Hours: Automated Enterprise LLM Optimization with OptiKIT", "authors": [{"id": 25907, "fullname": "Nicholas Santavas", "url": "http://mlsys.org/api/miniconf/users/25907?format=json", "institution": "eBay"}, {"id": 27293, "fullname": "Kareem Eissa", "url": "http://mlsys.org/api/miniconf/users/27293?format=json", "institution": "Siemens Healthineers"}, {"id": 27294, "fullname": "Patrycja Cieplicka", "url": "http://mlsys.org/api/miniconf/users/27294?format=json", "institution": null}, {"id": 27295, "fullname": "Piotr Florek", "url": "http://mlsys.org/api/miniconf/users/27295?format=json", "institution": ""}, {"id": 27296, "fullname": "Matteo Nulli", "url": "http://mlsys.org/api/miniconf/users/27296?format=json", "institution": "eBay Inc."}, {"id": 27297, "fullname": "Stefan Vasilev", "url": "http://mlsys.org/api/miniconf/users/27297?format=json", "institution": "eBay Inc."}, {"id": 27298, "fullname": "Seyyed Hashemi", "url": "http://mlsys.org/api/miniconf/users/27298?format=json", "institution": "eBay Inc."}, {"id": 27299, "fullname": "Antonios Gasteratos", "url": "http://mlsys.org/api/miniconf/users/27299?format=json", "institution": "Dimocritus University of Thrace"}, {"id": 27300, "fullname": "Shahram Khadivi", "url": "http://mlsys.org/api/miniconf/users/27300?format=json", "institution": "eBay Inc."}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: LLM Serving 6", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3752", "url": null, "sourceid": -90, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T13:45:00-07:00", "endtime": "2026-05-21T14:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3709?format=json", "parent_id": 3709, "eventmedia": [{"id": 1108, "modified": "2026-05-15T14:33:05.371823-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3752.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3529?format=json"], "related_events_ids": [3529]}, {"id": 3811, "uid": "d09bf41544a3365a46c9077ebb5e35c3", "name": "G-HEMP: FAST MULTI-GPU PRIVATE INFERENCE FOR LARGE-SCALE GCNS WITH HOMOMORPHIC ENCRYPTION", "authors": [{"id": 27655, "fullname": "Ran Ran", "url": "http://mlsys.org/api/miniconf/users/27655?format=json", "institution": "North Carolina State University"}, {"id": 27656, "fullname": "Zhaoting Gong", "url": "http://mlsys.org/api/miniconf/users/27656?format=json", "institution": "North Carolina State University"}, {"id": 27657, "fullname": "Zhaowei Li", "url": "http://mlsys.org/api/miniconf/users/27657?format=json", "institution": "North Carolina State University"}, {"id": 27658, "fullname": "Xianting Lu", "url": "http://mlsys.org/api/miniconf/users/27658?format=json", "institution": "North Carolina State University"}, {"id": 27659, "fullname": "Jiajia Li", "url": "http://mlsys.org/api/miniconf/users/27659?format=json", "institution": "North Carolina State University"}, {"id": 27660, "fullname": "Wujie Wen", "url": "http://mlsys.org/api/miniconf/users/27660?format=json", "institution": "North Carolina State University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Security and Privacy", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3811", "url": null, "sourceid": -75, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T16:30:00-07:00", "endtime": "2026-05-19T16:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3673?format=json", "parent_id": 3673, "eventmedia": [{"id": 1231, "modified": "2026-05-19T14:14:12.774535-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3811.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3588?format=json"], "related_events_ids": [3588]}, {"id": 3519, "uid": "34173cb38f07f89ddbebc2ac9128303f", "name": "MLCommons Chakra: Advancing Performance Benchmarking and Co-design using Standardized Execution Traces", "authors": [{"id": 27214, "fullname": "Srinivas", "url": "http://mlsys.org/api/miniconf/users/27214?format=json", "institution": "NVIDIA"}, {"id": 27225, "fullname": "Andrey Balogh", "url": "http://mlsys.org/api/miniconf/users/27225?format=json", "institution": ""}, {"id": 27227, "fullname": "Brad B", "url": "http://mlsys.org/api/miniconf/users/27227?format=json", "institution": ""}, {"id": 27216, "fullname": "Brian Coutinho", "url": "http://mlsys.org/api/miniconf/users/27216?format=json", "institution": null}, {"id": 20878, "fullname": "Louis Feng", "url": "http://mlsys.org/api/miniconf/users/20878?format=json", "institution": "University of California, Davis"}, {"id": 27217, "fullname": "Sheng Fu", "url": "http://mlsys.org/api/miniconf/users/27217?format=json", "institution": null}, {"id": 27218, "fullname": "Sanshan Gao", "url": "http://mlsys.org/api/miniconf/users/27218?format=json", "institution": null}, {"id": 27231, "fullname": "Mehryar Garakani", "url": "http://mlsys.org/api/miniconf/users/27231?format=json", "institution": null}, {"id": 27215, "fullname": "Taekyung Heo", "url": "http://mlsys.org/api/miniconf/users/27215?format=json", "institution": null}, {"id": 14827, "fullname": "David Kanter", "url": "http://mlsys.org/api/miniconf/users/14827?format=json", "institution": "MLCommons"}, {"id": 27220, "fullname": "Josh Ladd", "url": "http://mlsys.org/api/miniconf/users/27220?format=json", "institution": null}, {"id": 27224, "fullname": "Ziwei Li", "url": "http://mlsys.org/api/miniconf/users/27224?format=json", "institution": null}, {"id": 28956, "fullname": "Winston Liu", "url": "http://mlsys.org/api/miniconf/users/28956?format=json", "institution": "Keysight Technologies"}, {"id": 16517, "fullname": "Changhai Man", "url": "http://mlsys.org/api/miniconf/users/16517?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27226, "fullname": "Dan Mihailescu", "url": "http://mlsys.org/api/miniconf/users/27226?format=json", "institution": "Keysight Technologies"}, {"id": 27228, "fullname": "Spandan More", "url": "http://mlsys.org/api/miniconf/users/27228?format=json", "institution": "AMD"}, {"id": 27221, "fullname": "Joongun Park", "url": "http://mlsys.org/api/miniconf/users/27221?format=json", "institution": null}, {"id": 27230, "fullname": "Ashwin Ramachandran", "url": "http://mlsys.org/api/miniconf/users/27230?format=json", "institution": ""}, {"id": 26285, "fullname": "Vinay Ramakrishnaiah", "url": "http://mlsys.org/api/miniconf/users/26285?format=json", "institution": "AMD"}, {"id": 27229, "fullname": "Saeed Rashidi", "url": "http://mlsys.org/api/miniconf/users/27229?format=json", "institution": "Meta"}, {"id": 10754, "fullname": "Vijay Janapa Reddi", "url": "http://mlsys.org/api/miniconf/users/10754?format=json", "institution": "Harvard University"}, {"id": 14774, "fullname": "Puneet Sharma", "url": "http://mlsys.org/api/miniconf/users/14774?format=json", "institution": "HP Labs"}, {"id": 27219, "fullname": "Phio Tian", "url": "http://mlsys.org/api/miniconf/users/27219?format=json", "institution": null}, {"id": 14298, "fullname": "William Won", "url": "http://mlsys.org/api/miniconf/users/14298?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27142, "fullname": "Hanjiang Wu", "url": "http://mlsys.org/api/miniconf/users/27142?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27223, "fullname": "Huan Xu", "url": "http://mlsys.org/api/miniconf/users/27223?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27222, "fullname": "Jinsun Yoo", "url": "http://mlsys.org/api/miniconf/users/27222?format=json", "institution": "Georgia Institute of Technology"}, {"id": 11662, "fullname": "Tushar Krishna", "url": "http://mlsys.org/api/miniconf/users/11662?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3519", "url": null, "sourceid": 30, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=s2WcSv2Hzt", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 813, "modified": "2026-03-23T21:52:43.622745-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=s2WcSv2Hzt", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "40", "related_events": ["http://mlsys.org/api/miniconf/events/3742?format=json"], "related_events_ids": [3742]}, {"id": 3575, "uid": "d3d9446802a44259755d38e6d163e820", "name": "db-SP: Accelerating Sparse Attention for Visual Generative Models with Dual-Balanced Sequence Parallelism", "authors": [{"id": 25683, "fullname": "Siqi Chen", "url": "http://mlsys.org/api/miniconf/users/25683?format=json", "institution": "Tsinghua University"}, {"id": 15899, "fullname": "Ke Hong", "url": "http://mlsys.org/api/miniconf/users/15899?format=json", "institution": "Tsinghua University"}, {"id": 27616, "fullname": "Tianchen Zhao", "url": "http://mlsys.org/api/miniconf/users/27616?format=json", "institution": "Tsinghua University, Tsinghua University"}, {"id": 27617, "fullname": "Ruiqi Xie", "url": "http://mlsys.org/api/miniconf/users/27617?format=json", "institution": "Tsinghua University"}, {"id": 27618, "fullname": "Zhenhua Zhu", "url": "http://mlsys.org/api/miniconf/users/27618?format=json", "institution": "Tsinghua University, Tsinghua University"}, {"id": 27619, "fullname": "Xudong Zhang", "url": "http://mlsys.org/api/miniconf/users/27619?format=json", "institution": "Tsinghua University, Tsinghua University"}, {"id": 17647, "fullname": "Yu Wang", "url": "http://mlsys.org/api/miniconf/users/17647?format=json", "institution": "Tsinghua University, Tsinghua University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3575", "url": null, "sourceid": 10, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=XgKteNxNe0", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 869, "modified": "2026-03-23T21:52:45.881732-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=XgKteNxNe0", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "8", "related_events": ["http://mlsys.org/api/miniconf/events/3798?format=json"], "related_events_ids": [3798]}, {"id": 3766, "uid": "f899139df5e1059396431415e770c6dd", "name": "Beat the long tail: Distribution-Aware Speculative Decoding for RL Training", "authors": [{"id": 21038, "fullname": "Zelei Shao", "url": "http://mlsys.org/api/miniconf/users/21038?format=json", "institution": "Together AI"}, {"id": 27361, "fullname": "Vikranth Srivatsa", "url": "http://mlsys.org/api/miniconf/users/27361?format=json", "institution": "University of California, San Diego"}, {"id": 27362, "fullname": "Sanjana Srivastava", "url": "http://mlsys.org/api/miniconf/users/27362?format=json", "institution": null}, {"id": 25635, "fullname": "Qingyang Wu", "url": "http://mlsys.org/api/miniconf/users/25635?format=json", "institution": "Together AI"}, {"id": 27254, "fullname": "Alpay Ariyak", "url": "http://mlsys.org/api/miniconf/users/27254?format=json", "institution": null}, {"id": 23865, "fullname": "Xiaoxia Wu", "url": "http://mlsys.org/api/miniconf/users/23865?format=json", "institution": "TogtherAI"}, {"id": 18639, "fullname": "Ameen Patel", "url": "http://mlsys.org/api/miniconf/users/18639?format=json", "institution": "Together.ai"}, {"id": 27251, "fullname": "Jue Wang", "url": "http://mlsys.org/api/miniconf/users/27251?format=json", "institution": "Together AI"}, {"id": 27363, "fullname": "Percy Liang", "url": "http://mlsys.org/api/miniconf/users/27363?format=json", "institution": "Stanford University"}, {"id": 18765, "fullname": "Tri Dao", "url": "http://mlsys.org/api/miniconf/users/18765?format=json", "institution": "Princeton University, Together AI"}, {"id": 18868, "fullname": "Ce Zhang", "url": "http://mlsys.org/api/miniconf/users/18868?format=json", "institution": null}, {"id": 26292, "fullname": "Yiying Zhang", "url": "http://mlsys.org/api/miniconf/users/26292?format=json", "institution": "UCSD and GenseeAI"}, {"id": 18231, "fullname": "Ben Athiwaratkun", "url": "http://mlsys.org/api/miniconf/users/18231?format=json", "institution": null}, {"id": 24298, "fullname": "Chenfeng Xu", "url": "http://mlsys.org/api/miniconf/users/24298?format=json", "institution": "Together AI/UT Austin"}, {"id": 27250, "fullname": "Junxiong Wang", "url": "http://mlsys.org/api/miniconf/users/27250?format=json", "institution": "TogetherAI"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3766", "url": null, "sourceid": -100, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T16:30:00-07:00", "endtime": "2026-05-20T16:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3692?format=json", "parent_id": 3692, "eventmedia": [{"id": 1145, "modified": "2026-05-16T00:09:05.426924-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3766.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3543?format=json"], "related_events_ids": [3543]}, {"id": 3846, "uid": "1f0e3dad99908345f7439f8ffabdffc4", "name": "HELIOS : Adaptive Model And Early-Exit Selection for Efficient LLM Inference Serving", "authors": [{"id": 25962, "fullname": "Avinash Kumar", "url": "http://mlsys.org/api/miniconf/users/25962?format=json", "institution": "The University of Texas at Austin"}, {"id": 19188, "fullname": "Shashank Nag", "url": "http://mlsys.org/api/miniconf/users/19188?format=json", "institution": "The University of Texas at Austin"}, {"id": 27844, "fullname": "Jason Clemons", "url": "http://mlsys.org/api/miniconf/users/27844?format=json", "institution": "NVIDIA"}, {"id": 12633, "fullname": "LIZY JOHn", "url": "http://mlsys.org/api/miniconf/users/12633?format=json", "institution": "UT-Austin"}, {"id": 27845, "fullname": "Poulami Das", "url": "http://mlsys.org/api/miniconf/users/27845?format=json", "institution": "University of Texas at Austin"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Efficient ML", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3846", "url": null, "sourceid": -19, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T13:00:00-07:00", "endtime": "2026-05-21T13:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3710?format=json", "parent_id": 3710, "eventmedia": [{"id": 1111, "modified": "2026-05-15T14:44:24.526689-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3846.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3623?format=json"], "related_events_ids": [3623]}, {"id": 3798, "uid": "d3d9446802a44259755d38e6d163e820", "name": "db-SP: Accelerating Sparse Attention for Visual Generative Models with Dual-Balanced Sequence Parallelism", "authors": [{"id": 25683, "fullname": "Siqi Chen", "url": "http://mlsys.org/api/miniconf/users/25683?format=json", "institution": "Tsinghua University"}, {"id": 15899, "fullname": "Ke Hong", "url": "http://mlsys.org/api/miniconf/users/15899?format=json", "institution": "Tsinghua University"}, {"id": 27616, "fullname": "Tianchen Zhao", "url": "http://mlsys.org/api/miniconf/users/27616?format=json", "institution": "Tsinghua University, Tsinghua University"}, {"id": 27617, "fullname": "Ruiqi Xie", "url": "http://mlsys.org/api/miniconf/users/27617?format=json", "institution": "Tsinghua University"}, {"id": 27618, "fullname": "Zhenhua Zhu", "url": "http://mlsys.org/api/miniconf/users/27618?format=json", "institution": "Tsinghua University, Tsinghua University"}, {"id": 27619, "fullname": "Xudong Zhang", "url": "http://mlsys.org/api/miniconf/users/27619?format=json", "institution": "Tsinghua University, Tsinghua University"}, {"id": 17647, "fullname": "Yu Wang", "url": "http://mlsys.org/api/miniconf/users/17647?format=json", "institution": "Tsinghua University, Tsinghua University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Multimodal and Generative Models", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3798", "url": null, "sourceid": -10, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T13:15:00-07:00", "endtime": "2026-05-19T13:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3669?format=json", "parent_id": 3669, "eventmedia": [{"id": 1075, "modified": "2026-05-15T07:06:49.608220-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3798.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3575?format=json"], "related_events_ids": [3575]}, {"id": 3510, "uid": "6f4922f45568161a8cdf4ad2299f6d23", "name": "Accelerating Large-Scale Reasoning Model Inference with Sparse Self-Speculative Decoding", "authors": [{"id": 20906, "fullname": "Yilong Zhao", "url": "http://mlsys.org/api/miniconf/users/20906?format=json", "institution": "University of California, Berkeley"}, {"id": 21005, "fullname": "Jiaming Tang", "url": "http://mlsys.org/api/miniconf/users/21005?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 17683, "fullname": "Kan Zhu", "url": "http://mlsys.org/api/miniconf/users/17683?format=json", "institution": "University of Washington"}, {"id": 12026, "fullname": "Zihao Ye", "url": "http://mlsys.org/api/miniconf/users/12026?format=json", "institution": "NVIDIA"}, {"id": 27178, "fullname": "Chi-Chih Chang", "url": "http://mlsys.org/api/miniconf/users/27178?format=json", "institution": "Cornell University"}, {"id": 27179, "fullname": "Chaofan Lin", "url": "http://mlsys.org/api/miniconf/users/27179?format=json", "institution": "Tsinghua University"}, {"id": 27180, "fullname": "Jongseok Park", "url": "http://mlsys.org/api/miniconf/users/27180?format=json", "institution": "University of California, Berkeley"}, {"id": 17675, "fullname": "Guangxuan Xiao", "url": "http://mlsys.org/api/miniconf/users/17675?format=json", "institution": "MIT"}, {"id": 17625, "fullname": "Mohamed Abdelfattah", "url": "http://mlsys.org/api/miniconf/users/17625?format=json", "institution": "Cornell University"}, {"id": 11143, "fullname": "Mingyu Gao", "url": "http://mlsys.org/api/miniconf/users/11143?format=json", "institution": "Tsinghua University"}, {"id": 17670, "fullname": "Baris Kasikci", "url": "http://mlsys.org/api/miniconf/users/17670?format=json", "institution": "University of Washington"}, {"id": 12133, "fullname": "Song Han", "url": "http://mlsys.org/api/miniconf/users/12133?format=json", "institution": "MIT"}, {"id": 11118, "fullname": "Ion Stoica", "url": "http://mlsys.org/api/miniconf/users/11118?format=json", "institution": "UC Berkeley"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3510", "url": null, "sourceid": 18, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=yeqrwcWjPu", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 804, "modified": "2026-03-23T21:52:43.314747-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=yeqrwcWjPu", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "10", "related_events": ["http://mlsys.org/api/miniconf/events/3733?format=json"], "related_events_ids": [3733]}, {"id": 3545, "uid": "a5bfc9e07964f8dddeb95fc584cd965d", "name": "ExecuTorch - A Unified PyTorch Solution to Run ML Models On-Device", "authors": [{"id": 28448, "fullname": "Mergen Nachin", "url": "http://mlsys.org/api/miniconf/users/28448?format=json", "institution": "Meta"}, {"id": 28957, "fullname": "Digant Desai", "url": "http://mlsys.org/api/miniconf/users/28957?format=json", "institution": "Facebook"}, {"id": 27381, "fullname": "Sicheng Jia", "url": "http://mlsys.org/api/miniconf/users/27381?format=json", "institution": "Meta, Inc."}, {"id": 25593, "fullname": "Chen Lai", "url": "http://mlsys.org/api/miniconf/users/25593?format=json", "institution": "Meta"}, {"id": 27372, "fullname": "Mengwei Liu", "url": "http://mlsys.org/api/miniconf/users/27372?format=json", "institution": "Meta Platforms Inc"}, {"id": 27369, "fullname": "Jacob Szwejbka", "url": "http://mlsys.org/api/miniconf/users/27369?format=json", "institution": null}, {"id": 28486, "fullname": "Raziel Alvarez", "url": "http://mlsys.org/api/miniconf/users/28486?format=json", "institution": null}, {"id": 28487, "fullname": "Robert Ascani", "url": "http://mlsys.org/api/miniconf/users/28487?format=json", "institution": "Meta"}, {"id": 27393, "fullname": "Dave Bort", "url": "http://mlsys.org/api/miniconf/users/27393?format=json", "institution": null}, {"id": 27379, "fullname": "Manuel Candales", "url": "http://mlsys.org/api/miniconf/users/27379?format=json", "institution": "Meta"}, {"id": 28488, "fullname": "Andrew Caples", "url": "http://mlsys.org/api/miniconf/users/28488?format=json", "institution": null}, {"id": 27384, "fullname": "Yanan Cao", "url": "http://mlsys.org/api/miniconf/users/27384?format=json", "institution": "Meta Platforms"}, {"id": 27385, "fullname": "Zhengxu Chen", "url": "http://mlsys.org/api/miniconf/users/27385?format=json", "institution": null}, {"id": 28450, "fullname": "Soumith Chintala", "url": "http://mlsys.org/api/miniconf/users/28450?format=json", "institution": "Thinking Machines"}, {"id": 27367, "fullname": "Gregory Comer", "url": "http://mlsys.org/api/miniconf/users/27367?format=json", "institution": ""}, {"id": 27375, "fullname": "Tanvir Islam", "url": "http://mlsys.org/api/miniconf/users/27375?format=json", "institution": null}, {"id": 28489, "fullname": "Songhao Jia", "url": "http://mlsys.org/api/miniconf/users/28489?format=json", "institution": "Meta"}, {"id": 27394, "fullname": "Tarun Karuturi", "url": "http://mlsys.org/api/miniconf/users/27394?format=json", "institution": null}, {"id": 28965, "fullname": "Jack Khuu", "url": "http://mlsys.org/api/miniconf/users/28965?format=json", "institution": "Meta"}, {"id": 27366, "fullname": "Abhinay Kukkadapu", "url": "http://mlsys.org/api/miniconf/users/27366?format=json", "institution": null}, {"id": 27387, "fullname": "Tugsbayasgalan Manlaibaatar", "url": "http://mlsys.org/api/miniconf/users/27387?format=json", "institution": null}, {"id": 27390, "fullname": "Andrew Or", "url": "http://mlsys.org/api/miniconf/users/27390?format=json", "institution": "Facebook"}, {"id": 27370, "fullname": "Kimish Patel", "url": "http://mlsys.org/api/miniconf/users/27370?format=json", "institution": null}, {"id": 27373, "fullname": "Siddartha Pothapragada", "url": "http://mlsys.org/api/miniconf/users/27373?format=json", "institution": null}, {"id": 28451, "fullname": "Lucy Qiu", "url": "http://mlsys.org/api/miniconf/users/28451?format=json", "institution": "Meta"}, {"id": 27396, "fullname": "Supriya Rao", "url": "http://mlsys.org/api/miniconf/users/27396?format=json", "institution": "Facebook"}, {"id": 27395, "fullname": "Orion Reblitz-Richardson", "url": "http://mlsys.org/api/miniconf/users/27395?format=json", "institution": null}, {"id": 27392, "fullname": "Max Ren", "url": "http://mlsys.org/api/miniconf/users/27392?format=json", "institution": null}, {"id": 27380, "fullname": "Scott Roy", "url": "http://mlsys.org/api/miniconf/users/27380?format=json", "institution": "Meta"}, {"id": 27376, "fullname": "Anthony Shoumikhin", "url": "http://mlsys.org/api/miniconf/users/27376?format=json", "institution": null}, {"id": 27383, "fullname": "Scott Wolchok", "url": "http://mlsys.org/api/miniconf/users/27383?format=json", "institution": null}, {"id": 27397, "fullname": "Guang Yang", "url": "http://mlsys.org/api/miniconf/users/27397?format=json", "institution": null}, {"id": 27388, "fullname": "Angela Yi", "url": "http://mlsys.org/api/miniconf/users/27388?format=json", "institution": "Stanford University"}, {"id": 27391, "fullname": "Martin Yuan", "url": "http://mlsys.org/api/miniconf/users/27391?format=json", "institution": null}, {"id": 27378, "fullname": "Hansong Zhang", "url": "http://mlsys.org/api/miniconf/users/27378?format=json", "institution": "Meta Platforms"}, {"id": 27368, "fullname": "Jack Zhang", "url": "http://mlsys.org/api/miniconf/users/27368?format=json", "institution": null}, {"id": 27389, "fullname": "Zhenrui Zhang", "url": "http://mlsys.org/api/miniconf/users/27389?format=json", "institution": "Facebook"}, {"id": 27386, "fullname": "Shunting Zhang", "url": "http://mlsys.org/api/miniconf/users/27386?format=json", "institution": ""}, {"id": 27365, "fullname": "Cemal Bilgin", "url": "http://mlsys.org/api/miniconf/users/27365?format=json", "institution": "Meta"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3545", "url": "https://github.com/pytorch/executorch", "sourceid": 37, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=jmE5nwC9kb", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 839, "modified": "2026-03-23T21:52:44.608714-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=jmE5nwC9kb", "resourcetype": "UriEventmedia"}, {"id": 1020, "file": "/media/PosterPDFs/MLSys%202026/3545.png", "modified": "2026-05-15T14:49:49.901287-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1021, "file": "/media/PosterPDFs/MLSys%202026/3545-thumb.png", "modified": "2026-05-13T22:25:07.739491-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "4", "related_events": ["http://mlsys.org/api/miniconf/events/3768?format=json"], "related_events_ids": [3768]}, {"id": 3565, "uid": "44f683a84163b3523afe57c2e008bc8c", "name": "Locality-Aware Beam Scheduling for Efficient Test-Time Compute with a Consumer-grade GPU", "authors": [{"id": 25535, "fullname": "Hsing-Ti Wang", "url": "http://mlsys.org/api/miniconf/users/25535?format=json", "institution": "NTU ECLab"}, {"id": 26242, "fullname": "Hung-Tso Shiao", "url": "http://mlsys.org/api/miniconf/users/26242?format=json", "institution": "National Taiwan University"}, {"id": 27580, "fullname": "Chia-Lin Yang", "url": "http://mlsys.org/api/miniconf/users/27580?format=json", "institution": "Department of computer science and informational engineering, National Taiwan University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3565", "url": null, "sourceid": 62, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=dTo8jAXm9K", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 859, "modified": "2026-03-23T21:52:45.475684-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=dTo8jAXm9K", "resourcetype": "UriEventmedia"}, {"id": 1146, "file": "/media/PosterPDFs/MLSys%202026/3565.png", "modified": "2026-05-16T00:12:36.261546-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1147, "file": "/media/PosterPDFs/MLSys%202026/3565-thumb.png", "modified": "2026-05-16T00:12:36.380996-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "7", "related_events": ["http://mlsys.org/api/miniconf/events/3788?format=json"], "related_events_ids": [3788]}, {"id": 3843, "uid": "03afdbd66e7929b125f8597834fa83a4", "name": "PROMPTS: PeRformance Optimization via Multi-Agent Planning for LLM Training and Serving", "authors": [{"id": 27835, "fullname": "Yuran Ding", "url": "http://mlsys.org/api/miniconf/users/27835?format=json", "institution": "Google"}, {"id": 27836, "fullname": "Ruobing Han", "url": "http://mlsys.org/api/miniconf/users/27836?format=json", "institution": "Google DeepMind"}, {"id": 27837, "fullname": "Xiaofan Zhang", "url": "http://mlsys.org/api/miniconf/users/27837?format=json", "institution": "Google"}, {"id": 27838, "fullname": "Xinwei Chen", "url": "http://mlsys.org/api/miniconf/users/27838?format=json", "institution": "Waymo"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Agentic AI/MLSys", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3843", "url": null, "sourceid": -63, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T08:45:00-07:00", "endtime": "2026-05-21T09:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3700?format=json", "parent_id": 3700, "eventmedia": [{"id": 1100, "modified": "2026-05-15T13:42:46.872129-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3843.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3620?format=json"], "related_events_ids": [3620]}, {"id": 3622, "uid": "3295c76acbf4caaed33c36b1b5fc2cb1", "name": "ParallelKittens: Systematic and Practical Simplification of Multi-GPU AI Kernels", "authors": [{"id": 27842, "fullname": "Stuart H. Sul", "url": "http://mlsys.org/api/miniconf/users/27842?format=json", "institution": "Stanford University"}, {"id": 27192, "fullname": "Simran Arora", "url": "http://mlsys.org/api/miniconf/users/27192?format=json", "institution": "Computer Science Department, Stanford University"}, {"id": 27843, "fullname": "Benjamin Spector", "url": "http://mlsys.org/api/miniconf/users/27843?format=json", "institution": "Stanford University"}, {"id": 11444, "fullname": "Christopher R\u00e9", "url": "http://mlsys.org/api/miniconf/users/11444?format=json", "institution": "Stanford University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3622", "url": null, "sourceid": 66, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=Cv5e5uRXFb", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 916, "modified": "2026-03-23T21:52:47.696063-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=Cv5e5uRXFb", "resourcetype": "UriEventmedia"}, {"id": 1098, "file": "/media/PosterPDFs/MLSys%202026/3622.png", "modified": "2026-05-15T13:30:15.669165-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1099, "file": "/media/PosterPDFs/MLSys%202026/3622-thumb.png", "modified": "2026-05-15T13:44:48.182159-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "33", "related_events": ["http://mlsys.org/api/miniconf/events/3845?format=json"], "related_events_ids": [3845]}, {"id": 3806, "uid": "98f13708210194c475687be6106a3b84", "name": "AgenticCache: Cache-Driven Asynchronous Planning for Embodied AI Agents", "authors": [{"id": 25550, "fullname": "Hojoon Kim", "url": "http://mlsys.org/api/miniconf/users/25550?format=json", "institution": "Seoul National University"}, {"id": 27643, "fullname": "Yuheng Wu", "url": "http://mlsys.org/api/miniconf/users/27643?format=json", "institution": "Stanford University"}, {"id": 27644, "fullname": "Thierry Tambe", "url": "http://mlsys.org/api/miniconf/users/27644?format=json", "institution": "Stanford University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Agentic AI 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3806", "url": null, "sourceid": -20, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T15:00:00-07:00", "endtime": "2026-05-19T15:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3674?format=json", "parent_id": 3674, "eventmedia": [{"id": 1169, "modified": "2026-05-19T14:25:08.320838-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3806_NIaKgZ6.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3583?format=json"], "related_events_ids": [3583]}, {"id": 3753, "uid": "f4b9ec30ad9f68f89b29639786cb62ef", "name": "Matrix: Peer-to-Peer Multi-Agent Synthetic Data Generation Framework", "authors": [{"id": 27301, "fullname": "Dong Wang", "url": "http://mlsys.org/api/miniconf/users/27301?format=json", "institution": "Meta FAIR"}, {"id": 27302, "fullname": "Yang Li", "url": "http://mlsys.org/api/miniconf/users/27302?format=json", "institution": "Facebook"}, {"id": 27303, "fullname": "Ansong Ni", "url": "http://mlsys.org/api/miniconf/users/27303?format=json", "institution": "Meta AI"}, {"id": 27304, "fullname": "Ching-Feng Yeh", "url": "http://mlsys.org/api/miniconf/users/27304?format=json", "institution": "Facebook"}, {"id": 27305, "fullname": "Youssef Emad", "url": "http://mlsys.org/api/miniconf/users/27305?format=json", "institution": "Facebook"}, {"id": 27306, "fullname": "Xinjie Lei", "url": "http://mlsys.org/api/miniconf/users/27306?format=json", "institution": "Meta"}, {"id": 27307, "fullname": "Liam Robbins", "url": "http://mlsys.org/api/miniconf/users/27307?format=json", "institution": "FAIR"}, {"id": 27308, "fullname": "Karthik Padthe", "url": "http://mlsys.org/api/miniconf/users/27308?format=json", "institution": "Meta AI"}, {"id": 27309, "fullname": "Hu Xu", "url": "http://mlsys.org/api/miniconf/users/27309?format=json", "institution": "FAIR, Foundation"}, {"id": 27310, "fullname": "Xian Li", "url": "http://mlsys.org/api/miniconf/users/27310?format=json", "institution": "Facebook AI"}, {"id": 27311, "fullname": "Asli Celikyilmaz", "url": "http://mlsys.org/api/miniconf/users/27311?format=json", "institution": "FAIR"}, {"id": 27312, "fullname": "Ramya Raghavendra", "url": "http://mlsys.org/api/miniconf/users/27312?format=json", "institution": "Facebook"}, {"id": 27313, "fullname": "LIFEI HUANG", "url": "http://mlsys.org/api/miniconf/users/27313?format=json", "institution": "Facebook"}, {"id": 27314, "fullname": "Carole-Jean Wu", "url": "http://mlsys.org/api/miniconf/users/27314?format=json", "institution": "Meta"}, {"id": 27315, "fullname": "Shang-Wen Li", "url": "http://mlsys.org/api/miniconf/users/27315?format=json", "institution": "Facebook"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Agentic AI 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3753", "url": null, "sourceid": -94, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T14:00:00-07:00", "endtime": "2026-05-19T14:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3668?format=json", "parent_id": 3668, "eventmedia": [{"id": 980, "modified": "2026-05-10T19:35:01.378852-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3753_h4L43wQ.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3530?format=json"], "related_events_ids": [3530]}, {"id": 3773, "uid": "f457c545a9ded88f18ecee47145a72c0", "name": "SwiftGS: Algorithm and System Co-Optimization for Fast 3D Gaussian Splatting on GPUs", "authors": [{"id": 25558, "fullname": "Lingjun Gao", "url": "http://mlsys.org/api/miniconf/users/25558?format=json", "institution": "Imperial College London"}, {"id": 27429, "fullname": "Zhican Wang", "url": "http://mlsys.org/api/miniconf/users/27429?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 27430, "fullname": "Zhiwen Mo", "url": "http://mlsys.org/api/miniconf/users/27430?format=json", "institution": "Imperial College London"}, {"id": 27431, "fullname": "Hongxiang Fan", "url": "http://mlsys.org/api/miniconf/users/27431?format=json", "institution": "Imperial College London"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Multimodal and Generative Models", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3773", "url": null, "sourceid": -49, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T13:30:00-07:00", "endtime": "2026-05-19T13:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3669?format=json", "parent_id": 3669, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3550?format=json"], "related_events_ids": [3550]}, {"id": 3795, "uid": "d9d4f495e875a2e075a1a4a6e1b9770f", "name": "BOute: Cost-Efficient LLM Serving with Heterogeneous LLMs and GPUs via Multi-Objective Bayesian Optimization", "authors": [{"id": 21099, "fullname": "YOUHE JIANG", "url": "http://mlsys.org/api/miniconf/users/21099?format=json", "institution": "University of Cambridge"}, {"id": 27606, "fullname": "Fangcheng Fu", "url": "http://mlsys.org/api/miniconf/users/27606?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 10630, "fullname": "Eiko Yoneki", "url": "http://mlsys.org/api/miniconf/users/10630?format=json", "institution": "University of Cambridge"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3795", "url": null, "sourceid": -46, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T09:00:00-07:00", "endtime": "2026-05-20T09:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3678?format=json", "parent_id": 3678, "eventmedia": [{"id": 1101, "modified": "2026-05-15T13:55:06.253381-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3795.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3572?format=json"], "related_events_ids": [3572]}, {"id": 3796, "uid": "a1d0c6e83f027327d8461063f4ac58a6", "name": "TeleRAG: Efficient Retrieval-Augmented Generation Inference with Lookahead Retrieval", "authors": [{"id": 27607, "fullname": "Chien-Yu Lin", "url": "http://mlsys.org/api/miniconf/users/27607?format=json", "institution": "Meta"}, {"id": 26295, "fullname": "Keisuke Kamahori", "url": "http://mlsys.org/api/miniconf/users/26295?format=json", "institution": "University of Washington"}, {"id": 27608, "fullname": "Yiyu Liu", "url": "http://mlsys.org/api/miniconf/users/27608?format=json", "institution": "Harvard University"}, {"id": 27609, "fullname": "Xiaoxiang Shi", "url": "http://mlsys.org/api/miniconf/users/27609?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 27610, "fullname": "Madhav Kashyap", "url": "http://mlsys.org/api/miniconf/users/27610?format=json", "institution": "University of Washington"}, {"id": 27416, "fullname": "Yile Gu", "url": "http://mlsys.org/api/miniconf/users/27416?format=json", "institution": "Department of Computer Science, University of Washington"}, {"id": 27611, "fullname": "Rulin Shao", "url": "http://mlsys.org/api/miniconf/users/27611?format=json", "institution": "University of Washington"}, {"id": 12026, "fullname": "Zihao Ye", "url": "http://mlsys.org/api/miniconf/users/12026?format=json", "institution": "NVIDIA"}, {"id": 17683, "fullname": "Kan Zhu", "url": "http://mlsys.org/api/miniconf/users/17683?format=json", "institution": "University of Washington"}, {"id": 27612, "fullname": "Rohan Kadekodi", "url": "http://mlsys.org/api/miniconf/users/27612?format=json", "institution": "University of Washington"}, {"id": 17972, "fullname": "Stephanie Wang", "url": "http://mlsys.org/api/miniconf/users/17972?format=json", "institution": "UW &amp; Anyscale"}, {"id": 11122, "fullname": "Arvind Krishnamurthy", "url": "http://mlsys.org/api/miniconf/users/11122?format=json", "institution": "University of Washington"}, {"id": 11020, "fullname": "Luis Ceze", "url": "http://mlsys.org/api/miniconf/users/11020?format=json", "institution": "University of Washington and NVIDIA"}, {"id": 17670, "fullname": "Baris Kasikci", "url": "http://mlsys.org/api/miniconf/users/17670?format=json", "institution": "University of Washington"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Agentic AI 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3796", "url": "https://github.com/uw-syfi/TeleRAG", "sourceid": -42, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T15:15:00-07:00", "endtime": "2026-05-19T15:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3674?format=json", "parent_id": 3674, "eventmedia": [{"id": 1115, "modified": "2026-05-19T14:40:41.323772-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3796_JIkCNfh.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3573?format=json"], "related_events_ids": [3573]}, {"id": 3854, "uid": "d82c8d1619ad8176d665453cfb2e55f0", "name": "BLASST: Dynamic BLocked Attention Sparsity via Softmax Thresholding", "authors": [{"id": 27887, "fullname": "Jiayi Yuan", "url": "http://mlsys.org/api/miniconf/users/27887?format=json", "institution": "Rice University"}, {"id": 15623, "fullname": "Cameron Shinn", "url": "http://mlsys.org/api/miniconf/users/15623?format=json", "institution": "University of California, Davis"}, {"id": 27888, "fullname": "Kai Xu", "url": "http://mlsys.org/api/miniconf/users/27888?format=json", "institution": "NVIDIA"}, {"id": 27889, "fullname": "Jingze Cui", "url": "http://mlsys.org/api/miniconf/users/27889?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 27890, "fullname": "George Klimiashvili", "url": "http://mlsys.org/api/miniconf/users/27890?format=json", "institution": "NVIDIA"}, {"id": 27891, "fullname": "Guangxuan Xiao", "url": "http://mlsys.org/api/miniconf/users/27891?format=json", "institution": null}, {"id": 27892, "fullname": "Perkz Zheng", "url": "http://mlsys.org/api/miniconf/users/27892?format=json", "institution": "NVIDIA"}, {"id": 27893, "fullname": "Bo Li", "url": "http://mlsys.org/api/miniconf/users/27893?format=json", "institution": "NVIDIA"}, {"id": 27894, "fullname": "Zhou Yuxin", "url": "http://mlsys.org/api/miniconf/users/27894?format=json", "institution": "NVIDIA"}, {"id": 27895, "fullname": "Zhouhai Ye", "url": "http://mlsys.org/api/miniconf/users/27895?format=json", "institution": "NVIDIA"}, {"id": 27896, "fullname": "Weijie You", "url": "http://mlsys.org/api/miniconf/users/27896?format=json", "institution": "NVIDIA"}, {"id": 28473, "fullname": "Tian Zheng", "url": "http://mlsys.org/api/miniconf/users/28473?format=json", "institution": "NVIDIA"}, {"id": 28474, "fullname": "Dominic Brown", "url": "http://mlsys.org/api/miniconf/users/28474?format=json", "institution": "NVIDIA"}, {"id": 28475, "fullname": "Pengbo Wang", "url": "http://mlsys.org/api/miniconf/users/28475?format=json", "institution": "NVIDIA"}, {"id": 27339, "fullname": "Markus Hoehnerbach", "url": "http://mlsys.org/api/miniconf/users/27339?format=json", "institution": "Meta"}, {"id": 27897, "fullname": "Richard Cai", "url": "http://mlsys.org/api/miniconf/users/27897?format=json", "institution": "NVIDIA"}, {"id": 27898, "fullname": "Julien Demouth", "url": "http://mlsys.org/api/miniconf/users/27898?format=json", "institution": "University of Lorraine"}, {"id": 27899, "fullname": "John D. Owens", "url": "http://mlsys.org/api/miniconf/users/27899?format=json", "institution": "UC Davis"}, {"id": 27900, "fullname": "Xia Hu", "url": "http://mlsys.org/api/miniconf/users/27900?format=json", "institution": "Shanghai Artificial Intelligence Laboratory"}, {"id": 27901, "fullname": "Song Han", "url": "http://mlsys.org/api/miniconf/users/27901?format=json", "institution": null}, {"id": 25625, "fullname": "Timmy Liu", "url": "http://mlsys.org/api/miniconf/users/25625?format=json", "institution": "Nvidia"}, {"id": 12477, "fullname": "Huizi Mao", "url": "http://mlsys.org/api/miniconf/users/12477?format=json", "institution": "Stanford University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Best Paper Session", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3854", "url": "https://github.com/NVIDIA/TensorRT-LLM", "sourceid": -53, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T09:25:00-07:00", "endtime": "2026-05-19T09:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3659?format=json", "parent_id": 3659, "eventmedia": [{"id": 1121, "modified": "2026-05-15T17:46:29.937345-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3854.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3631?format=json"], "related_events_ids": [3631]}, {"id": 3738, "uid": "70efdf2ec9b086079795c442636b55fb", "name": "Ontology-Guided Long-Term Agent Memory for Conversational RAG", "authors": [{"id": 27197, "fullname": "Sharon Cao", "url": "http://mlsys.org/api/miniconf/users/27197?format=json", "institution": "Hill Research"}, {"id": 27198, "fullname": "Rui Li", "url": "http://mlsys.org/api/miniconf/users/27198?format=json", "institution": "Hill Research"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Agentic AI 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3738", "url": null, "sourceid": -17, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T15:45:00-07:00", "endtime": "2026-05-19T16:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3674?format=json", "parent_id": 3674, "eventmedia": [{"id": 959, "modified": "2026-05-01T19:48:38.465895-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3738.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3515?format=json"], "related_events_ids": [3515]}, {"id": 3744, "uid": "e4da3b7fbbce2345d7772b0674a318d5", "name": "TokenWeave: Efficient Compute-Communication Overlap for Distributed LLM Inference", "authors": [{"id": 19241, "fullname": "Raja Gond", "url": "http://mlsys.org/api/miniconf/users/19241?format=json", "institution": "Independent Researcher"}, {"id": 17734, "fullname": "Nipun Kwatra", "url": "http://mlsys.org/api/miniconf/users/17734?format=json", "institution": "Microsoft Research India"}, {"id": 16198, "fullname": "Ramachandran Ramjee", "url": "http://mlsys.org/api/miniconf/users/16198?format=json", "institution": "Microsoft Research"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3744", "url": "https://github.com/microsoft/tokenweave.git", "sourceid": -5, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T15:30:00-07:00", "endtime": "2026-05-19T15:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3675?format=json", "parent_id": 3675, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3521?format=json"], "related_events_ids": [3521]}, {"id": 3850, "uid": "3988c7f88ebcb58c6ce932b957b6f332", "name": "ProToken: Token-Level Attribution for Federated Large Language Models", "authors": [{"id": 27165, "fullname": "Waris Gill", "url": "http://mlsys.org/api/miniconf/users/27165?format=json", "institution": "Virginia Tech"}, {"id": 27856, "fullname": "Ahmad Humayun", "url": "http://mlsys.org/api/miniconf/users/27856?format=json", "institution": "Virginia Polytechnic Institute and State University"}, {"id": 20986, "fullname": "Ali Anwar", "url": "http://mlsys.org/api/miniconf/users/20986?format=json", "institution": "University of Minnesota"}, {"id": 27857, "fullname": "Muhammad Ali Gulzar", "url": "http://mlsys.org/api/miniconf/users/27857?format=json", "institution": "Virginia Tech"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Federated Learning", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3850", "url": null, "sourceid": -137, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T16:45:00-07:00", "endtime": "2026-05-19T17:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3672?format=json", "parent_id": 3672, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3627?format=json"], "related_events_ids": [3627]}, {"id": 3861, "uid": "c9f0f895fb98ab9159f51fd0297e236d", "name": "Charon: A Unified and Fine-Grained Simulator for Large-Scale LLM Training and Inference", "authors": [{"id": 25502, "fullname": "Mengtian Yang", "url": "http://mlsys.org/api/miniconf/users/25502?format=json", "institution": "ByteDance Seed"}, {"id": 27169, "fullname": "Zhekun Zhang", "url": "http://mlsys.org/api/miniconf/users/27169?format=json", "institution": "ByteDance Inc."}, {"id": 25517, "fullname": "Mingheng Wu", "url": "http://mlsys.org/api/miniconf/users/25517?format=json", "institution": "ByteDance Seed"}, {"id": 27965, "fullname": "jianwen yan", "url": "http://mlsys.org/api/miniconf/users/27965?format=json", "institution": ""}, {"id": 27966, "fullname": "Hanshi Sun", "url": "http://mlsys.org/api/miniconf/users/27966?format=json", "institution": "ByteDance Seed"}, {"id": 20944, "fullname": "Li-Wen Chang", "url": "http://mlsys.org/api/miniconf/users/20944?format=json", "institution": "ByteDance Inc."}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Benchmarks and Evaluation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3861", "url": null, "sourceid": -8, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T15:00:00-07:00", "endtime": "2026-05-21T15:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3714?format=json", "parent_id": 3714, "eventmedia": [{"id": 1117, "modified": "2026-05-20T23:17:09.204189-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3861_7kTIKEc.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3638?format=json"], "related_events_ids": [3638]}, {"id": 3803, "uid": "da4fb5c6e93e74d3df8527599fa62642", "name": "Zero redundancy distributed learning with differential privacy", "authors": [{"id": 27633, "fullname": "Zhiqi Bu", "url": "http://mlsys.org/api/miniconf/users/27633?format=json", "institution": "FAIR MSL"}, {"id": 27634, "fullname": "Justin Chiu", "url": "http://mlsys.org/api/miniconf/users/27634?format=json", "institution": "University of Washington"}, {"id": 27635, "fullname": "Ruixuan Liu", "url": "http://mlsys.org/api/miniconf/users/27635?format=json", "institution": "Emory University"}, {"id": 27636, "fullname": "Sheng Zha", "url": "http://mlsys.org/api/miniconf/users/27636?format=json", "institution": "Amazon"}, {"id": 27637, "fullname": "George Karypis", "url": "http://mlsys.org/api/miniconf/users/27637?format=json", "institution": "University of Minnesota, Minneapolis"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Federated Learning", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3803", "url": null, "sourceid": -120, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T17:45:00-07:00", "endtime": "2026-05-19T18:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3672?format=json", "parent_id": 3672, "eventmedia": [{"id": 1093, "modified": "2026-05-15T12:55:06.713294-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3803.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3580?format=json"], "related_events_ids": [3580]}, {"id": 3549, "uid": "182be0c5cdcd5072bb1864cdee4d3d6e", "name": "When Machine Learning Isn\u2019t Sure: Building Resilient ML-Based Computer Systems by Embracing Uncertainty", "authors": [{"id": 27421, "fullname": "Varun Gohil", "url": "http://mlsys.org/api/miniconf/users/27421?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 27422, "fullname": "Nevena Stojkovic", "url": "http://mlsys.org/api/miniconf/users/27422?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 27423, "fullname": "Noman Bashir", "url": "http://mlsys.org/api/miniconf/users/27423?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 28958, "fullname": "Sundar Dev", "url": "http://mlsys.org/api/miniconf/users/28958?format=json", "institution": "Google"}, {"id": 27425, "fullname": "Gaurang Upasani", "url": "http://mlsys.org/api/miniconf/users/27425?format=json", "institution": "Google"}, {"id": 27426, "fullname": "David Lo", "url": "http://mlsys.org/api/miniconf/users/27426?format=json", "institution": "Google"}, {"id": 27427, "fullname": "Parthasarathy Ranganathan", "url": "http://mlsys.org/api/miniconf/users/27427?format=json", "institution": "Google"}, {"id": 20861, "fullname": "Christina Delimitrou", "url": "http://mlsys.org/api/miniconf/users/20861?format=json", "institution": "Cornell University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3549", "url": null, "sourceid": 33, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=i0iOQL2MF5", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 843, "modified": "2026-03-23T21:52:44.765164-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=i0iOQL2MF5", "resourcetype": "UriEventmedia"}, {"id": 960, "file": "/media/PosterPDFs/MLSys%202026/3549.png", "modified": "2026-05-02T17:26:17.486394-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 961, "file": "/media/PosterPDFs/MLSys%202026/3549-thumb.png", "modified": "2026-05-14T19:28:12.211441-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "18", "related_events": ["http://mlsys.org/api/miniconf/events/3772?format=json"], "related_events_ids": [3772]}, {"id": 3810, "uid": "38b3eff8baf56627478ec76a704e9b52", "name": "ContextPilot: Fast Long-Context Inference via Context Reuse", "authors": [{"id": 25934, "fullname": "Yinsicheng Jiang", "url": "http://mlsys.org/api/miniconf/users/25934?format=json", "institution": "University of Edinburgh"}, {"id": 27651, "fullname": "Yeqi Huang", "url": "http://mlsys.org/api/miniconf/users/27651?format=json", "institution": "University of Edinburgh, University of Edinburgh"}, {"id": 27652, "fullname": "Liang Cheng", "url": "http://mlsys.org/api/miniconf/users/27652?format=json", "institution": "University of Edinburgh"}, {"id": 25084, "fullname": "Cheng Deng", "url": "http://mlsys.org/api/miniconf/users/25084?format=json", "institution": "The University of Edinburgh"}, {"id": 27653, "fullname": "Xuan Sun", "url": "http://mlsys.org/api/miniconf/users/27653?format=json", "institution": "University of Edinburgh, University of Edinburgh"}, {"id": 27654, "fullname": "Luo Mai", "url": "http://mlsys.org/api/miniconf/users/27654?format=json", "institution": "Edinburgh University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Multimodal and Generative Models", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3810", "url": "https://github.com/EfficientContext/ContextPilot", "sourceid": -101, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T13:00:00-07:00", "endtime": "2026-05-19T13:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3669?format=json", "parent_id": 3669, "eventmedia": [{"id": 1059, "modified": "2026-05-19T13:54:13.029400-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3810_J3tlVOU.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3587?format=json"], "related_events_ids": [3587]}, {"id": 3563, "uid": "093f65e080a295f8076b1c5722a46aa2", "name": "LEANN: A Low-Storage Overhead Vector Index", "authors": [{"id": 27567, "fullname": "Yichuan Wang", "url": "http://mlsys.org/api/miniconf/users/27567?format=json", "institution": "University of California, Berkeley"}, {"id": 27568, "fullname": "Zhifei Li", "url": "http://mlsys.org/api/miniconf/users/27568?format=json", "institution": "UC Berkeley, University of California, Berkeley"}, {"id": 21025, "fullname": "Shu Liu", "url": "http://mlsys.org/api/miniconf/users/21025?format=json", "institution": "University of California, Berkeley"}, {"id": 17645, "fullname": "Yongji Wu", "url": "http://mlsys.org/api/miniconf/users/17645?format=json", "institution": "Duke University"}, {"id": 27569, "fullname": "Ziming Mao", "url": "http://mlsys.org/api/miniconf/users/27569?format=json", "institution": "University of California, Berkeley"}, {"id": 20906, "fullname": "Yilong Zhao", "url": "http://mlsys.org/api/miniconf/users/20906?format=json", "institution": "University of California, Berkeley"}, {"id": 27570, "fullname": "Xiao Yan", "url": "http://mlsys.org/api/miniconf/users/27570?format=json", "institution": "Wuhan University"}, {"id": 20979, "fullname": "Zhiying Xu", "url": "http://mlsys.org/api/miniconf/users/20979?format=json", "institution": "Amazon"}, {"id": 19070, "fullname": "Yang Zhou", "url": "http://mlsys.org/api/miniconf/users/19070?format=json", "institution": "UC Davis"}, {"id": 11118, "fullname": "Ion Stoica", "url": "http://mlsys.org/api/miniconf/users/11118?format=json", "institution": "UC Berkeley"}, {"id": 27571, "fullname": "Sewon Min", "url": "http://mlsys.org/api/miniconf/users/27571?format=json", "institution": "University of California, Berkeley"}, {"id": 21014, "fullname": "Matei Zaharia", "url": "http://mlsys.org/api/miniconf/users/21014?format=json", "institution": "University of California, Berkeley"}, {"id": 11239, "fullname": "Joseph Gonzalez", "url": "http://mlsys.org/api/miniconf/users/11239?format=json", "institution": "UC Berkeley"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3563", "url": null, "sourceid": 59, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=e8Dp5QkFxP", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 857, "modified": "2026-03-23T21:52:45.384589-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=e8Dp5QkFxP", "resourcetype": "UriEventmedia"}, {"id": 1232, "file": "/media/PosterPDFs/MLSys%202026/3563.png", "modified": "2026-05-19T15:25:52.840486-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1233, "file": "/media/PosterPDFs/MLSys%202026/3563-thumb.png", "modified": "2026-05-19T15:25:53.669226-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "2", "related_events": ["http://mlsys.org/api/miniconf/events/3786?format=json"], "related_events_ids": [3786]}, {"id": 3607, "uid": "fe9fc289c3ff0af142b6d3bead98a923", "name": "BOOST: BOttleneck-Optimized Scalable Training Framework for Low-Rank Large Language Models", "authors": [{"id": 23955, "fullname": "Zhengyang Wang", "url": "http://mlsys.org/api/miniconf/users/23955?format=json", "institution": "University of California, Santa Barbara"}, {"id": 23956, "fullname": "Ziyue Liu", "url": "http://mlsys.org/api/miniconf/users/23956?format=json", "institution": "University of California Santa Barbara"}, {"id": 27774, "fullname": "Ruijie Zhang", "url": "http://mlsys.org/api/miniconf/users/27774?format=json", "institution": "University of California, Santa Barbara"}, {"id": 27161, "fullname": "Avinash Maurya", "url": "http://mlsys.org/api/miniconf/users/27161?format=json", "institution": "Argonne National Laboratory"}, {"id": 27775, "fullname": "Bogdan Nicolae", "url": "http://mlsys.org/api/miniconf/users/27775?format=json", "institution": null}, {"id": 27776, "fullname": "Paul Hovland", "url": "http://mlsys.org/api/miniconf/users/27776?format=json", "institution": "Argonne National Laboratory"}, {"id": 27777, "fullname": "Franck Cappello", "url": "http://mlsys.org/api/miniconf/users/27777?format=json", "institution": null}, {"id": 24510, "fullname": "zheng Zhang", "url": "http://mlsys.org/api/miniconf/users/24510?format=json", "institution": "University of California, Santa Barbara"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3607", "url": null, "sourceid": 83, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=JhN5hldx4V", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 901, "modified": "2026-03-23T21:52:47.082168-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=JhN5hldx4V", "resourcetype": "UriEventmedia"}, {"id": 1229, "file": "/media/PosterPDFs/MLSys%202026/3607.png", "modified": "2026-05-19T15:36:23.343055-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1230, "file": "/media/PosterPDFs/MLSys%202026/3607-thumb.png", "modified": "2026-05-19T15:36:23.464765-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "2", "related_events": ["http://mlsys.org/api/miniconf/events/3830?format=json"], "related_events_ids": [3830]}, {"id": 3587, "uid": "38b3eff8baf56627478ec76a704e9b52", "name": "ContextPilot: Fast Long-Context Inference via Context Reuse", "authors": [{"id": 25934, "fullname": "Yinsicheng Jiang", "url": "http://mlsys.org/api/miniconf/users/25934?format=json", "institution": "University of Edinburgh"}, {"id": 27651, "fullname": "Yeqi Huang", "url": "http://mlsys.org/api/miniconf/users/27651?format=json", "institution": "University of Edinburgh, University of Edinburgh"}, {"id": 27652, "fullname": "Liang Cheng", "url": "http://mlsys.org/api/miniconf/users/27652?format=json", "institution": "University of Edinburgh"}, {"id": 25084, "fullname": "Cheng Deng", "url": "http://mlsys.org/api/miniconf/users/25084?format=json", "institution": "The University of Edinburgh"}, {"id": 27653, "fullname": "Xuan Sun", "url": "http://mlsys.org/api/miniconf/users/27653?format=json", "institution": "University of Edinburgh, University of Edinburgh"}, {"id": 27654, "fullname": "Luo Mai", "url": "http://mlsys.org/api/miniconf/users/27654?format=json", "institution": "Edinburgh University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3587", "url": "https://github.com/EfficientContext/ContextPilot", "sourceid": 101, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=RnKvDy1jv2", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 881, "modified": "2026-03-23T21:52:46.341828-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=RnKvDy1jv2", "resourcetype": "UriEventmedia"}, {"id": 1057, "file": "/media/PosterPDFs/MLSys%202026/3587.png", "modified": "2026-05-14T20:11:49.163531-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1058, "file": "/media/PosterPDFs/MLSys%202026/3587-thumb.png", "modified": "2026-05-14T20:11:49.268185-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1060, "modified": "2026-05-14T20:17:04.843711-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3587.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "6", "related_events": ["http://mlsys.org/api/miniconf/events/3810?format=json"], "related_events_ids": [3810]}, {"id": 3508, "uid": "17e62166fc8586dfa4d1bc0e1742c08b", "name": "CRAFT: Fine-Grained Cost-Aware Expert Replication For Efficient Mixture-of-Experts Serving", "authors": [{"id": 27141, "fullname": "Adrian Zhao", "url": "http://mlsys.org/api/miniconf/users/27141?format=json", "institution": "University of Toronto"}, {"id": 27170, "fullname": "Zhenkun Cai", "url": "http://mlsys.org/api/miniconf/users/27170?format=json", "institution": "Amazon"}, {"id": 27171, "fullname": "Zhenyu Song", "url": "http://mlsys.org/api/miniconf/users/27171?format=json", "institution": null}, {"id": 27172, "fullname": "Lingfan Yu", "url": "http://mlsys.org/api/miniconf/users/27172?format=json", "institution": "Amazon"}, {"id": 27173, "fullname": "Haozheng Fan", "url": "http://mlsys.org/api/miniconf/users/27173?format=json", "institution": "Amazon"}, {"id": 20941, "fullname": "Jun Wu", "url": "http://mlsys.org/api/miniconf/users/20941?format=json", "institution": "Amazon"}, {"id": 11990, "fullname": "Yida Wang", "url": "http://mlsys.org/api/miniconf/users/11990?format=json", "institution": "Amazon"}, {"id": 17626, "fullname": "Nandita Vijaykumar", "url": "http://mlsys.org/api/miniconf/users/17626?format=json", "institution": "Department of Computer Science, University of Toronto"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3508", "url": null, "sourceid": 43, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=zdRvzU9ZCe", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 802, "modified": "2026-03-23T21:52:43.222124-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=zdRvzU9ZCe", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "36", "related_events": ["http://mlsys.org/api/miniconf/events/3731?format=json"], "related_events_ids": [3731]}, {"id": 3768, "uid": "a5bfc9e07964f8dddeb95fc584cd965d", "name": "ExecuTorch - A Unified PyTorch Solution to Run ML Models On-Device", "authors": [{"id": 28448, "fullname": "Mergen Nachin", "url": "http://mlsys.org/api/miniconf/users/28448?format=json", "institution": "Meta"}, {"id": 28957, "fullname": "Digant Desai", "url": "http://mlsys.org/api/miniconf/users/28957?format=json", "institution": "Facebook"}, {"id": 27381, "fullname": "Sicheng Jia", "url": "http://mlsys.org/api/miniconf/users/27381?format=json", "institution": "Meta, Inc."}, {"id": 25593, "fullname": "Chen Lai", "url": "http://mlsys.org/api/miniconf/users/25593?format=json", "institution": "Meta"}, {"id": 27372, "fullname": "Mengwei Liu", "url": "http://mlsys.org/api/miniconf/users/27372?format=json", "institution": "Meta Platforms Inc"}, {"id": 27369, "fullname": "Jacob Szwejbka", "url": "http://mlsys.org/api/miniconf/users/27369?format=json", "institution": null}, {"id": 28486, "fullname": "Raziel Alvarez", "url": "http://mlsys.org/api/miniconf/users/28486?format=json", "institution": null}, {"id": 28487, "fullname": "Robert Ascani", "url": "http://mlsys.org/api/miniconf/users/28487?format=json", "institution": "Meta"}, {"id": 27393, "fullname": "Dave Bort", "url": "http://mlsys.org/api/miniconf/users/27393?format=json", "institution": null}, {"id": 27379, "fullname": "Manuel Candales", "url": "http://mlsys.org/api/miniconf/users/27379?format=json", "institution": "Meta"}, {"id": 28488, "fullname": "Andrew Caples", "url": "http://mlsys.org/api/miniconf/users/28488?format=json", "institution": null}, {"id": 27384, "fullname": "Yanan Cao", "url": "http://mlsys.org/api/miniconf/users/27384?format=json", "institution": "Meta Platforms"}, {"id": 27385, "fullname": "Zhengxu Chen", "url": "http://mlsys.org/api/miniconf/users/27385?format=json", "institution": null}, {"id": 28450, "fullname": "Soumith Chintala", "url": "http://mlsys.org/api/miniconf/users/28450?format=json", "institution": "Thinking Machines"}, {"id": 27367, "fullname": "Gregory Comer", "url": "http://mlsys.org/api/miniconf/users/27367?format=json", "institution": ""}, {"id": 27375, "fullname": "Tanvir Islam", "url": "http://mlsys.org/api/miniconf/users/27375?format=json", "institution": null}, {"id": 28489, "fullname": "Songhao Jia", "url": "http://mlsys.org/api/miniconf/users/28489?format=json", "institution": "Meta"}, {"id": 27394, "fullname": "Tarun Karuturi", "url": "http://mlsys.org/api/miniconf/users/27394?format=json", "institution": null}, {"id": 28965, "fullname": "Jack Khuu", "url": "http://mlsys.org/api/miniconf/users/28965?format=json", "institution": "Meta"}, {"id": 27366, "fullname": "Abhinay Kukkadapu", "url": "http://mlsys.org/api/miniconf/users/27366?format=json", "institution": null}, {"id": 27387, "fullname": "Tugsbayasgalan Manlaibaatar", "url": "http://mlsys.org/api/miniconf/users/27387?format=json", "institution": null}, {"id": 27390, "fullname": "Andrew Or", "url": "http://mlsys.org/api/miniconf/users/27390?format=json", "institution": "Facebook"}, {"id": 27370, "fullname": "Kimish Patel", "url": "http://mlsys.org/api/miniconf/users/27370?format=json", "institution": null}, {"id": 27373, "fullname": "Siddartha Pothapragada", "url": "http://mlsys.org/api/miniconf/users/27373?format=json", "institution": null}, {"id": 28451, "fullname": "Lucy Qiu", "url": "http://mlsys.org/api/miniconf/users/28451?format=json", "institution": "Meta"}, {"id": 27396, "fullname": "Supriya Rao", "url": "http://mlsys.org/api/miniconf/users/27396?format=json", "institution": "Facebook"}, {"id": 27395, "fullname": "Orion Reblitz-Richardson", "url": "http://mlsys.org/api/miniconf/users/27395?format=json", "institution": null}, {"id": 27392, "fullname": "Max Ren", "url": "http://mlsys.org/api/miniconf/users/27392?format=json", "institution": null}, {"id": 27380, "fullname": "Scott Roy", "url": "http://mlsys.org/api/miniconf/users/27380?format=json", "institution": "Meta"}, {"id": 27376, "fullname": "Anthony Shoumikhin", "url": "http://mlsys.org/api/miniconf/users/27376?format=json", "institution": null}, {"id": 27383, "fullname": "Scott Wolchok", "url": "http://mlsys.org/api/miniconf/users/27383?format=json", "institution": null}, {"id": 27397, "fullname": "Guang Yang", "url": "http://mlsys.org/api/miniconf/users/27397?format=json", "institution": null}, {"id": 27388, "fullname": "Angela Yi", "url": "http://mlsys.org/api/miniconf/users/27388?format=json", "institution": "Stanford University"}, {"id": 27391, "fullname": "Martin Yuan", "url": "http://mlsys.org/api/miniconf/users/27391?format=json", "institution": null}, {"id": 27378, "fullname": "Hansong Zhang", "url": "http://mlsys.org/api/miniconf/users/27378?format=json", "institution": "Meta Platforms"}, {"id": 27368, "fullname": "Jack Zhang", "url": "http://mlsys.org/api/miniconf/users/27368?format=json", "institution": null}, {"id": 27389, "fullname": "Zhenrui Zhang", "url": "http://mlsys.org/api/miniconf/users/27389?format=json", "institution": "Facebook"}, {"id": 27386, "fullname": "Shunting Zhang", "url": "http://mlsys.org/api/miniconf/users/27386?format=json", "institution": ""}, {"id": 27365, "fullname": "Cemal Bilgin", "url": "http://mlsys.org/api/miniconf/users/27365?format=json", "institution": "Meta"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Best Paper Session", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3768", "url": null, "sourceid": -37, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T09:45:00-07:00", "endtime": "2026-05-19T10:05:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3659?format=json", "parent_id": 3659, "eventmedia": [{"id": 1091, "modified": "2026-05-16T00:39:21.607379-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3768_4KzY8Rk.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3545?format=json"], "related_events_ids": [3545]}, {"id": 3603, "uid": "2b44928ae11fb9384c4cf38708677c48", "name": "MoEBlaze: Breaking the Memory Wall for Efficient MoE Training on Modern GPUs", "authors": [{"id": 27752, "fullname": "Jiyuan Zhang", "url": "http://mlsys.org/api/miniconf/users/27752?format=json", "institution": "Meta"}, {"id": 25811, "fullname": "Yining Liu", "url": "http://mlsys.org/api/miniconf/users/25811?format=json", "institution": "Meta"}, {"id": 27729, "fullname": "Siqi Yan", "url": "http://mlsys.org/api/miniconf/users/27729?format=json", "institution": "Facebook"}, {"id": 27720, "fullname": "Lisen Deng", "url": "http://mlsys.org/api/miniconf/users/27720?format=json", "institution": "Meta"}, {"id": 27719, "fullname": "Jennifer Cao", "url": "http://mlsys.org/api/miniconf/users/27719?format=json", "institution": "Facebook"}, {"id": 27159, "fullname": "Shuqi Yang", "url": "http://mlsys.org/api/miniconf/users/27159?format=json", "institution": "Meta"}, {"id": 27731, "fullname": "Bi Xue", "url": "http://mlsys.org/api/miniconf/users/27731?format=json", "institution": "Thinking Machines Lab"}, {"id": 27730, "fullname": "Min Ni", "url": "http://mlsys.org/api/miniconf/users/27730?format=json", "institution": "Northwestern University"}, {"id": 16149, "fullname": "Shen Li", "url": "http://mlsys.org/api/miniconf/users/16149?format=json", "institution": "Meta"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3603", "url": null, "sourceid": 115, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=L8qKfWWkry", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 897, "modified": "2026-03-23T21:52:46.937141-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=L8qKfWWkry", "resourcetype": "UriEventmedia"}, {"id": 1148, "file": "/media/PosterPDFs/MLSys%202026/3603.png", "modified": "2026-05-16T00:38:58.177766-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1149, "file": "/media/PosterPDFs/MLSys%202026/3603-thumb.png", "modified": "2026-05-16T00:59:32.902013-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "30", "related_events": ["http://mlsys.org/api/miniconf/events/3826?format=json"], "related_events_ids": [3826]}, {"id": 3826, "uid": "2b44928ae11fb9384c4cf38708677c48", "name": "MoEBlaze: Breaking the Memory Wall for Efficient MoE Training on Modern GPUs", "authors": [{"id": 27752, "fullname": "Jiyuan Zhang", "url": "http://mlsys.org/api/miniconf/users/27752?format=json", "institution": "Meta"}, {"id": 25811, "fullname": "Yining Liu", "url": "http://mlsys.org/api/miniconf/users/25811?format=json", "institution": "Meta"}, {"id": 27729, "fullname": "Siqi Yan", "url": "http://mlsys.org/api/miniconf/users/27729?format=json", "institution": "Facebook"}, {"id": 27720, "fullname": "Lisen Deng", "url": "http://mlsys.org/api/miniconf/users/27720?format=json", "institution": "Meta"}, {"id": 27719, "fullname": "Jennifer Cao", "url": "http://mlsys.org/api/miniconf/users/27719?format=json", "institution": "Facebook"}, {"id": 27159, "fullname": "Shuqi Yang", "url": "http://mlsys.org/api/miniconf/users/27159?format=json", "institution": "Meta"}, {"id": 27731, "fullname": "Bi Xue", "url": "http://mlsys.org/api/miniconf/users/27731?format=json", "institution": "Thinking Machines Lab"}, {"id": 27730, "fullname": "Min Ni", "url": "http://mlsys.org/api/miniconf/users/27730?format=json", "institution": "Northwestern University"}, {"id": 16149, "fullname": "Shen Li", "url": "http://mlsys.org/api/miniconf/users/16149?format=json", "institution": "Meta"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: LLM Training 4", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3826", "url": null, "sourceid": -115, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T15:45:00-07:00", "endtime": "2026-05-21T16:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3713?format=json", "parent_id": 3713, "eventmedia": [{"id": 1137, "modified": "2026-05-19T16:43:31.025775-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3826_TlhaaTE.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3603?format=json"], "related_events_ids": [3603]}, {"id": 3509, "uid": "02e74f10e0327ad868d138f2b4fdd6f0", "name": "From Tokens to Layers: Redefining Stall-Free Scheduling for MoE Serving with Layered Prefill", "authors": [{"id": 26188, "fullname": "Gunjun Lee", "url": "http://mlsys.org/api/miniconf/users/26188?format=json", "institution": "Seoul National University"}, {"id": 27174, "fullname": "Jiwon Kim", "url": "http://mlsys.org/api/miniconf/users/27174?format=json", "institution": null}, {"id": 27175, "fullname": "Jaiyoung Park", "url": "http://mlsys.org/api/miniconf/users/27175?format=json", "institution": null}, {"id": 27176, "fullname": "Younjoo Lee", "url": "http://mlsys.org/api/miniconf/users/27176?format=json", "institution": "Seoul National University"}, {"id": 27177, "fullname": "Jung Ho Ahn", "url": "http://mlsys.org/api/miniconf/users/27177?format=json", "institution": "Seoul National University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3509", "url": null, "sourceid": 27, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=yyDbI3HXco", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 803, "modified": "2026-03-23T21:52:43.267572-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=yyDbI3HXco", "resourcetype": "UriEventmedia"}, {"id": 1030, "file": "/media/PosterPDFs/MLSys%202026/3509.png", "modified": "2026-05-14T06:55:37.675255-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1031, "file": "/media/PosterPDFs/MLSys%202026/3509-thumb.png", "modified": "2026-05-14T06:55:37.783055-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "24", "related_events": ["http://mlsys.org/api/miniconf/events/3732?format=json"], "related_events_ids": [3732]}, {"id": 3782, "uid": "f0935e4cd5920aa6c7c996a5ee53a70f", "name": "Speculative Decoding: Performance or Illusion?", "authors": [{"id": 28490, "fullname": "Xiaoxuan Liu", "url": "http://mlsys.org/api/miniconf/users/28490?format=json", "institution": "OpenAI"}, {"id": 25915, "fullname": "Jiaxiang Yu", "url": "http://mlsys.org/api/miniconf/users/25915?format=json", "institution": "UC Berkeley"}, {"id": 27180, "fullname": "Jongseok Park", "url": "http://mlsys.org/api/miniconf/users/27180?format=json", "institution": "University of California, Berkeley"}, {"id": 11118, "fullname": "Ion Stoica", "url": "http://mlsys.org/api/miniconf/users/11118?format=json", "institution": "UC Berkeley"}, {"id": 27557, "fullname": "Alvin Cheung", "url": "http://mlsys.org/api/miniconf/users/27557?format=json", "institution": "University of California, Berkeley"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 5", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3782", "url": null, "sourceid": -106, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T09:00:00-07:00", "endtime": "2026-05-21T09:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3701?format=json", "parent_id": 3701, "eventmedia": [{"id": 1150, "modified": "2026-05-16T01:05:15.795337-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3782.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3559?format=json"], "related_events_ids": [3559]}, {"id": 3824, "uid": "c45147dee729311ef5b5c3003946c48f", "name": "Pylo: Towards Accessible Learned Optimizers in PyTorch", "authors": [{"id": 27741, "fullname": "Paul Janson", "url": "http://mlsys.org/api/miniconf/users/27741?format=json", "institution": "Concordia University"}, {"id": 27742, "fullname": "Benjamin Th\u00e9rien", "url": "http://mlsys.org/api/miniconf/users/27742?format=json", "institution": "Mila / Universit\u00e9 de Montr\u00e9al"}, {"id": 27743, "fullname": "Quentin Anthony", "url": "http://mlsys.org/api/miniconf/users/27743?format=json", "institution": "EleutherAI"}, {"id": 27744, "fullname": "Xiaolong Huang", "url": "http://mlsys.org/api/miniconf/users/27744?format=json", "institution": "Concordia University"}, {"id": 27745, "fullname": "Abhinav Moudgil", "url": "http://mlsys.org/api/miniconf/users/27745?format=json", "institution": "Concordia University"}, {"id": 27746, "fullname": "Eugene Belilovsky", "url": "http://mlsys.org/api/miniconf/users/27746?format=json", "institution": "Concordia University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3824", "url": "https://belilovsky-lab.github.io/pylo/", "sourceid": -116, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T15:45:00-07:00", "endtime": "2026-05-20T16:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3692?format=json", "parent_id": 3692, "eventmedia": [{"id": 1049, "modified": "2026-05-19T17:42:11.308760-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3824_HZUGKXd.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3601?format=json"], "related_events_ids": [3601]}, {"id": 3787, "uid": "ec5decca5ed3d6b8079e2e7e7bacc9f2", "name": "PLA-Serve: A Prefill-Length-Aware LLM Serving System", "authors": [{"id": 17078, "fullname": "Jianshu She", "url": "http://mlsys.org/api/miniconf/users/17078?format=json", "institution": "MBZUAI"}, {"id": 27572, "fullname": "Zonghang Li", "url": "http://mlsys.org/api/miniconf/users/27572?format=json", "institution": "Mohamed bin Zayed University of Artificial Intelligence"}, {"id": 27573, "fullname": "HONGCHAO DU", "url": "http://mlsys.org/api/miniconf/users/27573?format=json", "institution": ""}, {"id": 27574, "fullname": "Shangyu Wu", "url": "http://mlsys.org/api/miniconf/users/27574?format=json", "institution": "Mohamed bin Zayed University of Artificial Intelligence"}, {"id": 27575, "fullname": "Wenhao Zheng", "url": "http://mlsys.org/api/miniconf/users/27575?format=json", "institution": "University of North Carolina at Chapel Hill"}, {"id": 16300, "fullname": "Eric Xing", "url": "http://mlsys.org/api/miniconf/users/16300?format=json", "institution": "MBZUAI, CMU, and Petuum Inc."}, {"id": 27577, "fullname": "Zhengzhong Liu", "url": "http://mlsys.org/api/miniconf/users/27577?format=json", "institution": "Mohamed bin Zayed University of Artificial Intelligence"}, {"id": 27578, "fullname": "Huaxiu Yao", "url": "http://mlsys.org/api/miniconf/users/27578?format=json", "institution": ""}, {"id": 27579, "fullname": "Chun Jason Xue", "url": "http://mlsys.org/api/miniconf/users/27579?format=json", "institution": "Mohamed bin Zayed University of Artificial Intelligence"}, {"id": 16309, "fullname": "Qirong Ho", "url": "http://mlsys.org/api/miniconf/users/16309?format=json", "institution": "MBZUAI"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3787", "url": "https://github.com/Jianshu-She/LAPS", "sourceid": -127, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T15:15:00-07:00", "endtime": "2026-05-19T15:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3675?format=json", "parent_id": 3675, "eventmedia": [{"id": 997, "modified": "2026-05-16T13:54:09.766199-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3787_G7LPmPu.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3564?format=json"], "related_events_ids": [3564]}, {"id": 3608, "uid": "ed3d2c21991e3bef5e069713af9fa6ca", "name": "GUARD: SCALABLE STRAGGLER DETECTION AND NODE HEALTH MANAGEMENT FOR LARGE-SCALE TRAINING", "authors": [{"id": 25932, "fullname": "guanliang liu", "url": "http://mlsys.org/api/miniconf/users/25932?format=json", "institution": "Amazon"}, {"id": 27783, "fullname": "Abhinandan Patni", "url": "http://mlsys.org/api/miniconf/users/27783?format=json", "institution": ""}, {"id": 27782, "fullname": "congzhu lin", "url": "http://mlsys.org/api/miniconf/users/27782?format=json", "institution": null}, {"id": 21189, "fullname": "Zoe Zeng", "url": "http://mlsys.org/api/miniconf/users/21189?format=json", "institution": "Amazon Foundation Modeling"}, {"id": 27778, "fullname": "Jack Wittmayer", "url": "http://mlsys.org/api/miniconf/users/27778?format=json", "institution": null}, {"id": 27780, "fullname": "Yinghong Liu", "url": "http://mlsys.org/api/miniconf/users/27780?format=json", "institution": "Amazon"}, {"id": 27781, "fullname": "josh wu", "url": "http://mlsys.org/api/miniconf/users/27781?format=json", "institution": null}, {"id": 27788, "fullname": "Anthony Ko", "url": "http://mlsys.org/api/miniconf/users/27788?format=json", "institution": null}, {"id": 27785, "fullname": "Alexander Zhipa", "url": "http://mlsys.org/api/miniconf/users/27785?format=json", "institution": "Amazon"}, {"id": 27163, "fullname": "Ashvin Nihalani", "url": "http://mlsys.org/api/miniconf/users/27163?format=json", "institution": "Amazon"}, {"id": 27786, "fullname": "Binxuan Huang", "url": "http://mlsys.org/api/miniconf/users/27786?format=json", "institution": "Amazon"}, {"id": 17887, "fullname": "Cong Cheng", "url": "http://mlsys.org/api/miniconf/users/17887?format=json", "institution": "Amazon"}, {"id": 27779, "fullname": "Mi Sun", "url": "http://mlsys.org/api/miniconf/users/27779?format=json", "institution": null}, {"id": 28963, "fullname": "Vijay rajakumar", "url": "http://mlsys.org/api/miniconf/users/28963?format=json", "institution": "Amazon"}, {"id": 28497, "fullname": "Rejith Joseph", "url": "http://mlsys.org/api/miniconf/users/28497?format=json", "institution": "Amazon"}, {"id": 27787, "fullname": "Parthasarathy Govindarajen", "url": "http://mlsys.org/api/miniconf/users/27787?format=json", "institution": "Amazon"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3608", "url": null, "sourceid": 98, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=JFEwQ821MS", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 902, "modified": "2026-03-23T21:52:47.116357-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=JFEwQ821MS", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "28", "related_events": ["http://mlsys.org/api/miniconf/events/3831?format=json"], "related_events_ids": [3831]}, {"id": 3831, "uid": "ed3d2c21991e3bef5e069713af9fa6ca", "name": "GUARD: SCALABLE STRAGGLER DETECTION AND NODE HEALTH MANAGEMENT FOR LARGE-SCALE TRAINING", "authors": [{"id": 25932, "fullname": "guanliang liu", "url": "http://mlsys.org/api/miniconf/users/25932?format=json", "institution": "Amazon"}, {"id": 27783, "fullname": "Abhinandan Patni", "url": "http://mlsys.org/api/miniconf/users/27783?format=json", "institution": ""}, {"id": 27782, "fullname": "congzhu lin", "url": "http://mlsys.org/api/miniconf/users/27782?format=json", "institution": null}, {"id": 21189, "fullname": "Zoe Zeng", "url": "http://mlsys.org/api/miniconf/users/21189?format=json", "institution": "Amazon Foundation Modeling"}, {"id": 27778, "fullname": "Jack Wittmayer", "url": "http://mlsys.org/api/miniconf/users/27778?format=json", "institution": null}, {"id": 27780, "fullname": "Yinghong Liu", "url": "http://mlsys.org/api/miniconf/users/27780?format=json", "institution": "Amazon"}, {"id": 27781, "fullname": "josh wu", "url": "http://mlsys.org/api/miniconf/users/27781?format=json", "institution": null}, {"id": 27788, "fullname": "Anthony Ko", "url": "http://mlsys.org/api/miniconf/users/27788?format=json", "institution": null}, {"id": 27785, "fullname": "Alexander Zhipa", "url": "http://mlsys.org/api/miniconf/users/27785?format=json", "institution": "Amazon"}, {"id": 27163, "fullname": "Ashvin Nihalani", "url": "http://mlsys.org/api/miniconf/users/27163?format=json", "institution": "Amazon"}, {"id": 27786, "fullname": "Binxuan Huang", "url": "http://mlsys.org/api/miniconf/users/27786?format=json", "institution": "Amazon"}, {"id": 17887, "fullname": "Cong Cheng", "url": "http://mlsys.org/api/miniconf/users/17887?format=json", "institution": "Amazon"}, {"id": 27779, "fullname": "Mi Sun", "url": "http://mlsys.org/api/miniconf/users/27779?format=json", "institution": null}, {"id": 28963, "fullname": "Vijay rajakumar", "url": "http://mlsys.org/api/miniconf/users/28963?format=json", "institution": "Amazon"}, {"id": 28497, "fullname": "Rejith Joseph", "url": "http://mlsys.org/api/miniconf/users/28497?format=json", "institution": "Amazon"}, {"id": 27787, "fullname": "Parthasarathy Govindarajen", "url": "http://mlsys.org/api/miniconf/users/27787?format=json", "institution": "Amazon"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: LLM Training 4", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3831", "url": null, "sourceid": -98, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T15:30:00-07:00", "endtime": "2026-05-21T15:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3713?format=json", "parent_id": 3713, "eventmedia": [{"id": 1019, "modified": "2026-05-15T20:25:10.100634-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3831_b41kyKe.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3608?format=json"], "related_events_ids": [3608]}, {"id": 3625, "uid": "c20ad4d76fe97759aa27a0c99bff6710", "name": "IntAttention: A Fully Integer Attention Pipeline for Efficient Edge Inference", "authors": [{"id": 25556, "fullname": "Wanli Zhong", "url": "http://mlsys.org/api/miniconf/users/25556?format=json", "institution": "Southern University of Science and Technology"}, {"id": 27848, "fullname": "Haibo Feng", "url": "http://mlsys.org/api/miniconf/users/27848?format=json", "institution": "Southern University of Science and Technology"}, {"id": 27849, "fullname": "Zirui Zhou", "url": "http://mlsys.org/api/miniconf/users/27849?format=json", "institution": "Southern University of Science and Technology"}, {"id": 27850, "fullname": "Hanyang Peng", "url": "http://mlsys.org/api/miniconf/users/27850?format=json", "institution": "Pengcheng Loboratory"}, {"id": 27851, "fullname": "Shiqi Yu", "url": "http://mlsys.org/api/miniconf/users/27851?format=json", "institution": "Southern University of Science and Technology, Shenzhen, China"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3625", "url": null, "sourceid": 12, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=CPCRITwAaP", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 919, "modified": "2026-03-23T21:52:47.824478-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=CPCRITwAaP", "resourcetype": "UriEventmedia"}, {"id": 1151, "file": "/media/PosterPDFs/MLSys%202026/3625.png", "modified": "2026-05-16T01:34:13.194518-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1152, "file": "/media/PosterPDFs/MLSys%202026/3625-thumb.png", "modified": "2026-05-16T01:34:13.305521-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1153, "modified": "2026-05-16T01:34:55.249034-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3625.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "13", "related_events": ["http://mlsys.org/api/miniconf/events/3848?format=json"], "related_events_ids": [3848]}, {"id": 3757, "uid": "a5771bce93e200c36f7cd9dfd0e5deaa", "name": "ApproxMLIR : Accuracy-Aware Compiler for Compound ML System", "authors": [{"id": 27335, "fullname": "Hao Ren", "url": "http://mlsys.org/api/miniconf/users/27335?format=json", "institution": "University of Illinois Urbana-Champaign"}, {"id": 27336, "fullname": "Yi Mu", "url": "http://mlsys.org/api/miniconf/users/27336?format=json", "institution": "University of Illinois at Urbana-Champaign"}, {"id": 16274, "fullname": "Sasa Misailovic", "url": "http://mlsys.org/api/miniconf/users/16274?format=json", "institution": "UIUC"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Compilers and Kernels", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3757", "url": null, "sourceid": -38, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T17:30:00-07:00", "endtime": "2026-05-21T17:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3718?format=json", "parent_id": 3718, "eventmedia": [{"id": 1118, "modified": "2026-05-15T17:17:31.063111-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3757.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3534?format=json"], "related_events_ids": [3534]}, {"id": 3848, "uid": "c20ad4d76fe97759aa27a0c99bff6710", "name": "IntAttention: A Fully Integer Attention Pipeline for Efficient Edge Inference", "authors": [{"id": 25556, "fullname": "Wanli Zhong", "url": "http://mlsys.org/api/miniconf/users/25556?format=json", "institution": "Southern University of Science and Technology"}, {"id": 27848, "fullname": "Haibo Feng", "url": "http://mlsys.org/api/miniconf/users/27848?format=json", "institution": "Southern University of Science and Technology"}, {"id": 27849, "fullname": "Zirui Zhou", "url": "http://mlsys.org/api/miniconf/users/27849?format=json", "institution": "Southern University of Science and Technology"}, {"id": 27850, "fullname": "Hanyang Peng", "url": "http://mlsys.org/api/miniconf/users/27850?format=json", "institution": "Pengcheng Loboratory"}, {"id": 27851, "fullname": "Shiqi Yu", "url": "http://mlsys.org/api/miniconf/users/27851?format=json", "institution": "Southern University of Science and Technology, Shenzhen, China"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Efficient ML", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3848", "url": "https://github.com/WanliZhong/IntAttention", "sourceid": -12, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T13:15:00-07:00", "endtime": "2026-05-21T13:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3710?format=json", "parent_id": 3710, "eventmedia": [{"id": 1154, "modified": "2026-05-16T01:36:42.936736-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3848.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3625?format=json"], "related_events_ids": [3625]}, {"id": 3830, "uid": "fe9fc289c3ff0af142b6d3bead98a923", "name": "BOOST: BOttleneck-Optimized Scalable Training Framework for Low-Rank Large Language Models", "authors": [{"id": 23955, "fullname": "Zhengyang Wang", "url": "http://mlsys.org/api/miniconf/users/23955?format=json", "institution": "University of California, Santa Barbara"}, {"id": 23956, "fullname": "Ziyue Liu", "url": "http://mlsys.org/api/miniconf/users/23956?format=json", "institution": "University of California Santa Barbara"}, {"id": 27774, "fullname": "Ruijie Zhang", "url": "http://mlsys.org/api/miniconf/users/27774?format=json", "institution": "University of California, Santa Barbara"}, {"id": 27161, "fullname": "Avinash Maurya", "url": "http://mlsys.org/api/miniconf/users/27161?format=json", "institution": "Argonne National Laboratory"}, {"id": 27775, "fullname": "Bogdan Nicolae", "url": "http://mlsys.org/api/miniconf/users/27775?format=json", "institution": null}, {"id": 27776, "fullname": "Paul Hovland", "url": "http://mlsys.org/api/miniconf/users/27776?format=json", "institution": "Argonne National Laboratory"}, {"id": 27777, "fullname": "Franck Cappello", "url": "http://mlsys.org/api/miniconf/users/27777?format=json", "institution": null}, {"id": 24510, "fullname": "zheng Zhang", "url": "http://mlsys.org/api/miniconf/users/24510?format=json", "institution": "University of California, Santa Barbara"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3830", "url": null, "sourceid": -83, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T08:30:00-07:00", "endtime": "2026-05-20T08:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3679?format=json", "parent_id": 3679, "eventmedia": [{"id": 1235, "modified": "2026-05-19T23:00:40.932636-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3830.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3607?format=json"], "related_events_ids": [3607]}, {"id": 3514, "uid": "072b030ba126b2f4b2374f342be9ed44", "name": "FP8-Flow-MoE: A Casting-Free FP8 Recipe without Double Quantization Error", "authors": [{"id": 25853, "fullname": "Fengjuan Wang", "url": "http://mlsys.org/api/miniconf/users/25853?format=json", "institution": "zhejianglab"}, {"id": 27194, "fullname": "Zhiyi Su", "url": "http://mlsys.org/api/miniconf/users/27194?format=json", "institution": "Zhejiang Lab, Zhejiang Lab"}, {"id": 27195, "fullname": "Xingzhu Hu", "url": "http://mlsys.org/api/miniconf/users/27195?format=json", "institution": null}, {"id": 27196, "fullname": "Cheng Wang", "url": "http://mlsys.org/api/miniconf/users/27196?format=json", "institution": null}, {"id": 25609, "fullname": "Sun Mou", "url": "http://mlsys.org/api/miniconf/users/25609?format=json", "institution": "Zhejiang Lab"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3514", "url": null, "sourceid": 60, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=wyH60Su6G7", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 808, "modified": "2026-03-23T21:52:43.443255-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=wyH60Su6G7", "resourcetype": "UriEventmedia"}, {"id": 951, "file": "/media/PosterPDFs/MLSys%202026/3514-thumb.png", "modified": "2026-04-26T01:10:00.451292-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 950, "file": "/media/PosterPDFs/MLSys%202026/3514.png", "modified": "2026-04-26T01:10:00.379318-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "47", "related_events": ["http://mlsys.org/api/miniconf/events/3737?format=json"], "related_events_ids": [3737]}, {"id": 3516, "uid": "66f041e16a60928b05a7e228a89c3799", "name": "Toward Principled LLM Safety Testing: Solving the Jailbreak Oracle Problem", "authors": [{"id": 16907, "fullname": "Shuyi Lin", "url": "http://mlsys.org/api/miniconf/users/16907?format=json", "institution": "Northeastern University"}, {"id": 27199, "fullname": "Anshuman Suri", "url": "http://mlsys.org/api/miniconf/users/27199?format=json", "institution": "Northeastern University"}, {"id": 27200, "fullname": "Alina Oprea", "url": "http://mlsys.org/api/miniconf/users/27200?format=json", "institution": "Northeastern University"}, {"id": 16145, "fullname": "Cheng Tan", "url": "http://mlsys.org/api/miniconf/users/16145?format=json", "institution": "Northeastern"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3516", "url": "https://github.com/shuyilinn/BOA/tree/mlsys2026ae", "sourceid": 58, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=vr3Rrg6Xnm", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 810, "modified": "2026-03-23T21:52:43.509340-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=vr3Rrg6Xnm", "resourcetype": "UriEventmedia"}, {"id": 1089, "file": "/media/PosterPDFs/MLSys%202026/3516.png", "modified": "2026-05-15T11:11:03.217910-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1090, "file": "/media/PosterPDFs/MLSys%202026/3516-thumb.png", "modified": "2026-05-15T11:11:03.303661-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "36", "related_events": ["http://mlsys.org/api/miniconf/events/3739?format=json"], "related_events_ids": [3739]}, {"id": 3841, "uid": "d67d8ab4f4c10bf22aa353e27879133c", "name": "CAGE: Curvature-Aware Gradient Estimation For Accurate Quantization-Aware Training", "authors": [{"id": 27826, "fullname": "Soroush Tabesh", "url": "http://mlsys.org/api/miniconf/users/27826?format=json", "institution": "Institute of Science and Technology Austria"}, {"id": 28563, "fullname": "Mher Safaryan", "url": "http://mlsys.org/api/miniconf/users/28563?format=json", "institution": "ISTA, Austria | Lancaster University, UK"}, {"id": 27828, "fullname": "Andrei Panferov", "url": "http://mlsys.org/api/miniconf/users/27828?format=json", "institution": "Institute of Science and Technology Austria"}, {"id": 27829, "fullname": "Alexandra Volkova", "url": "http://mlsys.org/api/miniconf/users/27829?format=json", "institution": null}, {"id": 27830, "fullname": "Dan Alistarh", "url": "http://mlsys.org/api/miniconf/users/27830?format=json", "institution": null}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Model Compression", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3841", "url": null, "sourceid": -39, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T17:00:00-07:00", "endtime": "2026-05-20T17:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3696?format=json", "parent_id": 3696, "eventmedia": [{"id": 1234, "modified": "2026-05-19T23:05:17.285067-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3841_N6ZwMw7.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3618?format=json"], "related_events_ids": [3618]}, {"id": 3737, "uid": "072b030ba126b2f4b2374f342be9ed44", "name": "FP8-Flow-MoE: A Casting-Free FP8 Recipe without Double Quantization Error", "authors": [{"id": 25853, "fullname": "Fengjuan Wang", "url": "http://mlsys.org/api/miniconf/users/25853?format=json", "institution": "zhejianglab"}, {"id": 27194, "fullname": "Zhiyi Su", "url": "http://mlsys.org/api/miniconf/users/27194?format=json", "institution": "Zhejiang Lab, Zhejiang Lab"}, {"id": 27195, "fullname": "Xingzhu Hu", "url": "http://mlsys.org/api/miniconf/users/27195?format=json", "institution": null}, {"id": 27196, "fullname": "Cheng Wang", "url": "http://mlsys.org/api/miniconf/users/27196?format=json", "institution": null}, {"id": 25609, "fullname": "Sun Mou", "url": "http://mlsys.org/api/miniconf/users/25609?format=json", "institution": "Zhejiang Lab"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 3", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3737", "url": "https://github.com/021ai/FP8-FLOW-MOE-AE", "sourceid": -60, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T18:15:00-07:00", "endtime": "2026-05-20T18:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3695?format=json", "parent_id": 3695, "eventmedia": [{"id": 964, "modified": "2026-05-04T22:56:45.489180-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3737.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3514?format=json"], "related_events_ids": [3514]}, {"id": 3739, "uid": "66f041e16a60928b05a7e228a89c3799", "name": "Toward Principled LLM Safety Testing: Solving the Jailbreak Oracle Problem", "authors": [{"id": 16907, "fullname": "Shuyi Lin", "url": "http://mlsys.org/api/miniconf/users/16907?format=json", "institution": "Northeastern University"}, {"id": 27199, "fullname": "Anshuman Suri", "url": "http://mlsys.org/api/miniconf/users/27199?format=json", "institution": "Northeastern University"}, {"id": 27200, "fullname": "Alina Oprea", "url": "http://mlsys.org/api/miniconf/users/27200?format=json", "institution": "Northeastern University"}, {"id": 16145, "fullname": "Cheng Tan", "url": "http://mlsys.org/api/miniconf/users/16145?format=json", "institution": "Northeastern"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Security and Privacy", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3739", "url": "https://github.com/shuyilinn/BOA/tree/mlsys2026ae", "sourceid": -58, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T17:45:00-07:00", "endtime": "2026-05-19T18:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3673?format=json", "parent_id": 3673, "eventmedia": [{"id": 1119, "modified": "2026-05-15T17:20:49.144529-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3739.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3516?format=json"], "related_events_ids": [3516]}, {"id": 3847, "uid": "5f93f983524def3dca464469d2cf9f3e", "name": "Massive-Scale Out-Of-Core UMAP on the GPU", "authors": [{"id": 27164, "fullname": "Jinsol Park", "url": "http://mlsys.org/api/miniconf/users/27164?format=json", "institution": "NVIDIA"}, {"id": 11859, "fullname": "Corey Nolet", "url": "http://mlsys.org/api/miniconf/users/11859?format=json", "institution": "NVIDIA"}, {"id": 14733, "fullname": "Edward Raff", "url": "http://mlsys.org/api/miniconf/users/14733?format=json", "institution": "Booz Allen Hamilton"}, {"id": 27846, "fullname": "Tim Oates", "url": "http://mlsys.org/api/miniconf/users/27846?format=json", "institution": "University of Maryland, Baltimore County"}, {"id": 27847, "fullname": "Akira Naruse", "url": "http://mlsys.org/api/miniconf/users/27847?format=json", "institution": "NVIDIA"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Benchmarks and Evaluation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3847", "url": null, "sourceid": -110, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T14:45:00-07:00", "endtime": "2026-05-21T15:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3714?format=json", "parent_id": 3714, "eventmedia": [{"id": 1041, "modified": "2026-05-14T10:14:43.312797-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3847.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3624?format=json"], "related_events_ids": [3624]}, {"id": 3791, "uid": "3def184ad8f4755ff269862ea77393dd", "name": "PARROT: Persuasion and Agreement Robustness Rating of Output Truth \u2014 A Sycophancy Robustness Benchmark for LLMs", "authors": [{"id": 28463, "fullname": "\u00d6zay Ezerceli", "url": "http://mlsys.org/api/miniconf/users/28463?format=json", "institution": "Isik University"}, {"id": 27598, "fullname": "Mahmoud ElHussieni", "url": "http://mlsys.org/api/miniconf/users/27598?format=json", "institution": "Istanbul Medipol University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Benchmarks and Evaluation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3791", "url": null, "sourceid": -125, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T15:45:00-07:00", "endtime": "2026-05-21T16:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3714?format=json", "parent_id": 3714, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3568?format=json"], "related_events_ids": [3568]}, {"id": 3599, "uid": "d1f491a404d6854880943e5c3cd9ca25", "name": "Unleashing Scalable Context Parallelism for Foundation Models Pre-Training via FCP", "authors": [{"id": 20906, "fullname": "Yilong Zhao", "url": "http://mlsys.org/api/miniconf/users/20906?format=json", "institution": "University of California, Berkeley"}, {"id": 27733, "fullname": "Xiaonan Nie", "url": "http://mlsys.org/api/miniconf/users/27733?format=json", "institution": "ByteDance Seed"}, {"id": 17683, "fullname": "Kan Zhu", "url": "http://mlsys.org/api/miniconf/users/17683?format=json", "institution": "University of Washington"}, {"id": 27734, "fullname": "Shuang Ma", "url": "http://mlsys.org/api/miniconf/users/27734?format=json", "institution": null}, {"id": 27735, "fullname": "Zhichao Lai", "url": "http://mlsys.org/api/miniconf/users/27735?format=json", "institution": null}, {"id": 27736, "fullname": "Hongxiang Hao", "url": "http://mlsys.org/api/miniconf/users/27736?format=json", "institution": "ByteDance Inc."}, {"id": 19070, "fullname": "Yang Zhou", "url": "http://mlsys.org/api/miniconf/users/19070?format=json", "institution": "UC Davis"}, {"id": 17670, "fullname": "Baris Kasikci", "url": "http://mlsys.org/api/miniconf/users/17670?format=json", "institution": "University of Washington"}, {"id": 11118, "fullname": "Ion Stoica", "url": "http://mlsys.org/api/miniconf/users/11118?format=json", "institution": "UC Berkeley"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3599", "url": null, "sourceid": 129, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=MPVycRsIn6", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 893, "modified": "2026-03-23T21:52:46.799467-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=MPVycRsIn6", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "3", "related_events": ["http://mlsys.org/api/miniconf/events/3822?format=json"], "related_events_ids": [3822]}, {"id": 3602, "uid": "7f39f8317fbdb1988ef4c628eba02591", "name": "HetRL: Efficient Reinforcement Learning for LLMs in Heterogeneous Environments", "authors": [{"id": 26252, "fullname": "Yongjun He", "url": "http://mlsys.org/api/miniconf/users/26252?format=json", "institution": "ETH Zurich"}, {"id": 12135, "fullname": "Shuai Zhang", "url": "http://mlsys.org/api/miniconf/users/12135?format=json", "institution": "Amazon Web Services"}, {"id": 28961, "fullname": "Jiading Gai", "url": "http://mlsys.org/api/miniconf/users/28961?format=json", "institution": "Amazon"}, {"id": 27748, "fullname": "Xiyuan Zhang", "url": "http://mlsys.org/api/miniconf/users/27748?format=json", "institution": "AWS"}, {"id": 27749, "fullname": "Boran Han", "url": "http://mlsys.org/api/miniconf/users/27749?format=json", "institution": "Amazon/AWS"}, {"id": 27750, "fullname": "Bernie Wang", "url": "http://mlsys.org/api/miniconf/users/27750?format=json", "institution": "Amazon"}, {"id": 28496, "fullname": "Huzefa Rangwala", "url": "http://mlsys.org/api/miniconf/users/28496?format=json", "institution": "Siemens Corporate Research"}, {"id": 27637, "fullname": "George Karypis", "url": "http://mlsys.org/api/miniconf/users/27637?format=json", "institution": "University of Minnesota, Minneapolis"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3602", "url": null, "sourceid": 61, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=LRLyuaz1W7", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 896, "modified": "2026-03-23T21:52:46.907660-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=LRLyuaz1W7", "resourcetype": "UriEventmedia"}, {"id": 1236, "file": "/media/PosterPDFs/MLSys%202026/3602.png", "modified": "2026-05-19T23:40:09.101390-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1237, "file": "/media/PosterPDFs/MLSys%202026/3602-thumb.png", "modified": "2026-05-19T23:45:25.766602-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "27", "related_events": ["http://mlsys.org/api/miniconf/events/3825?format=json"], "related_events_ids": [3825]}, {"id": 3772, "uid": "182be0c5cdcd5072bb1864cdee4d3d6e", "name": "When Machine Learning Isn\u2019t Sure: Building Resilient ML-Based Computer Systems by Embracing Uncertainty", "authors": [{"id": 27421, "fullname": "Varun Gohil", "url": "http://mlsys.org/api/miniconf/users/27421?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 27422, "fullname": "Nevena Stojkovic", "url": "http://mlsys.org/api/miniconf/users/27422?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 27423, "fullname": "Noman Bashir", "url": "http://mlsys.org/api/miniconf/users/27423?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 28958, "fullname": "Sundar Dev", "url": "http://mlsys.org/api/miniconf/users/28958?format=json", "institution": "Google"}, {"id": 27425, "fullname": "Gaurang Upasani", "url": "http://mlsys.org/api/miniconf/users/27425?format=json", "institution": "Google"}, {"id": 27426, "fullname": "David Lo", "url": "http://mlsys.org/api/miniconf/users/27426?format=json", "institution": "Google"}, {"id": 27427, "fullname": "Parthasarathy Ranganathan", "url": "http://mlsys.org/api/miniconf/users/27427?format=json", "institution": "Google"}, {"id": 20861, "fullname": "Christina Delimitrou", "url": "http://mlsys.org/api/miniconf/users/20861?format=json", "institution": "Cornell University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: ML for Systems", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3772", "url": null, "sourceid": -33, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T14:00:00-07:00", "endtime": "2026-05-20T14:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3688?format=json", "parent_id": 3688, "eventmedia": [{"id": 1043, "modified": "2026-05-15T17:42:35.310305-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3772_bJ5i4pq.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3549?format=json"], "related_events_ids": [3549]}, {"id": 3805, "uid": "2723d092b63885e0d7c260cc007e8b9d", "name": "MixLLM: LLM Quantization with Global Mixed-precision between Output-features and Highly-efficient System Design", "authors": [{"id": 28440, "fullname": "Zhen Zheng", "url": "http://mlsys.org/api/miniconf/users/28440?format=json", "institution": "ByteDance Inc."}, {"id": 27641, "fullname": "Xiaonan Song", "url": "http://mlsys.org/api/miniconf/users/27641?format=json", "institution": "Microsoft"}, {"id": 27642, "fullname": "Chuanjie Liu", "url": "http://mlsys.org/api/miniconf/users/27642?format=json", "institution": "Microsoft"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Model Compression", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3805", "url": null, "sourceid": -109, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T17:45:00-07:00", "endtime": "2026-05-20T18:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3696?format=json", "parent_id": 3696, "eventmedia": [{"id": 1157, "modified": "2026-05-16T04:34:50.765759-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3805.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3582?format=json"], "related_events_ids": [3582]}, {"id": 3613, "uid": "8e296a067a37563370ded05f5a3bf3ec", "name": "ReSpec: Towards Optimizing Speculative Decoding in Reinforcement Learning Systems", "authors": [{"id": 27808, "fullname": "Qiaoling Chen", "url": "http://mlsys.org/api/miniconf/users/27808?format=json", "institution": "Nanyang Technological University"}, {"id": 25950, "fullname": "Zijun Liu", "url": "http://mlsys.org/api/miniconf/users/25950?format=json", "institution": "Tsinghua University"}, {"id": 27809, "fullname": "Peng Sun", "url": "http://mlsys.org/api/miniconf/users/27809?format=json", "institution": "Harbin Institute of Technology"}, {"id": 27810, "fullname": "Shenggui Li", "url": "http://mlsys.org/api/miniconf/users/27810?format=json", "institution": "Nanyang Technological University"}, {"id": 27811, "fullname": "Guoteng Wang", "url": "http://mlsys.org/api/miniconf/users/27811?format=json", "institution": "Shanghai Artificial Intelligence Laboratory"}, {"id": 17655, "fullname": "Ziming Liu", "url": "http://mlsys.org/api/miniconf/users/17655?format=json", "institution": "national university of singaore, National University of Singapore"}, {"id": 20910, "fullname": "Yonggang Wen", "url": "http://mlsys.org/api/miniconf/users/20910?format=json", "institution": "Nanyang Technological University"}, {"id": 27812, "fullname": "Siyuan Feng", "url": "http://mlsys.org/api/miniconf/users/27812?format=json", "institution": "Shanghai Innovation Institute"}, {"id": 20894, "fullname": "Tianwei Zhang", "url": "http://mlsys.org/api/miniconf/users/20894?format=json", "institution": "Nanyang Technological University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3613", "url": null, "sourceid": 25, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=HhDSxs7x2R", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 907, "modified": "2026-03-23T21:52:47.330110-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=HhDSxs7x2R", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "26", "related_events": ["http://mlsys.org/api/miniconf/events/3836?format=json"], "related_events_ids": [3836]}, {"id": 3579, "uid": "eb160de1de89d9058fcb0b968dbbbd68", "name": "Efficient, VRAM-Constrained xLM Inference on Clients", "authors": [{"id": 27156, "fullname": "Aditya Ukarande", "url": "http://mlsys.org/api/miniconf/users/27156?format=json", "institution": "Nvidia"}, {"id": 27631, "fullname": "Deep Shekhar", "url": "http://mlsys.org/api/miniconf/users/27631?format=json", "institution": "Nvidia"}, {"id": 27632, "fullname": "Marc Blackstein", "url": "http://mlsys.org/api/miniconf/users/27632?format=json", "institution": null}, {"id": 27157, "fullname": "Ram Rangan", "url": "http://mlsys.org/api/miniconf/users/27157?format=json", "institution": "NVIDIA"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3579", "url": null, "sourceid": 117, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=VKqQYg6JPb", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 873, "modified": "2026-03-23T21:52:46.042387-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=VKqQYg6JPb", "resourcetype": "UriEventmedia"}, {"id": 1105, "file": "/media/PosterPDFs/MLSys%202026/3579.png", "modified": "2026-05-15T14:13:45.614993-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1106, "file": "/media/PosterPDFs/MLSys%202026/3579-thumb.png", "modified": "2026-05-15T14:13:45.716543-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "47", "related_events": ["http://mlsys.org/api/miniconf/events/3802?format=json"], "related_events_ids": [3802]}, {"id": 3561, "uid": "32bb90e8976aab5298d5da10fe66f21d", "name": "Breaking the Ice: Analyzing Cold Start Latency in vLLM", "authors": [{"id": 25925, "fullname": "Huzaifa Shaaban Kabakibo", "url": "http://mlsys.org/api/miniconf/users/25925?format=json", "institution": "Paderborn University"}, {"id": 27154, "fullname": "Animesh Trivedi", "url": "http://mlsys.org/api/miniconf/users/27154?format=json", "institution": "International Business Machines"}, {"id": 27565, "fullname": "Lin Wang", "url": "http://mlsys.org/api/miniconf/users/27565?format=json", "institution": "Paderborn University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3561", "url": "https://github.com/upb-cn/vllm-startup-profiler", "sourceid": 72, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=eoEobeKTNZ", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 855, "modified": "2026-03-23T21:52:45.294986-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=eoEobeKTNZ", "resourcetype": "UriEventmedia"}, {"id": 970, "file": "/media/PosterPDFs/MLSys%202026/3561-thumb.png", "modified": "2026-05-06T01:07:18.334103-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 969, "modified": "2026-05-15T03:08:58.164876-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3561_Se0amy6.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "9", "related_events": ["http://mlsys.org/api/miniconf/events/3784?format=json"], "related_events_ids": [3784]}, {"id": 3517, "uid": "6ea9ab1baa0efb9e19094440c317e21b", "name": "ProfInfer: An eBPF-based Fine-Grained LLM Inference Profiler", "authors": [{"id": 26249, "fullname": "Bohua Zou", "url": "http://mlsys.org/api/miniconf/users/26249?format=json", "institution": "Technical University of Munich"}, {"id": 27201, "fullname": "Debayan Roy", "url": "http://mlsys.org/api/miniconf/users/27201?format=json", "institution": null}, {"id": 27202, "fullname": "Dhimankumar Airao", "url": "http://mlsys.org/api/miniconf/users/27202?format=json", "institution": null}, {"id": 27203, "fullname": "Weihao Xu", "url": "http://mlsys.org/api/miniconf/users/27203?format=json", "institution": "TUM"}, {"id": 25570, "fullname": "Binqi Sun", "url": "http://mlsys.org/api/miniconf/users/25570?format=json", "institution": "Technical University of Munich"}, {"id": 27204, "fullname": "Yutao Liu", "url": "http://mlsys.org/api/miniconf/users/27204?format=json", "institution": null}, {"id": 27205, "fullname": "Haibo Chen", "url": "http://mlsys.org/api/miniconf/users/27205?format=json", "institution": null}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3517", "url": null, "sourceid": 29, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=tYHWS7YPof", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 811, "modified": "2026-03-23T21:52:43.546541-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=tYHWS7YPof", "resourcetype": "UriEventmedia"}, {"id": 1077, "file": "/media/PosterPDFs/MLSys%202026/3517.png", "modified": "2026-05-15T08:03:35.162868-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "42", "related_events": ["http://mlsys.org/api/miniconf/events/3740?format=json"], "related_events_ids": [3740]}, {"id": 3822, "uid": "d1f491a404d6854880943e5c3cd9ca25", "name": "Unleashing Scalable Context Parallelism for Foundation Models Pre-Training via FCP", "authors": [{"id": 20906, "fullname": "Yilong Zhao", "url": "http://mlsys.org/api/miniconf/users/20906?format=json", "institution": "University of California, Berkeley"}, {"id": 27733, "fullname": "Xiaonan Nie", "url": "http://mlsys.org/api/miniconf/users/27733?format=json", "institution": "ByteDance Seed"}, {"id": 17683, "fullname": "Kan Zhu", "url": "http://mlsys.org/api/miniconf/users/17683?format=json", "institution": "University of Washington"}, {"id": 27734, "fullname": "Shuang Ma", "url": "http://mlsys.org/api/miniconf/users/27734?format=json", "institution": null}, {"id": 27735, "fullname": "Zhichao Lai", "url": "http://mlsys.org/api/miniconf/users/27735?format=json", "institution": null}, {"id": 27736, "fullname": "Hongxiang Hao", "url": "http://mlsys.org/api/miniconf/users/27736?format=json", "institution": "ByteDance Inc."}, {"id": 19070, "fullname": "Yang Zhou", "url": "http://mlsys.org/api/miniconf/users/19070?format=json", "institution": "UC Davis"}, {"id": 17670, "fullname": "Baris Kasikci", "url": "http://mlsys.org/api/miniconf/users/17670?format=json", "institution": "University of Washington"}, {"id": 11118, "fullname": "Ion Stoica", "url": "http://mlsys.org/api/miniconf/users/11118?format=json", "institution": "UC Berkeley"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3822", "url": null, "sourceid": -129, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T08:45:00-07:00", "endtime": "2026-05-20T09:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3679?format=json", "parent_id": 3679, "eventmedia": [{"id": 1162, "modified": "2026-05-20T00:22:57.862270-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3822_HdG9Mug.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3599?format=json"], "related_events_ids": [3599]}, {"id": 3860, "uid": "642e92efb79421734881b53e1e1b18b6", "name": "veScale-FSDP: Flexible and High-Performance FSDP at Scale", "authors": [{"id": 27954, "fullname": "Zezhou Wang", "url": "http://mlsys.org/api/miniconf/users/27954?format=json", "institution": "University of Washington"}, {"id": 27955, "fullname": "Youjie Li", "url": "http://mlsys.org/api/miniconf/users/27955?format=json", "institution": "ByteDance Seed, veScale"}, {"id": 27956, "fullname": "Zhiqi Lin", "url": "http://mlsys.org/api/miniconf/users/27956?format=json", "institution": "ByteDance Inc."}, {"id": 27957, "fullname": "Jiacheng Yang", "url": "http://mlsys.org/api/miniconf/users/27957?format=json", "institution": "ByteDance Inc."}, {"id": 27958, "fullname": "Cong Xie", "url": "http://mlsys.org/api/miniconf/users/27958?format=json", "institution": "ByteDance"}, {"id": 27959, "fullname": "Guanyu Feng", "url": "http://mlsys.org/api/miniconf/users/27959?format=json", "institution": null}, {"id": 27960, "fullname": "ZHENG ZHONG", "url": "http://mlsys.org/api/miniconf/users/27960?format=json", "institution": "Bytedance"}, {"id": 27961, "fullname": "Ziyue Huang", "url": "http://mlsys.org/api/miniconf/users/27961?format=json", "institution": ""}, {"id": 27962, "fullname": "Hongyu Zhu", "url": "http://mlsys.org/api/miniconf/users/27962?format=json", "institution": "ByteDance Inc."}, {"id": 27963, "fullname": "Zhi Zhang", "url": "http://mlsys.org/api/miniconf/users/27963?format=json", "institution": "ByteDance Inc."}, {"id": 27964, "fullname": "Yanghua Peng", "url": "http://mlsys.org/api/miniconf/users/27964?format=json", "institution": "ByteDance Inc."}, {"id": 20969, "fullname": "Xin Liu", "url": "http://mlsys.org/api/miniconf/users/20969?format=json", "institution": "ByteDance Inc."}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: LLM Training 4", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3860", "url": null, "sourceid": -48, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T15:00:00-07:00", "endtime": "2026-05-21T15:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3713?format=json", "parent_id": 3713, "eventmedia": [{"id": 1114, "modified": "2026-05-15T15:20:46.298586-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3860.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3637?format=json"], "related_events_ids": [3637]}, {"id": 3762, "uid": "9b8619251a19057cff70779273e95aa6", "name": "Practical Adversarial Multi-Armed Bandits with Sublinear Runtime", "authors": [{"id": 21072, "fullname": "Kasper Overgaard Mortensen", "url": "http://mlsys.org/api/miniconf/users/21072?format=json", "institution": "Aarhus University"}, {"id": 27348, "fullname": "Ama Bembua Bainson", "url": "http://mlsys.org/api/miniconf/users/27348?format=json", "institution": "Aarhus University"}, {"id": 27349, "fullname": "Mathias Tversted", "url": "http://mlsys.org/api/miniconf/users/27349?format=json", "institution": null}, {"id": 27350, "fullname": "Kristoffer Strube", "url": "http://mlsys.org/api/miniconf/users/27350?format=json", "institution": "Kristoffer Strube Consulting"}, {"id": 27351, "fullname": "Renata Borovica-Gajic", "url": "http://mlsys.org/api/miniconf/users/27351?format=json", "institution": "University of Melbourne"}, {"id": 27352, "fullname": "Andrea Paudice", "url": "http://mlsys.org/api/miniconf/users/27352?format=json", "institution": "Aarhus University"}, {"id": 21058, "fullname": "Davide Mottin", "url": "http://mlsys.org/api/miniconf/users/21058?format=json", "institution": "Aarhus University"}, {"id": 21084, "fullname": "Panagiotis Karras", "url": "http://mlsys.org/api/miniconf/users/21084?format=json", "institution": "Copenhagen University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: ML for Systems", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3762", "url": null, "sourceid": -130, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T14:15:00-07:00", "endtime": "2026-05-20T14:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3688?format=json", "parent_id": 3688, "eventmedia": [{"id": 1160, "modified": "2026-05-16T06:05:45.807951-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3762.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3539?format=json"], "related_events_ids": [3539]}, {"id": 3637, "uid": "642e92efb79421734881b53e1e1b18b6", "name": "veScale-FSDP: Flexible and High-Performance FSDP at Scale", "authors": [{"id": 27954, "fullname": "Zezhou Wang", "url": "http://mlsys.org/api/miniconf/users/27954?format=json", "institution": "University of Washington"}, {"id": 27955, "fullname": "Youjie Li", "url": "http://mlsys.org/api/miniconf/users/27955?format=json", "institution": "ByteDance Seed, veScale"}, {"id": 27956, "fullname": "Zhiqi Lin", "url": "http://mlsys.org/api/miniconf/users/27956?format=json", "institution": "ByteDance Inc."}, {"id": 27957, "fullname": "Jiacheng Yang", "url": "http://mlsys.org/api/miniconf/users/27957?format=json", "institution": "ByteDance Inc."}, {"id": 27958, "fullname": "Cong Xie", "url": "http://mlsys.org/api/miniconf/users/27958?format=json", "institution": "ByteDance"}, {"id": 27959, "fullname": "Guanyu Feng", "url": "http://mlsys.org/api/miniconf/users/27959?format=json", "institution": null}, {"id": 27960, "fullname": "ZHENG ZHONG", "url": "http://mlsys.org/api/miniconf/users/27960?format=json", "institution": "Bytedance"}, {"id": 27961, "fullname": "Ziyue Huang", "url": "http://mlsys.org/api/miniconf/users/27961?format=json", "institution": ""}, {"id": 27962, "fullname": "Hongyu Zhu", "url": "http://mlsys.org/api/miniconf/users/27962?format=json", "institution": "ByteDance Inc."}, {"id": 27963, "fullname": "Zhi Zhang", "url": "http://mlsys.org/api/miniconf/users/27963?format=json", "institution": "ByteDance Inc."}, {"id": 27964, "fullname": "Yanghua Peng", "url": "http://mlsys.org/api/miniconf/users/27964?format=json", "institution": "ByteDance Inc."}, {"id": 20969, "fullname": "Xin Liu", "url": "http://mlsys.org/api/miniconf/users/20969?format=json", "institution": "ByteDance Inc."}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3637", "url": null, "sourceid": 48, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=3Lj8R0F48P", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 931, "modified": "2026-03-23T21:52:48.342230-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=3Lj8R0F48P", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "25", "related_events": ["http://mlsys.org/api/miniconf/events/3860?format=json"], "related_events_ids": [3860]}, {"id": 3844, "uid": "1afa34a7f984eeabdbb0a7d494132ee5", "name": "OPKV: A High-Throughput Plugin-Driven Framework for Recallable Sparsity in Paged KV Cache Systems", "authors": [{"id": 27839, "fullname": "Huazheng Lao", "url": "http://mlsys.org/api/miniconf/users/27839?format=json", "institution": "Southeast University"}, {"id": 25856, "fullname": "Xiaofeng Li", "url": "http://mlsys.org/api/miniconf/users/25856?format=json", "institution": "Southeast University"}, {"id": 25589, "fullname": "Rui Xu", "url": "http://mlsys.org/api/miniconf/users/25589?format=json", "institution": ""}, {"id": 25641, "fullname": "Long Chen", "url": "http://mlsys.org/api/miniconf/users/25641?format=json", "institution": "Southeast University"}, {"id": 27840, "fullname": "Xia Zhu", "url": "http://mlsys.org/api/miniconf/users/27840?format=json", "institution": "Southeast University"}, {"id": 27841, "fullname": "Jinquan Zhang", "url": "http://mlsys.org/api/miniconf/users/27841?format=json", "institution": null}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 3", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3844", "url": null, "sourceid": -131, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T13:45:00-07:00", "endtime": "2026-05-20T14:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3687?format=json", "parent_id": 3687, "eventmedia": [{"id": 1081, "modified": "2026-05-16T08:30:32.604175-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3844_RqcbN0P.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3621?format=json"], "related_events_ids": [3621]}, {"id": 3518, "uid": "812b4ba287f5ee0bc9d43bbf5bbe87fb", "name": "Blueprint, Bootstrap, and Bridge: A Security Look at NVIDIA GPU Confidential Computing", "authors": [{"id": 27206, "fullname": "Zhongshu Gu", "url": "http://mlsys.org/api/miniconf/users/27206?format=json", "institution": "IBM Research"}, {"id": 27207, "fullname": "Enriquillo Valdez", "url": "http://mlsys.org/api/miniconf/users/27207?format=json", "institution": null}, {"id": 27208, "fullname": "Salman Ahmed", "url": "http://mlsys.org/api/miniconf/users/27208?format=json", "institution": "IBM"}, {"id": 27209, "fullname": "Julian James stephen", "url": "http://mlsys.org/api/miniconf/users/27209?format=json", "institution": "IBM"}, {"id": 27210, "fullname": "Michael Le", "url": "http://mlsys.org/api/miniconf/users/27210?format=json", "institution": null}, {"id": 27211, "fullname": "Hani Jamjoom", "url": "http://mlsys.org/api/miniconf/users/27211?format=json", "institution": null}, {"id": 27212, "fullname": "Shixuan Zhao", "url": "http://mlsys.org/api/miniconf/users/27212?format=json", "institution": "The Ohio State University"}, {"id": 27213, "fullname": "Zhiqiang Lin", "url": "http://mlsys.org/api/miniconf/users/27213?format=json", "institution": "Ohio State University, Columbus"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3518", "url": null, "sourceid": 95, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=t9RDCO1aL7", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 812, "modified": "2026-03-23T21:52:43.587993-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=t9RDCO1aL7", "resourcetype": "UriEventmedia"}, {"id": 1038, "file": "/media/PosterPDFs/MLSys%202026/3518-thumb.png", "modified": "2026-05-14T08:06:57.011110-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1037, "file": "/media/PosterPDFs/MLSys%202026/3518.png", "modified": "2026-05-14T08:06:56.880293-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "34", "related_events": ["http://mlsys.org/api/miniconf/events/3741?format=json"], "related_events_ids": [3741]}, {"id": 3745, "uid": "c16a5320fa475530d9583c34fd356ef5", "name": "Scaling Up Large Language Models Serving Systems for Semantic Job Search", "authors": [{"id": 27235, "fullname": "Kayhan Behdin", "url": "http://mlsys.org/api/miniconf/users/27235?format=json", "institution": "LinkedIn"}, {"id": 19093, "fullname": "Qingquan Song", "url": "http://mlsys.org/api/miniconf/users/19093?format=json", "institution": null}, {"id": 25809, "fullname": "Sriram Vasudevan", "url": "http://mlsys.org/api/miniconf/users/25809?format=json", "institution": "LinkedIn Corporation"}, {"id": 27236, "fullname": "Jian Sheng", "url": "http://mlsys.org/api/miniconf/users/27236?format=json", "institution": "LinkedIn"}, {"id": 27237, "fullname": "Xiaojing Ma", "url": "http://mlsys.org/api/miniconf/users/27237?format=json", "institution": "LinkedIn"}, {"id": 27238, "fullname": "Zhengze Zhou", "url": "http://mlsys.org/api/miniconf/users/27238?format=json", "institution": "LinkedIn"}, {"id": 26224, "fullname": "Chuanrui Zhu", "url": "http://mlsys.org/api/miniconf/users/26224?format=json", "institution": "LinkedIn"}, {"id": 27239, "fullname": "Guoyao Li", "url": "http://mlsys.org/api/miniconf/users/27239?format=json", "institution": "xAI"}, {"id": 19228, "fullname": "Chanh Nguyen", "url": "http://mlsys.org/api/miniconf/users/19228?format=json", "institution": "LinkedIn"}, {"id": 27240, "fullname": "Sayan Ghosh", "url": "http://mlsys.org/api/miniconf/users/27240?format=json", "institution": null}, {"id": 27241, "fullname": "Hejian Sang", "url": "http://mlsys.org/api/miniconf/users/27241?format=json", "institution": "LinkedIn"}, {"id": 24223, "fullname": "Ata Fatahi", "url": "http://mlsys.org/api/miniconf/users/24223?format=json", "institution": "LinkedIn Inc"}, {"id": 27242, "fullname": "Sundara Ramachandran", "url": "http://mlsys.org/api/miniconf/users/27242?format=json", "institution": null}, {"id": 27243, "fullname": "Xiaoqing Wang", "url": "http://mlsys.org/api/miniconf/users/27243?format=json", "institution": "LinkedIn"}, {"id": 26222, "fullname": "Qing Lan", "url": "http://mlsys.org/api/miniconf/users/26222?format=json", "institution": "LinkedIn"}, {"id": 27244, "fullname": "Vinay S", "url": "http://mlsys.org/api/miniconf/users/27244?format=json", "institution": null}, {"id": 27245, "fullname": "Qi Guo", "url": "http://mlsys.org/api/miniconf/users/27245?format=json", "institution": "LinkedIn"}, {"id": 27246, "fullname": "Caleb Johnson", "url": "http://mlsys.org/api/miniconf/users/27246?format=json", "institution": "University of Illinois at Urbana-Champaign"}, {"id": 17756, "fullname": "Zhipeng Wang", "url": "http://mlsys.org/api/miniconf/users/17756?format=json", "institution": "LinkedIn Corporation"}, {"id": 27247, "fullname": "Fedor Borisyuk", "url": "http://mlsys.org/api/miniconf/users/27247?format=json", "institution": null}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: LLM Serving 6", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3745", "url": null, "sourceid": -31, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T14:00:00-07:00", "endtime": "2026-05-21T14:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3709?format=json", "parent_id": 3709, "eventmedia": [{"id": 1238, "modified": "2026-05-20T01:16:05.016248-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3745_jivse2G.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3522?format=json"], "related_events_ids": [3522]}, {"id": 3741, "uid": "812b4ba287f5ee0bc9d43bbf5bbe87fb", "name": "Blueprint, Bootstrap, and Bridge: A Security Look at NVIDIA GPU Confidential Computing", "authors": [{"id": 27206, "fullname": "Zhongshu Gu", "url": "http://mlsys.org/api/miniconf/users/27206?format=json", "institution": "IBM Research"}, {"id": 27207, "fullname": "Enriquillo Valdez", "url": "http://mlsys.org/api/miniconf/users/27207?format=json", "institution": null}, {"id": 27208, "fullname": "Salman Ahmed", "url": "http://mlsys.org/api/miniconf/users/27208?format=json", "institution": "IBM"}, {"id": 27209, "fullname": "Julian James stephen", "url": "http://mlsys.org/api/miniconf/users/27209?format=json", "institution": "IBM"}, {"id": 27210, "fullname": "Michael Le", "url": "http://mlsys.org/api/miniconf/users/27210?format=json", "institution": null}, {"id": 27211, "fullname": "Hani Jamjoom", "url": "http://mlsys.org/api/miniconf/users/27211?format=json", "institution": null}, {"id": 27212, "fullname": "Shixuan Zhao", "url": "http://mlsys.org/api/miniconf/users/27212?format=json", "institution": "The Ohio State University"}, {"id": 27213, "fullname": "Zhiqiang Lin", "url": "http://mlsys.org/api/miniconf/users/27213?format=json", "institution": "Ohio State University, Columbus"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Security and Privacy", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3741", "url": null, "sourceid": -95, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T17:30:00-07:00", "endtime": "2026-05-19T17:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3673?format=json", "parent_id": 3673, "eventmedia": [{"id": 1034, "modified": "2026-05-14T07:38:44.096957-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3741.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3518?format=json"], "related_events_ids": [3518]}, {"id": 3835, "uid": "45c48cce2e2d7fbdea1afc51c7c6ad26", "name": "When Enough is Enough: Rank-Aware Early Termination for Vector Search", "authors": [{"id": 27807, "fullname": "Jianan Lu", "url": "http://mlsys.org/api/miniconf/users/27807?format=json", "institution": "Princeton University"}, {"id": 11918, "fullname": "Asaf Cidon", "url": "http://mlsys.org/api/miniconf/users/11918?format=json", "institution": "Columbia University"}, {"id": 11221, "fullname": "Michael None Freedman", "url": "http://mlsys.org/api/miniconf/users/11221?format=json", "institution": "Princeton University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Agentic AI 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3835", "url": null, "sourceid": -9, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T13:30:00-07:00", "endtime": "2026-05-19T13:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3668?format=json", "parent_id": 3668, "eventmedia": [{"id": 1074, "modified": "2026-05-15T19:33:08.591136-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3835_aLQTTRb.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3612?format=json"], "related_events_ids": [3612]}, {"id": 3836, "uid": "8e296a067a37563370ded05f5a3bf3ec", "name": "ReSpec: Towards Optimizing Speculative Decoding in Reinforcement Learning Systems", "authors": [{"id": 27808, "fullname": "Qiaoling Chen", "url": "http://mlsys.org/api/miniconf/users/27808?format=json", "institution": "Nanyang Technological University"}, {"id": 25950, "fullname": "Zijun Liu", "url": "http://mlsys.org/api/miniconf/users/25950?format=json", "institution": "Tsinghua University"}, {"id": 27809, "fullname": "Peng Sun", "url": "http://mlsys.org/api/miniconf/users/27809?format=json", "institution": "Harbin Institute of Technology"}, {"id": 27810, "fullname": "Shenggui Li", "url": "http://mlsys.org/api/miniconf/users/27810?format=json", "institution": "Nanyang Technological University"}, {"id": 27811, "fullname": "Guoteng Wang", "url": "http://mlsys.org/api/miniconf/users/27811?format=json", "institution": "Shanghai Artificial Intelligence Laboratory"}, {"id": 17655, "fullname": "Ziming Liu", "url": "http://mlsys.org/api/miniconf/users/17655?format=json", "institution": "national university of singaore, National University of Singapore"}, {"id": 20910, "fullname": "Yonggang Wen", "url": "http://mlsys.org/api/miniconf/users/20910?format=json", "institution": "Nanyang Technological University"}, {"id": 27812, "fullname": "Siyuan Feng", "url": "http://mlsys.org/api/miniconf/users/27812?format=json", "institution": "Shanghai Innovation Institute"}, {"id": 20894, "fullname": "Tianwei Zhang", "url": "http://mlsys.org/api/miniconf/users/20894?format=json", "institution": "Nanyang Technological University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3836", "url": null, "sourceid": -25, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T15:15:00-07:00", "endtime": "2026-05-20T15:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3692?format=json", "parent_id": 3692, "eventmedia": [{"id": 1161, "modified": "2026-05-16T08:48:24.585440-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3836.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3613?format=json"], "related_events_ids": [3613]}, {"id": 3732, "uid": "02e74f10e0327ad868d138f2b4fdd6f0", "name": "From Tokens to Layers: Redefining Stall-Free Scheduling for MoE Serving with Layered Prefill", "authors": [{"id": 26188, "fullname": "Gunjun Lee", "url": "http://mlsys.org/api/miniconf/users/26188?format=json", "institution": "Seoul National University"}, {"id": 27174, "fullname": "Jiwon Kim", "url": "http://mlsys.org/api/miniconf/users/27174?format=json", "institution": null}, {"id": 27175, "fullname": "Jaiyoung Park", "url": "http://mlsys.org/api/miniconf/users/27175?format=json", "institution": null}, {"id": 27176, "fullname": "Younjoo Lee", "url": "http://mlsys.org/api/miniconf/users/27176?format=json", "institution": "Seoul National University"}, {"id": 27177, "fullname": "Jung Ho Ahn", "url": "http://mlsys.org/api/miniconf/users/27177?format=json", "institution": "Seoul National University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3732", "url": null, "sourceid": -27, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T15:45:00-07:00", "endtime": "2026-05-19T16:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3675?format=json", "parent_id": 3675, "eventmedia": [{"id": 1073, "modified": "2026-05-16T09:59:20.708855-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3732_cXYJO0z.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3509?format=json"], "related_events_ids": [3509]}, {"id": 3804, "uid": "42a0e188f5033bc65bf8d78622277c4e", "name": "A Lightweight High-Throughput Collective-Capable NoC for Large-Scale ML Accelerators", "authors": [{"id": 25644, "fullname": "Luca Colagrande", "url": "http://mlsys.org/api/miniconf/users/25644?format=json", "institution": "ETH Zurich"}, {"id": 25669, "fullname": "Lorenzo Leone", "url": "http://mlsys.org/api/miniconf/users/25669?format=json", "institution": "ETH Zurich"}, {"id": 27638, "fullname": "Chen Wu", "url": "http://mlsys.org/api/miniconf/users/27638?format=json", "institution": "ETH Zurich"}, {"id": 27639, "fullname": "Tim Fischer", "url": "http://mlsys.org/api/miniconf/users/27639?format=json", "institution": null}, {"id": 27640, "fullname": "Raphael Roth", "url": "http://mlsys.org/api/miniconf/users/27640?format=json", "institution": null}, {"id": 21010, "fullname": "Luca Benini", "url": "http://mlsys.org/api/miniconf/users/21010?format=json", "institution": "ETHZ - ETH Zurich"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 3", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3804", "url": null, "sourceid": -136, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T17:45:00-07:00", "endtime": "2026-05-20T18:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3695?format=json", "parent_id": 3695, "eventmedia": [{"id": 1029, "modified": "2026-05-20T09:10:51.945587-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3804_dj4EVAy.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3581?format=json"], "related_events_ids": [3581]}, {"id": 3789, "uid": "65ded5353c5ee48d0b7d48c591b8f430", "name": "PRISM: Parametrically Refactor Inference for Speculative Decoding Draft Models", "authors": [{"id": 28462, "fullname": "Xuliang Wang", "url": "http://mlsys.org/api/miniconf/users/28462?format=json", "institution": "University of Waterloo"}, {"id": 27581, "fullname": "Yuetao Chen", "url": "http://mlsys.org/api/miniconf/users/27581?format=json", "institution": "The Chinese University of Hong Kong"}, {"id": 27582, "fullname": "Maochan Zhen", "url": "http://mlsys.org/api/miniconf/users/27582?format=json", "institution": "Central China Institute of Artificial Intelligence"}, {"id": 27583, "fullname": "Fang LIU", "url": "http://mlsys.org/api/miniconf/users/27583?format=json", "institution": "CIAI"}, {"id": 27584, "fullname": "Xinzhou Zheng", "url": "http://mlsys.org/api/miniconf/users/27584?format=json", "institution": "University of Science and Technology of China"}, {"id": 27585, "fullname": "Xingwu Liu", "url": "http://mlsys.org/api/miniconf/users/27585?format=json", "institution": "Dalian University of Technology"}, {"id": 27586, "fullname": "Hong Xu", "url": "http://mlsys.org/api/miniconf/users/27586?format=json", "institution": "The Chinese University of Hong Kong"}, {"id": 27587, "fullname": "Ming Li", "url": "http://mlsys.org/api/miniconf/users/27587?format=json", "institution": "University of Waterloo"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 5", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3789", "url": null, "sourceid": -132, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T08:30:00-07:00", "endtime": "2026-05-21T08:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3701?format=json", "parent_id": 3701, "eventmedia": [{"id": 1128, "modified": "2026-05-15T19:51:39.670560-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3789.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3566?format=json"], "related_events_ids": [3566]}, {"id": 3758, "uid": "ad61ab143223efbc24c7d2583be69251", "name": "SAKURAONE: An Open Ethernet\u2013Based AI HPC System and Its Observed Workload Dynamics in a Single-Tenant LLM Development Environment", "authors": [{"id": 27145, "fullname": "Fumikazu KONISHI", "url": "http://mlsys.org/api/miniconf/users/27145?format=json", "institution": "SAKURA internet inc."}, {"id": 26137, "fullname": "Yuuki Tsubouchi", "url": "http://mlsys.org/api/miniconf/users/26137?format=json", "institution": "SAKURA internet Inc."}, {"id": 25979, "fullname": "Hirofumi Tsuruta", "url": "http://mlsys.org/api/miniconf/users/25979?format=json", "institution": "SAKURA internet Inc."}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Benchmarks and Evaluation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3758", "url": null, "sourceid": -74, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T17:00:00-07:00", "endtime": "2026-05-21T17:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3717?format=json", "parent_id": 3717, "eventmedia": [{"id": 1066, "modified": "2026-05-15T07:21:59.426414-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3758_d2pso2Y.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3535?format=json"], "related_events_ids": [3535]}, {"id": 3859, "uid": "26657d5ff9020d2abefe558796b99584", "name": "Zorse: Optimizing LLM Training Efficiency on Heterogeneous GPU Clusters", "authors": [{"id": 14867, "fullname": "Runsheng Guo", "url": "http://mlsys.org/api/miniconf/users/14867?format=json", "institution": "OpenAI"}, {"id": 27952, "fullname": "Utkarsh Anand", "url": "http://mlsys.org/api/miniconf/users/27952?format=json", "institution": "University of Waterloo"}, {"id": 14868, "fullname": "Khuzaima Daudjee", "url": "http://mlsys.org/api/miniconf/users/14868?format=json", "institution": "University of Waterloo"}, {"id": 27953, "fullname": "Rathijit Sen", "url": "http://mlsys.org/api/miniconf/users/27953?format=json", "institution": "Microsoft"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 3", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3859", "url": null, "sourceid": -96, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T17:00:00-07:00", "endtime": "2026-05-20T17:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3695?format=json", "parent_id": 3695, "eventmedia": [{"id": 1026, "modified": "2026-05-14T02:16:21.631110-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3859.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3636?format=json"], "related_events_ids": [3636]}, {"id": 3735, "uid": "2a38a4a9316c49e5a833517c45d31070", "name": "HipKittens: Fast and Furious AMD Kernels", "authors": [{"id": 27186, "fullname": "William Hu", "url": "http://mlsys.org/api/miniconf/users/27186?format=json", "institution": "Stanford University"}, {"id": 25851, "fullname": "Drew Wadsworth", "url": "http://mlsys.org/api/miniconf/users/25851?format=json", "institution": ""}, {"id": 27187, "fullname": "Sean Siddens", "url": "http://mlsys.org/api/miniconf/users/27187?format=json", "institution": "AMD"}, {"id": 27188, "fullname": "Stanley Winata", "url": "http://mlsys.org/api/miniconf/users/27188?format=json", "institution": null}, {"id": 27189, "fullname": "Daniel Fu", "url": "http://mlsys.org/api/miniconf/users/27189?format=json", "institution": "University of California, San Diego"}, {"id": 27190, "fullname": "Ryan Swann", "url": "http://mlsys.org/api/miniconf/users/27190?format=json", "institution": "AMD"}, {"id": 27191, "fullname": "Muhammad Osama", "url": "http://mlsys.org/api/miniconf/users/27191?format=json", "institution": "AMD"}, {"id": 11444, "fullname": "Christopher R\u00e9", "url": "http://mlsys.org/api/miniconf/users/11444?format=json", "institution": "Stanford University"}, {"id": 27192, "fullname": "Simran Arora", "url": "http://mlsys.org/api/miniconf/users/27192?format=json", "institution": "Computer Science Department, Stanford University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Compilers and Kernels", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3735", "url": null, "sourceid": -88, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T17:45:00-07:00", "endtime": "2026-05-21T18:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3718?format=json", "parent_id": 3718, "eventmedia": [{"id": 1134, "modified": "2026-05-15T22:05:04.779143-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3735.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3512?format=json"], "related_events_ids": [3512]}, {"id": 3747, "uid": "3416a75f4cea9109507cacd8e2f2aefc", "name": "Using Span Queries to Optimize Cache and Attention Locality", "authors": [{"id": 27258, "fullname": "Paul Castro", "url": "http://mlsys.org/api/miniconf/users/27258?format=json", "institution": "International Business Machines"}, {"id": 25924, "fullname": "Nick Mitchell", "url": "http://mlsys.org/api/miniconf/users/25924?format=json", "institution": "IBM Research"}, {"id": 27989, "fullname": "Nathan Ordonez", "url": "http://mlsys.org/api/miniconf/users/27989?format=json", "institution": "IBM Research"}, {"id": 27260, "fullname": "Thomas Parnell", "url": "http://mlsys.org/api/miniconf/users/27260?format=json", "institution": "IBM Research"}, {"id": 27261, "fullname": "Mudhakar Srivatsa", "url": "http://mlsys.org/api/miniconf/users/27261?format=json", "institution": "International Business Machines"}, {"id": 27262, "fullname": "Antoni Viros i Martin", "url": "http://mlsys.org/api/miniconf/users/27262?format=json", "institution": "International Business Machines"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 3", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3747", "url": null, "sourceid": -41, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T14:30:00-07:00", "endtime": "2026-05-20T14:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3687?format=json", "parent_id": 3687, "eventmedia": [{"id": 1079, "modified": "2026-05-18T12:32:42.070911-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3747_FfJdljm.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3524?format=json"], "related_events_ids": [3524]}, {"id": 3642, "uid": "6364d3f0f495b6ab9dcf8d3b5c6e0b01", "name": "OSWorld-Human: Benchmarking the Efficiency of Computer-Use Agents", "authors": [{"id": 27412, "fullname": "Reyna Abhyankar", "url": "http://mlsys.org/api/miniconf/users/27412?format=json", "institution": "Together AI"}, {"id": 27985, "fullname": "Qi Qi", "url": "http://mlsys.org/api/miniconf/users/27985?format=json", "institution": "University of California, San Diego"}, {"id": 26292, "fullname": "Yiying Zhang", "url": "http://mlsys.org/api/miniconf/users/26292?format=json", "institution": "UCSD and GenseeAI"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3642", "url": null, "sourceid": 32, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=0Cp8l6cvyq", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 936, "modified": "2026-03-23T21:52:48.518354-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=0Cp8l6cvyq", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "5", "related_events": ["http://mlsys.org/api/miniconf/events/3865?format=json"], "related_events_ids": [3865]}, {"id": 3801, "uid": "4e732ced3463d06de0ca9a15b6153677", "name": "Privatar: Scalable Privacy-preserving Multi-user VR via Secure Offloading", "authors": [{"id": 13393, "fullname": "Jianming Tong", "url": "http://mlsys.org/api/miniconf/users/13393?format=json", "institution": "Georgia Tech/Google"}, {"id": 27626, "fullname": "Hanshen Xiao", "url": "http://mlsys.org/api/miniconf/users/27626?format=json", "institution": "Purdue University"}, {"id": 27627, "fullname": "Krishna Nair", "url": "http://mlsys.org/api/miniconf/users/27627?format=json", "institution": null}, {"id": 19218, "fullname": "Hao Kang", "url": "http://mlsys.org/api/miniconf/users/19218?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27628, "fullname": "Ashish Sirasao", "url": "http://mlsys.org/api/miniconf/users/27628?format=json", "institution": "Amd inc"}, {"id": 27629, "fullname": "Ziqi Zhang", "url": "http://mlsys.org/api/miniconf/users/27629?format=json", "institution": "University of Illinois at Urbana-Champaign"}, {"id": 27630, "fullname": "G. Edward Suh", "url": "http://mlsys.org/api/miniconf/users/27630?format=json", "institution": "NVIDIA"}, {"id": 11662, "fullname": "Tushar Krishna", "url": "http://mlsys.org/api/miniconf/users/11662?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Security and Privacy", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3801", "url": null, "sourceid": -26, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T17:00:00-07:00", "endtime": "2026-05-19T17:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3673?format=json", "parent_id": 3673, "eventmedia": [{"id": 1131, "modified": "2026-05-20T09:31:22.541708-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3801_3ox1dQR.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3578?format=json"], "related_events_ids": [3578]}, {"id": 3819, "uid": "202cb962ac59075b964b07152d234b70", "name": "Beyond the Buzz: A Pragmatic Take on Inference Disaggregation", "authors": [{"id": 27700, "fullname": "Tiyasa Mitra", "url": "http://mlsys.org/api/miniconf/users/27700?format=json", "institution": "NVIDIA"}, {"id": 27701, "fullname": "Ritika Borkar", "url": "http://mlsys.org/api/miniconf/users/27701?format=json", "institution": "NVIDIA"}, {"id": 27702, "fullname": "Nidhi Bhatia", "url": "http://mlsys.org/api/miniconf/users/27702?format=json", "institution": "NVIDIA Corporation"}, {"id": 27703, "fullname": "Shivam Raj", "url": "http://mlsys.org/api/miniconf/users/27703?format=json", "institution": "NVIDIA"}, {"id": 25864, "fullname": "hongkuan zhou", "url": "http://mlsys.org/api/miniconf/users/25864?format=json", "institution": "Nvidia"}, {"id": 27704, "fullname": "Yan Ru Pei", "url": "http://mlsys.org/api/miniconf/users/27704?format=json", "institution": "NVIDIA"}, {"id": 27705, "fullname": "Vishwanath Venkatesan", "url": "http://mlsys.org/api/miniconf/users/27705?format=json", "institution": null}, {"id": 27706, "fullname": "Kyle Kranen", "url": "http://mlsys.org/api/miniconf/users/27706?format=json", "institution": "NVIDIA"}, {"id": 27707, "fullname": "Ramon Matas", "url": "http://mlsys.org/api/miniconf/users/27707?format=json", "institution": "NVIDIA"}, {"id": 18519, "fullname": "Dheevatsa Mudigere", "url": "http://mlsys.org/api/miniconf/users/18519?format=json", "institution": "NVIDIA"}, {"id": 27708, "fullname": "Ritchie Zhao", "url": "http://mlsys.org/api/miniconf/users/27708?format=json", "institution": "NVIDIA"}, {"id": 27709, "fullname": "Maximilian Golub", "url": "http://mlsys.org/api/miniconf/users/27709?format=json", "institution": "NVIDIA"}, {"id": 27710, "fullname": "Arpan Dutta", "url": "http://mlsys.org/api/miniconf/users/27710?format=json", "institution": "NVIDIA"}, {"id": 27711, "fullname": "Suresh Nambi", "url": "http://mlsys.org/api/miniconf/users/27711?format=json", "institution": null}, {"id": 27712, "fullname": "Sailaja Madduri", "url": "http://mlsys.org/api/miniconf/users/27712?format=json", "institution": "NVIDIA"}, {"id": 27713, "fullname": "Dharmesh Jani", "url": "http://mlsys.org/api/miniconf/users/27713?format=json", "institution": "NVIDIA"}, {"id": 27714, "fullname": "Brian Pharris", "url": "http://mlsys.org/api/miniconf/users/27714?format=json", "institution": "NVIDIA"}, {"id": 27715, "fullname": "Itay Neeman", "url": "http://mlsys.org/api/miniconf/users/27715?format=json", "institution": "NVIDIA"}, {"id": 27716, "fullname": "Bita Darvish Rouhani", "url": "http://mlsys.org/api/miniconf/users/27716?format=json", "institution": "NVIDIA"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: LLM Serving 6", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3819", "url": null, "sourceid": -123, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T13:15:00-07:00", "endtime": "2026-05-21T13:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3709?format=json", "parent_id": 3709, "eventmedia": [{"id": 1129, "modified": "2026-05-20T22:48:36.647235-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3819_593EcQk.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3596?format=json"], "related_events_ids": [3596]}, {"id": 3632, "uid": "35f4a8d465e6e1edc05f3d8ab658c551", "name": "VeriMoA: A Mixture-of-Agents Framework for Spec-to-HDL Generation", "authors": [{"id": 27902, "fullname": "Heng Ping", "url": "http://mlsys.org/api/miniconf/users/27902?format=json", "institution": "University of Southern California"}, {"id": 27903, "fullname": "Arijit Bhattacharjee", "url": "http://mlsys.org/api/miniconf/users/27903?format=json", "institution": "Iowa State University"}, {"id": 27904, "fullname": "Peiyu Zhang", "url": "http://mlsys.org/api/miniconf/users/27904?format=json", "institution": "University of Southern California"}, {"id": 27905, "fullname": "Shixuan Li", "url": "http://mlsys.org/api/miniconf/users/27905?format=json", "institution": "University of Southern California"}, {"id": 27906, "fullname": "Wei Yang", "url": "http://mlsys.org/api/miniconf/users/27906?format=json", "institution": "University of Southern California"}, {"id": 27907, "fullname": "Anzhe Cheng", "url": "http://mlsys.org/api/miniconf/users/27907?format=json", "institution": "University of Southern California"}, {"id": 27908, "fullname": "Xiaole Zhang", "url": "http://mlsys.org/api/miniconf/users/27908?format=json", "institution": "University of Southern California"}, {"id": 27909, "fullname": "Jesse Thomason", "url": "http://mlsys.org/api/miniconf/users/27909?format=json", "institution": "University of Southern California"}, {"id": 15789, "fullname": "Ali Jannesari", "url": "http://mlsys.org/api/miniconf/users/15789?format=json", "institution": "Iowa State University"}, {"id": 27910, "fullname": "Nesreen Ahmed", "url": "http://mlsys.org/api/miniconf/users/27910?format=json", "institution": "Cisco"}, {"id": 11952, "fullname": "Paul Bogdan", "url": "http://mlsys.org/api/miniconf/users/11952?format=json", "institution": "USC"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3632", "url": null, "sourceid": 78, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=5wgZXJ0kWA", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 926, "modified": "2026-03-23T21:52:48.099852-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=5wgZXJ0kWA", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "7", "related_events": ["http://mlsys.org/api/miniconf/events/3855?format=json"], "related_events_ids": [3855]}, {"id": 3754, "uid": "93db85ed909c13838ff95ccfa94cebd9", "name": "Efficient Long-Context Language Model Training by Core Attention Disaggregation", "authors": [{"id": 28964, "fullname": "Yonghao Zhuang", "url": "http://mlsys.org/api/miniconf/users/28964?format=json", "institution": "CMU, Carnegie Mellon University"}, {"id": 17900, "fullname": "Junda Chen", "url": "http://mlsys.org/api/miniconf/users/17900?format=json", "institution": "University of California San Diego"}, {"id": 27317, "fullname": "Bo Pang", "url": "http://mlsys.org/api/miniconf/users/27317?format=json", "institution": null}, {"id": 27318, "fullname": "Yi Gu", "url": "http://mlsys.org/api/miniconf/users/27318?format=json", "institution": "University of California, San Diego"}, {"id": 27319, "fullname": "Yibo Zhu", "url": "http://mlsys.org/api/miniconf/users/27319?format=json", "institution": "StepFun"}, {"id": 27320, "fullname": "Yimin Jiang", "url": "http://mlsys.org/api/miniconf/users/27320?format=json", "institution": "Anuttacon"}, {"id": 11118, "fullname": "Ion Stoica", "url": "http://mlsys.org/api/miniconf/users/11118?format=json", "institution": "UC Berkeley"}, {"id": 27321, "fullname": "Hao Zhang", "url": "http://mlsys.org/api/miniconf/users/27321?format=json", "institution": "University of California, San Diego"}, {"id": 16300, "fullname": "Eric Xing", "url": "http://mlsys.org/api/miniconf/users/16300?format=json", "institution": "MBZUAI, CMU, and Petuum Inc."}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3754", "url": "https://github.com/hao-ai-lab/DistCA", "sourceid": -86, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T09:45:00-07:00", "endtime": "2026-05-20T10:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3679?format=json", "parent_id": 3679, "eventmedia": [{"id": 1239, "modified": "2026-05-20T09:32:22.907608-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3754.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3531?format=json"], "related_events_ids": [3531]}, {"id": 3612, "uid": "45c48cce2e2d7fbdea1afc51c7c6ad26", "name": "When Enough is Enough: Rank-Aware Early Termination for Vector Search", "authors": [{"id": 27807, "fullname": "Jianan Lu", "url": "http://mlsys.org/api/miniconf/users/27807?format=json", "institution": "Princeton University"}, {"id": 11918, "fullname": "Asaf Cidon", "url": "http://mlsys.org/api/miniconf/users/11918?format=json", "institution": "Columbia University"}, {"id": 11221, "fullname": "Michael None Freedman", "url": "http://mlsys.org/api/miniconf/users/11221?format=json", "institution": "Princeton University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3612", "url": null, "sourceid": 9, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=IFz0pROwF1", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 906, "modified": "2026-03-23T21:52:47.283768-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=IFz0pROwF1", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "9", "related_events": ["http://mlsys.org/api/miniconf/events/3835?format=json"], "related_events_ids": [3835]}, {"id": 3838, "uid": "76dc611d6ebaafc66cc0879c71b5db5c", "name": "FlexiCache: Leveraging Temporal Stability of Attention Heads for Efficient KV Cache Management", "authors": [{"id": 26134, "fullname": "Nazmul Takbir", "url": "http://mlsys.org/api/miniconf/users/26134?format=json", "institution": "University of California Irvine"}, {"id": 27819, "fullname": "Hamidreza Alikhani Koshkak", "url": "http://mlsys.org/api/miniconf/users/27819?format=json", "institution": "University of California, Irvine"}, {"id": 27820, "fullname": "Nikil Dutt", "url": "http://mlsys.org/api/miniconf/users/27820?format=json", "institution": "University of California, Irvine"}, {"id": 11050, "fullname": "Sangeetha Abdu Jyothi", "url": "http://mlsys.org/api/miniconf/users/11050?format=json", "institution": "UC Irvine / Amazon"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 3", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3838", "url": null, "sourceid": -128, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T14:00:00-07:00", "endtime": "2026-05-20T14:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3687?format=json", "parent_id": 3687, "eventmedia": [{"id": 1067, "modified": "2026-05-15T20:18:22.042860-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3838_zYgO11t.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3615?format=json"], "related_events_ids": [3615]}, {"id": 3820, "uid": "98dce83da57b0395e163467c9dae521b", "name": "Shannonic: Efficient Entropy-Optimal Compression for ML Workloads", "authors": [{"id": 17719, "fullname": "Kareem Ibrahim", "url": "http://mlsys.org/api/miniconf/users/17719?format=json", "institution": "University of Toronto"}, {"id": 28467, "fullname": "Mohammadjavad Maheronnaghsh", "url": "http://mlsys.org/api/miniconf/users/28467?format=json", "institution": "University of Toronto"}, {"id": 17666, "fullname": "Andreas Moshovos", "url": "http://mlsys.org/api/miniconf/users/17666?format=json", "institution": "University of Toronto"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Model Compression", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3820", "url": null, "sourceid": -93, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T17:15:00-07:00", "endtime": "2026-05-20T17:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3696?format=json", "parent_id": 3696, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3597?format=json"], "related_events_ids": [3597]}, {"id": 3550, "uid": "f457c545a9ded88f18ecee47145a72c0", "name": "SwiftGS: Algorithm and System Co-Optimization for Fast 3D Gaussian Splatting on GPUs", "authors": [{"id": 25558, "fullname": "Lingjun Gao", "url": "http://mlsys.org/api/miniconf/users/25558?format=json", "institution": "Imperial College London"}, {"id": 27429, "fullname": "Zhican Wang", "url": "http://mlsys.org/api/miniconf/users/27429?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 27430, "fullname": "Zhiwen Mo", "url": "http://mlsys.org/api/miniconf/users/27430?format=json", "institution": "Imperial College London"}, {"id": 27431, "fullname": "Hongxiang Fan", "url": "http://mlsys.org/api/miniconf/users/27431?format=json", "institution": "Imperial College London"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3550", "url": null, "sourceid": 49, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=i05mMLR9BX", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 844, "modified": "2026-03-23T21:52:44.827486-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=i05mMLR9BX", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "10", "related_events": ["http://mlsys.org/api/miniconf/events/3773?format=json"], "related_events_ids": [3773]}, {"id": 3600, "uid": "54229abfcfa5649e7003b83dd4755294", "name": "Optimizing PyTorch Inference with LLM-Based Multi-Agent Systems", "authors": [{"id": 27737, "fullname": "Kirill Nagaitsev", "url": "http://mlsys.org/api/miniconf/users/27737?format=json", "institution": "Northwestern University"}, {"id": 27738, "fullname": "Luka Grbcic", "url": "http://mlsys.org/api/miniconf/users/27738?format=json", "institution": "Lawrence Berkeley National Laboratory"}, {"id": 27739, "fullname": "Samuel Williams", "url": "http://mlsys.org/api/miniconf/users/27739?format=json", "institution": "Lawrence Berkeley National Lab"}, {"id": 27740, "fullname": "Costin Iancu", "url": "http://mlsys.org/api/miniconf/users/27740?format=json", "institution": "Ambassador University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3600", "url": null, "sourceid": 91, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=MJxhiX3sSd", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 894, "modified": "2026-03-23T21:52:46.841467-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=MJxhiX3sSd", "resourcetype": "UriEventmedia"}, {"id": 1094, "file": "/media/PosterPDFs/MLSys%202026/3600.png", "modified": "2026-05-15T12:58:38.670876-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1095, "file": "/media/PosterPDFs/MLSys%202026/3600-thumb.png", "modified": "2026-05-15T12:58:38.764167-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "11", "related_events": ["http://mlsys.org/api/miniconf/events/3823?format=json"], "related_events_ids": [3823]}, {"id": 3776, "uid": "069059b7ef840f0c74a814ec9237b6ec", "name": "FlexTrain: Scalable Hybrid-Parallel Training with Elastic Resource Utilization and Consistent Accuracy", "authors": [{"id": 25944, "fullname": "Weilin Cai", "url": "http://mlsys.org/api/miniconf/users/25944?format=json", "institution": "The Hong Kong University of Science and Technology (Guangzhou)"}, {"id": 27470, "fullname": "Diandian Gu", "url": "http://mlsys.org/api/miniconf/users/27470?format=json", "institution": "Bytedance Seed"}, {"id": 28455, "fullname": "Baoquan Zhong", "url": "http://mlsys.org/api/miniconf/users/28455?format=json", "institution": "Zhejiang University"}, {"id": 27471, "fullname": "Jun Wang", "url": "http://mlsys.org/api/miniconf/users/27471?format=json", "institution": "ByteDance Inc."}, {"id": 28456, "fullname": "Zhuolin Zheng", "url": "http://mlsys.org/api/miniconf/users/28456?format=json", "institution": "ByteDance Inc."}, {"id": 28457, "fullname": "Gaohong Liu", "url": "http://mlsys.org/api/miniconf/users/28457?format=json", "institution": "ByteDance Inc."}, {"id": 28458, "fullname": "Jiang Kaihua", "url": "http://mlsys.org/api/miniconf/users/28458?format=json", "institution": "University of Chinese Academy of Sciences"}, {"id": 28459, "fullname": "Shuguang Wang", "url": "http://mlsys.org/api/miniconf/users/28459?format=json", "institution": "Huazhong University of Science and Technology"}, {"id": 27472, "fullname": "Wencong Xiao", "url": "http://mlsys.org/api/miniconf/users/27472?format=json", "institution": null}, {"id": 19049, "fullname": "Jiayi Huang", "url": "http://mlsys.org/api/miniconf/users/19049?format=json", "institution": "HKUST(GZ)"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3776", "url": null, "sourceid": -126, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T16:15:00-07:00", "endtime": "2026-05-20T16:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3692?format=json", "parent_id": 3692, "eventmedia": [{"id": 1240, "modified": "2026-05-20T11:07:26.474565-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3776.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3553?format=json"], "related_events_ids": [3553]}, {"id": 3807, "uid": "c51ce410c124a10e0db5e4b97fc2af39", "name": "fabric-lib: RDMA Point-to-Point Communication for LLM Systems", "authors": [{"id": 27645, "fullname": "Nandor Licker", "url": "http://mlsys.org/api/miniconf/users/27645?format=json", "institution": "Perplexity AI"}, {"id": 23368, "fullname": "Kevin Hu", "url": "http://mlsys.org/api/miniconf/users/23368?format=json", "institution": "Perplexity AI"}, {"id": 23407, "fullname": "Vladimir Zaytsev", "url": "http://mlsys.org/api/miniconf/users/23407?format=json", "institution": "Perplexity AI"}, {"id": 21008, "fullname": "Lequn Chen", "url": "http://mlsys.org/api/miniconf/users/21008?format=json", "institution": "Perplexity AI"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 4", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3807", "url": null, "sourceid": -13, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T15:30:00-07:00", "endtime": "2026-05-20T15:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3691?format=json", "parent_id": 3691, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3584?format=json"], "related_events_ids": [3584]}, {"id": 3530, "uid": "f4b9ec30ad9f68f89b29639786cb62ef", "name": "Matrix: Peer-to-Peer Multi-Agent Synthetic Data Generation Framework", "authors": [{"id": 27301, "fullname": "Dong Wang", "url": "http://mlsys.org/api/miniconf/users/27301?format=json", "institution": "Meta FAIR"}, {"id": 27302, "fullname": "Yang Li", "url": "http://mlsys.org/api/miniconf/users/27302?format=json", "institution": "Facebook"}, {"id": 27303, "fullname": "Ansong Ni", "url": "http://mlsys.org/api/miniconf/users/27303?format=json", "institution": "Meta AI"}, {"id": 27304, "fullname": "Ching-Feng Yeh", "url": "http://mlsys.org/api/miniconf/users/27304?format=json", "institution": "Facebook"}, {"id": 27305, "fullname": "Youssef Emad", "url": "http://mlsys.org/api/miniconf/users/27305?format=json", "institution": "Facebook"}, {"id": 27306, "fullname": "Xinjie Lei", "url": "http://mlsys.org/api/miniconf/users/27306?format=json", "institution": "Meta"}, {"id": 27307, "fullname": "Liam Robbins", "url": "http://mlsys.org/api/miniconf/users/27307?format=json", "institution": "FAIR"}, {"id": 27308, "fullname": "Karthik Padthe", "url": "http://mlsys.org/api/miniconf/users/27308?format=json", "institution": "Meta AI"}, {"id": 27309, "fullname": "Hu Xu", "url": "http://mlsys.org/api/miniconf/users/27309?format=json", "institution": "FAIR, Foundation"}, {"id": 27310, "fullname": "Xian Li", "url": "http://mlsys.org/api/miniconf/users/27310?format=json", "institution": "Facebook AI"}, {"id": 27311, "fullname": "Asli Celikyilmaz", "url": "http://mlsys.org/api/miniconf/users/27311?format=json", "institution": "FAIR"}, {"id": 27312, "fullname": "Ramya Raghavendra", "url": "http://mlsys.org/api/miniconf/users/27312?format=json", "institution": "Facebook"}, {"id": 27313, "fullname": "LIFEI HUANG", "url": "http://mlsys.org/api/miniconf/users/27313?format=json", "institution": "Facebook"}, {"id": 27314, "fullname": "Carole-Jean Wu", "url": "http://mlsys.org/api/miniconf/users/27314?format=json", "institution": "Meta"}, {"id": 27315, "fullname": "Shang-Wen Li", "url": "http://mlsys.org/api/miniconf/users/27315?format=json", "institution": "Facebook"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3530", "url": null, "sourceid": 94, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=ok96wGyPdI", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 824, "modified": "2026-03-23T21:52:44.017842-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=ok96wGyPdI", "resourcetype": "UriEventmedia"}, {"id": 985, "file": "/media/PosterPDFs/MLSys%202026/3530.png", "modified": "2026-05-10T19:37:02.471082-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 986, "file": "/media/PosterPDFs/MLSys%202026/3530-thumb.png", "modified": "2026-05-10T19:37:02.531245-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "13", "related_events": ["http://mlsys.org/api/miniconf/events/3753?format=json"], "related_events_ids": [3753]}, {"id": 3809, "uid": "8f14e45fceea167a5a36dedd4bea2543", "name": "SuperInfer: SLO-Aware Rotary Scheduling and Memory Management for LLM Inference on Superchips", "authors": [{"id": 25942, "fullname": "Jiahuan Yu", "url": "http://mlsys.org/api/miniconf/users/25942?format=json", "institution": "University of Illinois Urbana-Champaign"}, {"id": 27649, "fullname": "Mingtao Hu", "url": "http://mlsys.org/api/miniconf/users/27649?format=json", "institution": "University of Illinois at Urbana-Champaign"}, {"id": 27650, "fullname": "Zichao Lin", "url": "http://mlsys.org/api/miniconf/users/27650?format=json", "institution": null}, {"id": 19015, "fullname": "Minjia Zhang", "url": "http://mlsys.org/api/miniconf/users/19015?format=json", "institution": "UIUC"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3809", "url": null, "sourceid": -7, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T15:00:00-07:00", "endtime": "2026-05-19T15:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3675?format=json", "parent_id": 3675, "eventmedia": [{"id": 1130, "modified": "2026-05-15T20:20:21.729124-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3809.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3586?format=json"], "related_events_ids": [3586]}, {"id": 3640, "uid": "d645920e395fedad7bbbed0eca3fe2e0", "name": "Hippocampus: An Efficient and Scalable Memory Module for Agentic AI", "authors": [{"id": 27978, "fullname": "Yi Li", "url": "http://mlsys.org/api/miniconf/users/27978?format=json", "institution": "University of Texas at Dallas"}, {"id": 12896, "fullname": "Lianjie Cao", "url": "http://mlsys.org/api/miniconf/users/12896?format=json", "institution": "HPE Labs"}, {"id": 15334, "fullname": "Faraz Ahmed", "url": "http://mlsys.org/api/miniconf/users/15334?format=json", "institution": "Hewlett Packard Labs"}, {"id": 14774, "fullname": "Puneet Sharma", "url": "http://mlsys.org/api/miniconf/users/14774?format=json", "institution": "HP Labs"}, {"id": 23337, "fullname": "Bingzhe Li", "url": "http://mlsys.org/api/miniconf/users/23337?format=json", "institution": "University of Texas at Dallas"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3640", "url": null, "sourceid": 40, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=0sUYZh9D4a", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 934, "modified": "2026-03-23T21:52:48.449896-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=0sUYZh9D4a", "resourcetype": "UriEventmedia"}, {"id": 962, "file": "/media/PosterPDFs/MLSys%202026/3640.png", "modified": "2026-05-04T19:19:08.611298-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 963, "file": "/media/PosterPDFs/MLSys%202026/3640-thumb.png", "modified": "2026-05-04T19:19:08.683924-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "15", "related_events": ["http://mlsys.org/api/miniconf/events/3863?format=json"], "related_events_ids": [3863]}, {"id": 3731, "uid": "17e62166fc8586dfa4d1bc0e1742c08b", "name": "CRAFT: Fine-Grained Cost-Aware Expert Replication For Efficient Mixture-of-Experts Serving", "authors": [{"id": 27141, "fullname": "Adrian Zhao", "url": "http://mlsys.org/api/miniconf/users/27141?format=json", "institution": "University of Toronto"}, {"id": 27170, "fullname": "Zhenkun Cai", "url": "http://mlsys.org/api/miniconf/users/27170?format=json", "institution": "Amazon"}, {"id": 27171, "fullname": "Zhenyu Song", "url": "http://mlsys.org/api/miniconf/users/27171?format=json", "institution": null}, {"id": 27172, "fullname": "Lingfan Yu", "url": "http://mlsys.org/api/miniconf/users/27172?format=json", "institution": "Amazon"}, {"id": 27173, "fullname": "Haozheng Fan", "url": "http://mlsys.org/api/miniconf/users/27173?format=json", "institution": "Amazon"}, {"id": 20941, "fullname": "Jun Wu", "url": "http://mlsys.org/api/miniconf/users/20941?format=json", "institution": "Amazon"}, {"id": 11990, "fullname": "Yida Wang", "url": "http://mlsys.org/api/miniconf/users/11990?format=json", "institution": "Amazon"}, {"id": 17626, "fullname": "Nandita Vijaykumar", "url": "http://mlsys.org/api/miniconf/users/17626?format=json", "institution": "Department of Computer Science, University of Toronto"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 4", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3731", "url": null, "sourceid": -43, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T16:30:00-07:00", "endtime": "2026-05-20T16:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3691?format=json", "parent_id": 3691, "eventmedia": [{"id": 1132, "modified": "2026-05-20T14:19:24.941409-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3731_3lg6KXh.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3508?format=json"], "related_events_ids": [3508]}, {"id": 3794, "uid": "5ef059938ba799aaa845e1c2e8a762bd", "name": "MAC-Attention: a Match--Amend--Complete scheme for fast and accurate attention computation", "authors": [{"id": 19233, "fullname": "Jinghan Yao", "url": "http://mlsys.org/api/miniconf/users/19233?format=json", "institution": "The Ohio State University"}, {"id": 21021, "fullname": "Sam Jacobs", "url": "http://mlsys.org/api/miniconf/users/21021?format=json", "institution": "Microsoft"}, {"id": 27604, "fullname": "Walid Krichene", "url": "http://mlsys.org/api/miniconf/users/27604?format=json", "institution": "Microsoft"}, {"id": 27605, "fullname": "Masahiro Tanaka", "url": "http://mlsys.org/api/miniconf/users/27605?format=json", "institution": "Anyscale"}, {"id": 20998, "fullname": "Dhabaleswar Panda", "url": "http://mlsys.org/api/miniconf/users/20998?format=json", "institution": "Ohio State University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 3", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3794", "url": "https://github.com/YJHMITWEB/MAC-Attention", "sourceid": -118, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T14:15:00-07:00", "endtime": "2026-05-20T14:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3687?format=json", "parent_id": 3687, "eventmedia": [{"id": 1062, "modified": "2026-05-20T13:14:10.286113-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3794_HiTCC0P.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3571?format=json"], "related_events_ids": [3571]}, {"id": 3583, "uid": "98f13708210194c475687be6106a3b84", "name": "AgenticCache: Cache-Driven Asynchronous Planning for Embodied AI Agents", "authors": [{"id": 25550, "fullname": "Hojoon Kim", "url": "http://mlsys.org/api/miniconf/users/25550?format=json", "institution": "Seoul National University"}, {"id": 27643, "fullname": "Yuheng Wu", "url": "http://mlsys.org/api/miniconf/users/27643?format=json", "institution": "Stanford University"}, {"id": 27644, "fullname": "Thierry Tambe", "url": "http://mlsys.org/api/miniconf/users/27644?format=json", "institution": "Stanford University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3583", "url": "https://github.com/hojoonleokim/MLSys26_AgenticCache", "sourceid": 20, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=UfABxFoSXH", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 877, "modified": "2026-03-23T21:52:46.202830-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=UfABxFoSXH", "resourcetype": "UriEventmedia"}, {"id": 995, "file": "/media/PosterPDFs/MLSys%202026/3583.png", "modified": "2026-05-12T21:37:32.515999-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 996, "file": "/media/PosterPDFs/MLSys%202026/3583-thumb.png", "modified": "2026-05-12T21:37:32.701093-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "18", "related_events": ["http://mlsys.org/api/miniconf/events/3806?format=json"], "related_events_ids": [3806]}, {"id": 3512, "uid": "2a38a4a9316c49e5a833517c45d31070", "name": "HipKittens: Fast and Furious AMD Kernels", "authors": [{"id": 27186, "fullname": "William Hu", "url": "http://mlsys.org/api/miniconf/users/27186?format=json", "institution": "Stanford University"}, {"id": 25851, "fullname": "Drew Wadsworth", "url": "http://mlsys.org/api/miniconf/users/25851?format=json", "institution": ""}, {"id": 27187, "fullname": "Sean Siddens", "url": "http://mlsys.org/api/miniconf/users/27187?format=json", "institution": "AMD"}, {"id": 27188, "fullname": "Stanley Winata", "url": "http://mlsys.org/api/miniconf/users/27188?format=json", "institution": null}, {"id": 27189, "fullname": "Daniel Fu", "url": "http://mlsys.org/api/miniconf/users/27189?format=json", "institution": "University of California, San Diego"}, {"id": 27190, "fullname": "Ryan Swann", "url": "http://mlsys.org/api/miniconf/users/27190?format=json", "institution": "AMD"}, {"id": 27191, "fullname": "Muhammad Osama", "url": "http://mlsys.org/api/miniconf/users/27191?format=json", "institution": "AMD"}, {"id": 11444, "fullname": "Christopher R\u00e9", "url": "http://mlsys.org/api/miniconf/users/11444?format=json", "institution": "Stanford University"}, {"id": 27192, "fullname": "Simran Arora", "url": "http://mlsys.org/api/miniconf/users/27192?format=json", "institution": "Computer Science Department, Stanford University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3512", "url": null, "sourceid": 88, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=xxSSrndQrI", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 806, "modified": "2026-03-23T21:52:43.387482-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=xxSSrndQrI", "resourcetype": "UriEventmedia"}, {"id": 1219, "file": "/media/PosterPDFs/MLSys%202026/3512-thumb.png", "modified": "2026-05-18T14:19:13.137038-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1218, "file": "/media/PosterPDFs/MLSys%202026/3512.png", "modified": "2026-05-18T21:26:25.426593-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "43", "related_events": ["http://mlsys.org/api/miniconf/events/3735?format=json"], "related_events_ids": [3735]}, {"id": 3521, "uid": "e4da3b7fbbce2345d7772b0674a318d5", "name": "TokenWeave: Efficient Compute-Communication Overlap for Distributed LLM Inference", "authors": [{"id": 19241, "fullname": "Raja Gond", "url": "http://mlsys.org/api/miniconf/users/19241?format=json", "institution": "Independent Researcher"}, {"id": 17734, "fullname": "Nipun Kwatra", "url": "http://mlsys.org/api/miniconf/users/17734?format=json", "institution": "Microsoft Research India"}, {"id": 16198, "fullname": "Ramachandran Ramjee", "url": "http://mlsys.org/api/miniconf/users/16198?format=json", "institution": "Microsoft Research"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3521", "url": "https://github.com/microsoft/tokenweave", "sourceid": 5, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=rh2Ylffkq6", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 815, "modified": "2026-03-23T21:52:43.699125-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=rh2Ylffkq6", "resourcetype": "UriEventmedia"}, {"id": 943, "file": "/media/PosterPDFs/MLSys%202026/3521-thumb.png", "modified": "2026-04-30T15:18:37.306561-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 979, "file": "/media/PosterPDFs/MLSys%202026/3521.png", "modified": "2026-05-09T03:27:37.154922-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1249, "modified": "2026-05-22T14:12:19.449220-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3521.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "22", "related_events": ["http://mlsys.org/api/miniconf/events/3744?format=json"], "related_events_ids": [3744]}, {"id": 3851, "uid": "1679091c5a880faf6fb5e6087eb1b2dc", "name": "GriNNder: Breaking the Memory Capacity Wall in Full-Graph GNN Training with Storage Offloading", "authors": [{"id": 27858, "fullname": "Jaeyong Song", "url": "http://mlsys.org/api/miniconf/users/27858?format=json", "institution": "Seoul National University"}, {"id": 27859, "fullname": "Seongyeon Park", "url": "http://mlsys.org/api/miniconf/users/27859?format=json", "institution": "Seoul National University"}, {"id": 27860, "fullname": "Hongsun Jang", "url": "http://mlsys.org/api/miniconf/users/27860?format=json", "institution": "Seoul National University"}, {"id": 27861, "fullname": "Jaewon Jung", "url": "http://mlsys.org/api/miniconf/users/27861?format=json", "institution": "Seoul National University"}, {"id": 26223, "fullname": "Hunseong Lim", "url": "http://mlsys.org/api/miniconf/users/26223?format=json", "institution": "Seoul National University"}, {"id": 27862, "fullname": "Junguk Hong", "url": "http://mlsys.org/api/miniconf/users/27862?format=json", "institution": "Seoul National University"}, {"id": 27863, "fullname": "Jinho Lee", "url": "http://mlsys.org/api/miniconf/users/27863?format=json", "institution": "Seoul National University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 3", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3851", "url": "https://github.com/AIS-SNU/GriNNder", "sourceid": -6, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T17:15:00-07:00", "endtime": "2026-05-20T17:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3695?format=json", "parent_id": 3695, "eventmedia": [{"id": 978, "modified": "2026-05-20T13:48:37.255036-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3851_xn3JSf6.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3628?format=json"], "related_events_ids": [3628]}, {"id": 3515, "uid": "70efdf2ec9b086079795c442636b55fb", "name": "Ontology-Guided Long-Term Agent Memory for Conversational RAG", "authors": [{"id": 27197, "fullname": "Sharon Cao", "url": "http://mlsys.org/api/miniconf/users/27197?format=json", "institution": "Hill Research"}, {"id": 27198, "fullname": "Rui Li", "url": "http://mlsys.org/api/miniconf/users/27198?format=json", "institution": "Hill Research"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3515", "url": null, "sourceid": 17, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=wpZHLPz4N0", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 809, "modified": "2026-03-23T21:52:43.477104-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=wpZHLPz4N0", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "23", "related_events": ["http://mlsys.org/api/miniconf/events/3738?format=json"], "related_events_ids": [3738]}, {"id": 3554, "uid": "ea5d2f1c4608232e07d3aa3d998e5135", "name": "Virtual Machine NUMA Placement at Scale: Learning the Norm, Shielding the Tail", "authors": [{"id": 26262, "fullname": "Yibo Zhao", "url": "http://mlsys.org/api/miniconf/users/26262?format=json", "institution": "Northeastern University"}, {"id": 27473, "fullname": "Tianyuan Wu", "url": "http://mlsys.org/api/miniconf/users/27473?format=json", "institution": "The Hong Kong University of Science and Technology"}, {"id": 27474, "fullname": "HUI XUE", "url": "http://mlsys.org/api/miniconf/users/27474?format=json", "institution": "Research, Microsoft"}, {"id": 27475, "fullname": "Qi Chen", "url": "http://mlsys.org/api/miniconf/users/27475?format=json", "institution": "Microsoft Research"}, {"id": 27476, "fullname": "Zhenhua Han", "url": "http://mlsys.org/api/miniconf/users/27476?format=json", "institution": "Microsoft"}, {"id": 27477, "fullname": "Zikai Xu", "url": "http://mlsys.org/api/miniconf/users/27477?format=json", "institution": null}, {"id": 27478, "fullname": "Yuntai Chang", "url": "http://mlsys.org/api/miniconf/users/27478?format=json", "institution": null}, {"id": 27479, "fullname": "Rui Gao", "url": "http://mlsys.org/api/miniconf/users/27479?format=json", "institution": null}, {"id": 27480, "fullname": "Steve Deng", "url": "http://mlsys.org/api/miniconf/users/27480?format=json", "institution": null}, {"id": 27481, "fullname": "Jui-Hao Chiang", "url": "http://mlsys.org/api/miniconf/users/27481?format=json", "institution": "Microsoft"}, {"id": 27482, "fullname": "Mingxia Li", "url": "http://mlsys.org/api/miniconf/users/27482?format=json", "institution": "Alibaba Group"}, {"id": 16293, "fullname": "Yuqing Yang", "url": "http://mlsys.org/api/miniconf/users/16293?format=json", "institution": "Microsoft Research"}, {"id": 16145, "fullname": "Cheng Tan", "url": "http://mlsys.org/api/miniconf/users/16145?format=json", "institution": "Northeastern"}, {"id": 27483, "fullname": "Fan Yang", "url": "http://mlsys.org/api/miniconf/users/27483?format=json", "institution": "Research, Microsoft"}, {"id": 15807, "fullname": "Peng Cheng", "url": "http://mlsys.org/api/miniconf/users/15807?format=json", "institution": "Microsoft Research"}, {"id": 27484, "fullname": "Yongqiang Xiong", "url": "http://mlsys.org/api/miniconf/users/27484?format=json", "institution": "Microsoft Research"}, {"id": 27469, "fullname": "Lili Qiu", "url": "http://mlsys.org/api/miniconf/users/27469?format=json", "institution": "Microsoft Research Asia"}, {"id": 26227, "fullname": "Lidong Zhou", "url": "http://mlsys.org/api/miniconf/users/26227?format=json", "institution": "Microsoft"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3554", "url": null, "sourceid": 64, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=guCUThRvX5", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 848, "modified": "2026-03-23T21:52:44.998424-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=guCUThRvX5", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "16", "related_events": ["http://mlsys.org/api/miniconf/events/3777?format=json"], "related_events_ids": [3777]}, {"id": 3628, "uid": "1679091c5a880faf6fb5e6087eb1b2dc", "name": "GriNNder: Breaking the Memory Capacity Wall in Full-Graph GNN Training with Storage Offloading", "authors": [{"id": 27858, "fullname": "Jaeyong Song", "url": "http://mlsys.org/api/miniconf/users/27858?format=json", "institution": "Seoul National University"}, {"id": 27859, "fullname": "Seongyeon Park", "url": "http://mlsys.org/api/miniconf/users/27859?format=json", "institution": "Seoul National University"}, {"id": 27860, "fullname": "Hongsun Jang", "url": "http://mlsys.org/api/miniconf/users/27860?format=json", "institution": "Seoul National University"}, {"id": 27861, "fullname": "Jaewon Jung", "url": "http://mlsys.org/api/miniconf/users/27861?format=json", "institution": "Seoul National University"}, {"id": 26223, "fullname": "Hunseong Lim", "url": "http://mlsys.org/api/miniconf/users/26223?format=json", "institution": "Seoul National University"}, {"id": 27862, "fullname": "Junguk Hong", "url": "http://mlsys.org/api/miniconf/users/27862?format=json", "institution": "Seoul National University"}, {"id": 27863, "fullname": "Jinho Lee", "url": "http://mlsys.org/api/miniconf/users/27863?format=json", "institution": "Seoul National University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3628", "url": "https://github.com/AIS-SNU/GriNNder", "sourceid": 6, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=8SNPzGRldN", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 922, "modified": "2026-03-23T21:52:47.956516-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=8SNPzGRldN", "resourcetype": "UriEventmedia"}, {"id": 975, "file": "/media/PosterPDFs/MLSys%202026/3628.png", "modified": "2026-05-08T17:55:01.109921-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 976, "file": "/media/PosterPDFs/MLSys%202026/3628-thumb.png", "modified": "2026-05-08T17:55:01.202861-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 977, "modified": "2026-05-20T13:49:00.679894-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3628_fwRBDdZ.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "39", "related_events": ["http://mlsys.org/api/miniconf/events/3851?format=json"], "related_events_ids": [3851]}, {"id": 3777, "uid": "ea5d2f1c4608232e07d3aa3d998e5135", "name": "Virtual Machine NUMA Placement at Scale: Learning the Norm, Shielding the Tail", "authors": [{"id": 26262, "fullname": "Yibo Zhao", "url": "http://mlsys.org/api/miniconf/users/26262?format=json", "institution": "Northeastern University"}, {"id": 27473, "fullname": "Tianyuan Wu", "url": "http://mlsys.org/api/miniconf/users/27473?format=json", "institution": "The Hong Kong University of Science and Technology"}, {"id": 27474, "fullname": "HUI XUE", "url": "http://mlsys.org/api/miniconf/users/27474?format=json", "institution": "Research, Microsoft"}, {"id": 27475, "fullname": "Qi Chen", "url": "http://mlsys.org/api/miniconf/users/27475?format=json", "institution": "Microsoft Research"}, {"id": 27476, "fullname": "Zhenhua Han", "url": "http://mlsys.org/api/miniconf/users/27476?format=json", "institution": "Microsoft"}, {"id": 27477, "fullname": "Zikai Xu", "url": "http://mlsys.org/api/miniconf/users/27477?format=json", "institution": null}, {"id": 27478, "fullname": "Yuntai Chang", "url": "http://mlsys.org/api/miniconf/users/27478?format=json", "institution": null}, {"id": 27479, "fullname": "Rui Gao", "url": "http://mlsys.org/api/miniconf/users/27479?format=json", "institution": null}, {"id": 27480, "fullname": "Steve Deng", "url": "http://mlsys.org/api/miniconf/users/27480?format=json", "institution": null}, {"id": 27481, "fullname": "Jui-Hao Chiang", "url": "http://mlsys.org/api/miniconf/users/27481?format=json", "institution": "Microsoft"}, {"id": 27482, "fullname": "Mingxia Li", "url": "http://mlsys.org/api/miniconf/users/27482?format=json", "institution": "Alibaba Group"}, {"id": 16293, "fullname": "Yuqing Yang", "url": "http://mlsys.org/api/miniconf/users/16293?format=json", "institution": "Microsoft Research"}, {"id": 16145, "fullname": "Cheng Tan", "url": "http://mlsys.org/api/miniconf/users/16145?format=json", "institution": "Northeastern"}, {"id": 27483, "fullname": "Fan Yang", "url": "http://mlsys.org/api/miniconf/users/27483?format=json", "institution": "Research, Microsoft"}, {"id": 15807, "fullname": "Peng Cheng", "url": "http://mlsys.org/api/miniconf/users/15807?format=json", "institution": "Microsoft Research"}, {"id": 27484, "fullname": "Yongqiang Xiong", "url": "http://mlsys.org/api/miniconf/users/27484?format=json", "institution": "Microsoft Research"}, {"id": 27469, "fullname": "Lili Qiu", "url": "http://mlsys.org/api/miniconf/users/27469?format=json", "institution": "Microsoft Research Asia"}, {"id": 26227, "fullname": "Lidong Zhou", "url": "http://mlsys.org/api/miniconf/users/26227?format=json", "institution": "Microsoft"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: ML for Systems", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3777", "url": null, "sourceid": -64, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T13:45:00-07:00", "endtime": "2026-05-20T14:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3688?format=json", "parent_id": 3688, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3554?format=json"], "related_events_ids": [3554]}, {"id": 3748, "uid": "a3f390d88e4c41f2747bfa2f1b5f87db", "name": "Automated Algorithm Design for Auto-Tuning Optimizers", "authors": [{"id": 27263, "fullname": "Floris-Jan Willemsen", "url": "http://mlsys.org/api/miniconf/users/27263?format=json", "institution": "Leiden University LIACS"}, {"id": 27264, "fullname": "Niki van Stein", "url": "http://mlsys.org/api/miniconf/users/27264?format=json", "institution": "LIACS, Leiden University"}, {"id": 27143, "fullname": "Ben van Werkhoven", "url": "http://mlsys.org/api/miniconf/users/27143?format=json", "institution": "Leiden University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: ML for Systems", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3748", "url": null, "sourceid": -68, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T14:45:00-07:00", "endtime": "2026-05-20T15:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3688?format=json", "parent_id": 3688, "eventmedia": [{"id": 1080, "modified": "2026-05-20T14:25:31.877940-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3748_4D9zX0g.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3525?format=json"], "related_events_ids": [3525]}, {"id": 3588, "uid": "d09bf41544a3365a46c9077ebb5e35c3", "name": "G-HEMP: FAST MULTI-GPU PRIVATE INFERENCE FOR LARGE-SCALE GCNS WITH HOMOMORPHIC ENCRYPTION", "authors": [{"id": 27655, "fullname": "Ran Ran", "url": "http://mlsys.org/api/miniconf/users/27655?format=json", "institution": "North Carolina State University"}, {"id": 27656, "fullname": "Zhaoting Gong", "url": "http://mlsys.org/api/miniconf/users/27656?format=json", "institution": "North Carolina State University"}, {"id": 27657, "fullname": "Zhaowei Li", "url": "http://mlsys.org/api/miniconf/users/27657?format=json", "institution": "North Carolina State University"}, {"id": 27658, "fullname": "Xianting Lu", "url": "http://mlsys.org/api/miniconf/users/27658?format=json", "institution": "North Carolina State University"}, {"id": 27659, "fullname": "Jiajia Li", "url": "http://mlsys.org/api/miniconf/users/27659?format=json", "institution": "North Carolina State University"}, {"id": 27660, "fullname": "Wujie Wen", "url": "http://mlsys.org/api/miniconf/users/27660?format=json", "institution": "North Carolina State University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3588", "url": null, "sourceid": 75, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=RSTrFSPIMy", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 882, "modified": "2026-03-23T21:52:46.377970-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=RSTrFSPIMy", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "26", "related_events": ["http://mlsys.org/api/miniconf/events/3811?format=json"], "related_events_ids": [3811]}, {"id": 3627, "uid": "3988c7f88ebcb58c6ce932b957b6f332", "name": "ProToken: Token-Level Attribution for Federated Large Language Models", "authors": [{"id": 27165, "fullname": "Waris Gill", "url": "http://mlsys.org/api/miniconf/users/27165?format=json", "institution": "Virginia Tech"}, {"id": 27856, "fullname": "Ahmad Humayun", "url": "http://mlsys.org/api/miniconf/users/27856?format=json", "institution": "Virginia Polytechnic Institute and State University"}, {"id": 20986, "fullname": "Ali Anwar", "url": "http://mlsys.org/api/miniconf/users/20986?format=json", "institution": "University of Minnesota"}, {"id": 27857, "fullname": "Muhammad Ali Gulzar", "url": "http://mlsys.org/api/miniconf/users/27857?format=json", "institution": "Virginia Tech"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3627", "url": null, "sourceid": 137, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=8WXUjbFr0Z", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 921, "modified": "2026-03-23T21:52:47.894190-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=8WXUjbFr0Z", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "27", "related_events": ["http://mlsys.org/api/miniconf/events/3850?format=json"], "related_events_ids": [3850]}, {"id": 3589, "uid": "6c8349cc7260ae62e3b1396831a8398f", "name": "CSLE: A Reinforcement Learning Platform for Autonomous Security Management", "authors": [{"id": 27661, "fullname": "Kim Hammar", "url": "http://mlsys.org/api/miniconf/users/27661?format=json", "institution": "University of Melbourne"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3589", "url": "https://kim-hammar.github.io/csle/", "sourceid": 45, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=QGuRWjFsnm", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 883, "modified": "2026-03-23T21:52:46.423159-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=QGuRWjFsnm", "resourcetype": "UriEventmedia"}, {"id": 946, "file": "/media/PosterPDFs/MLSys%202026/3589.png", "modified": "2026-04-29T21:24:27.052824-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 947, "file": "/media/PosterPDFs/MLSys%202026/3589-thumb.png", "modified": "2026-04-29T21:24:27.137280-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 972, "modified": "2026-05-06T21:20:02.629974-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3589.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "28", "related_events": ["http://mlsys.org/api/miniconf/events/3812?format=json"], "related_events_ids": [3812]}, {"id": 3767, "uid": "37693cfc748049e45d87b8c7d8b9aacd", "name": "NEST: Network- and Memory-Aware Device Placement for Distributed Deep Learning", "authors": [{"id": 26264, "fullname": "Irene Wang", "url": "http://mlsys.org/api/miniconf/users/26264?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27364, "fullname": "Vishnu Venkata", "url": "http://mlsys.org/api/miniconf/users/27364?format=json", "institution": null}, {"id": 11122, "fullname": "Arvind Krishnamurthy", "url": "http://mlsys.org/api/miniconf/users/11122?format=json", "institution": "University of Washington"}, {"id": 27358, "fullname": "Divya Mahajan", "url": "http://mlsys.org/api/miniconf/users/27358?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3767", "url": "https://github.com/scai-tech/Nest", "sourceid": -23, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T09:30:00-07:00", "endtime": "2026-05-20T09:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3679?format=json", "parent_id": 3679, "eventmedia": [{"id": 1064, "modified": "2026-05-19T19:51:14.288436-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3767_u5zq5Pz.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3544?format=json"], "related_events_ids": [3544]}, {"id": 3522, "uid": "c16a5320fa475530d9583c34fd356ef5", "name": "Scaling Up Large Language Models Serving Systems for Semantic Job Search", "authors": [{"id": 27235, "fullname": "Kayhan Behdin", "url": "http://mlsys.org/api/miniconf/users/27235?format=json", "institution": "LinkedIn"}, {"id": 19093, "fullname": "Qingquan Song", "url": "http://mlsys.org/api/miniconf/users/19093?format=json", "institution": null}, {"id": 25809, "fullname": "Sriram Vasudevan", "url": "http://mlsys.org/api/miniconf/users/25809?format=json", "institution": "LinkedIn Corporation"}, {"id": 27236, "fullname": "Jian Sheng", "url": "http://mlsys.org/api/miniconf/users/27236?format=json", "institution": "LinkedIn"}, {"id": 27237, "fullname": "Xiaojing Ma", "url": "http://mlsys.org/api/miniconf/users/27237?format=json", "institution": "LinkedIn"}, {"id": 27238, "fullname": "Zhengze Zhou", "url": "http://mlsys.org/api/miniconf/users/27238?format=json", "institution": "LinkedIn"}, {"id": 26224, "fullname": "Chuanrui Zhu", "url": "http://mlsys.org/api/miniconf/users/26224?format=json", "institution": "LinkedIn"}, {"id": 27239, "fullname": "Guoyao Li", "url": "http://mlsys.org/api/miniconf/users/27239?format=json", "institution": "xAI"}, {"id": 19228, "fullname": "Chanh Nguyen", "url": "http://mlsys.org/api/miniconf/users/19228?format=json", "institution": "LinkedIn"}, {"id": 27240, "fullname": "Sayan Ghosh", "url": "http://mlsys.org/api/miniconf/users/27240?format=json", "institution": null}, {"id": 27241, "fullname": "Hejian Sang", "url": "http://mlsys.org/api/miniconf/users/27241?format=json", "institution": "LinkedIn"}, {"id": 24223, "fullname": "Ata Fatahi", "url": "http://mlsys.org/api/miniconf/users/24223?format=json", "institution": "LinkedIn Inc"}, {"id": 27242, "fullname": "Sundara Ramachandran", "url": "http://mlsys.org/api/miniconf/users/27242?format=json", "institution": null}, {"id": 27243, "fullname": "Xiaoqing Wang", "url": "http://mlsys.org/api/miniconf/users/27243?format=json", "institution": "LinkedIn"}, {"id": 26222, "fullname": "Qing Lan", "url": "http://mlsys.org/api/miniconf/users/26222?format=json", "institution": "LinkedIn"}, {"id": 27244, "fullname": "Vinay S", "url": "http://mlsys.org/api/miniconf/users/27244?format=json", "institution": null}, {"id": 27245, "fullname": "Qi Guo", "url": "http://mlsys.org/api/miniconf/users/27245?format=json", "institution": "LinkedIn"}, {"id": 27246, "fullname": "Caleb Johnson", "url": "http://mlsys.org/api/miniconf/users/27246?format=json", "institution": "University of Illinois at Urbana-Champaign"}, {"id": 17756, "fullname": "Zhipeng Wang", "url": "http://mlsys.org/api/miniconf/users/17756?format=json", "institution": "LinkedIn Corporation"}, {"id": 27247, "fullname": "Fedor Borisyuk", "url": "http://mlsys.org/api/miniconf/users/27247?format=json", "institution": null}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3522", "url": null, "sourceid": 31, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=re82zZczHj", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 816, "modified": "2026-03-23T21:52:43.728713-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=re82zZczHj", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "21", "related_events": ["http://mlsys.org/api/miniconf/events/3745?format=json"], "related_events_ids": [3745]}, {"id": 3855, "uid": "35f4a8d465e6e1edc05f3d8ab658c551", "name": "VeriMoA: A Mixture-of-Agents Framework for Spec-to-HDL Generation", "authors": [{"id": 27902, "fullname": "Heng Ping", "url": "http://mlsys.org/api/miniconf/users/27902?format=json", "institution": "University of Southern California"}, {"id": 27903, "fullname": "Arijit Bhattacharjee", "url": "http://mlsys.org/api/miniconf/users/27903?format=json", "institution": "Iowa State University"}, {"id": 27904, "fullname": "Peiyu Zhang", "url": "http://mlsys.org/api/miniconf/users/27904?format=json", "institution": "University of Southern California"}, {"id": 27905, "fullname": "Shixuan Li", "url": "http://mlsys.org/api/miniconf/users/27905?format=json", "institution": "University of Southern California"}, {"id": 27906, "fullname": "Wei Yang", "url": "http://mlsys.org/api/miniconf/users/27906?format=json", "institution": "University of Southern California"}, {"id": 27907, "fullname": "Anzhe Cheng", "url": "http://mlsys.org/api/miniconf/users/27907?format=json", "institution": "University of Southern California"}, {"id": 27908, "fullname": "Xiaole Zhang", "url": "http://mlsys.org/api/miniconf/users/27908?format=json", "institution": "University of Southern California"}, {"id": 27909, "fullname": "Jesse Thomason", "url": "http://mlsys.org/api/miniconf/users/27909?format=json", "institution": "University of Southern California"}, {"id": 15789, "fullname": "Ali Jannesari", "url": "http://mlsys.org/api/miniconf/users/15789?format=json", "institution": "Iowa State University"}, {"id": 27910, "fullname": "Nesreen Ahmed", "url": "http://mlsys.org/api/miniconf/users/27910?format=json", "institution": "Cisco"}, {"id": 11952, "fullname": "Paul Bogdan", "url": "http://mlsys.org/api/miniconf/users/11952?format=json", "institution": "USC"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Agentic AI 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3855", "url": null, "sourceid": -78, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T13:15:00-07:00", "endtime": "2026-05-19T13:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3668?format=json", "parent_id": 3668, "eventmedia": [{"id": 1221, "modified": "2026-05-19T00:49:57.374039-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3855_j54FoJa.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3632?format=json"], "related_events_ids": [3632]}, {"id": 3526, "uid": "5fd0b37cd7dbbb00f97ba6ce92bf5add", "name": "The OpenHands Software Agent SDK: A Composable and Extensible Foundation for Production Agents", "authors": [{"id": 27265, "fullname": "Xingyao Wang", "url": "http://mlsys.org/api/miniconf/users/27265?format=json", "institution": "All Hands AI"}, {"id": 28441, "fullname": "Simon Rosenberg", "url": "http://mlsys.org/api/miniconf/users/28441?format=json", "institution": "C3 AI"}, {"id": 27267, "fullname": "Juan Michelini", "url": "http://mlsys.org/api/miniconf/users/27267?format=json", "institution": "Universidad de la Rep\u00fablica"}, {"id": 27268, "fullname": "Calvin Smith", "url": "http://mlsys.org/api/miniconf/users/27268?format=json", "institution": "OpenHands"}, {"id": 28442, "fullname": "Hoang Tran", "url": "http://mlsys.org/api/miniconf/users/28442?format=json", "institution": "VinUniversity"}, {"id": 27270, "fullname": "Engel Nyst", "url": "http://mlsys.org/api/miniconf/users/27270?format=json", "institution": null}, {"id": 28443, "fullname": "Rohit Malhotra", "url": "http://mlsys.org/api/miniconf/users/28443?format=json", "institution": "Carnegie Mellon University"}, {"id": 28444, "fullname": "Xuhui Zhou", "url": "http://mlsys.org/api/miniconf/users/28444?format=json", "institution": "CMU, Carnegie Mellon University"}, {"id": 28445, "fullname": "Valerie Chen", "url": "http://mlsys.org/api/miniconf/users/28445?format=json", "institution": "Carnegie Mellon University"}, {"id": 28446, "fullname": "Robert Brennan", "url": "http://mlsys.org/api/miniconf/users/28446?format=json", "institution": "All Hands AI"}, {"id": 28447, "fullname": "Graham Neubig", "url": "http://mlsys.org/api/miniconf/users/28447?format=json", "institution": "Carnegie Mellon University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3526", "url": null, "sourceid": 114, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=pzVmWs6yGq", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 820, "modified": "2026-03-23T21:52:43.861434-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=pzVmWs6yGq", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "9", "related_events": ["http://mlsys.org/api/miniconf/events/3749?format=json"], "related_events_ids": [3749]}, {"id": 3749, "uid": "5fd0b37cd7dbbb00f97ba6ce92bf5add", "name": "The OpenHands Software Agent SDK: A Composable and Extensible Foundation for Production Agents", "authors": [{"id": 27265, "fullname": "Xingyao Wang", "url": "http://mlsys.org/api/miniconf/users/27265?format=json", "institution": "All Hands AI"}, {"id": 28441, "fullname": "Simon Rosenberg", "url": "http://mlsys.org/api/miniconf/users/28441?format=json", "institution": "C3 AI"}, {"id": 27267, "fullname": "Juan Michelini", "url": "http://mlsys.org/api/miniconf/users/27267?format=json", "institution": "Universidad de la Rep\u00fablica"}, {"id": 27268, "fullname": "Calvin Smith", "url": "http://mlsys.org/api/miniconf/users/27268?format=json", "institution": "OpenHands"}, {"id": 28442, "fullname": "Hoang Tran", "url": "http://mlsys.org/api/miniconf/users/28442?format=json", "institution": "VinUniversity"}, {"id": 27270, "fullname": "Engel Nyst", "url": "http://mlsys.org/api/miniconf/users/27270?format=json", "institution": null}, {"id": 28443, "fullname": "Rohit Malhotra", "url": "http://mlsys.org/api/miniconf/users/28443?format=json", "institution": "Carnegie Mellon University"}, {"id": 28444, "fullname": "Xuhui Zhou", "url": "http://mlsys.org/api/miniconf/users/28444?format=json", "institution": "CMU, Carnegie Mellon University"}, {"id": 28445, "fullname": "Valerie Chen", "url": "http://mlsys.org/api/miniconf/users/28445?format=json", "institution": "Carnegie Mellon University"}, {"id": 28446, "fullname": "Robert Brennan", "url": "http://mlsys.org/api/miniconf/users/28446?format=json", "institution": "All Hands AI"}, {"id": 28447, "fullname": "Graham Neubig", "url": "http://mlsys.org/api/miniconf/users/28447?format=json", "institution": "Carnegie Mellon University"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Agentic AI/MLSys", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3749", "url": null, "sourceid": -114, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T09:30:00-07:00", "endtime": "2026-05-21T09:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3700?format=json", "parent_id": 3700, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3526?format=json"], "related_events_ids": [3526]}, {"id": 3527, "uid": "ec8956637a99787bd197eacd77acce5e", "name": "StreamDiffusionV2: A Streaming System for Dynamic and Interactive Video Generation", "authors": [{"id": 27276, "fullname": "Tianrui Feng", "url": "http://mlsys.org/api/miniconf/users/27276?format=json", "institution": "The University of Texas at Austin"}, {"id": 27277, "fullname": "Zhi Li", "url": "http://mlsys.org/api/miniconf/users/27277?format=json", "institution": "University of California, Berkeley"}, {"id": 27278, "fullname": "Shuo Yang", "url": "http://mlsys.org/api/miniconf/users/27278?format=json", "institution": "University of California, Berkeley"}, {"id": 27279, "fullname": "Haocheng Xi", "url": "http://mlsys.org/api/miniconf/users/27279?format=json", "institution": "University of California, Berkeley"}, {"id": 27280, "fullname": "Muyang Li", "url": "http://mlsys.org/api/miniconf/users/27280?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 24423, "fullname": "Xiuyu Li", "url": "http://mlsys.org/api/miniconf/users/24423?format=json", "institution": "UC Berkeley"}, {"id": 27281, "fullname": "Lvmin Zhang", "url": "http://mlsys.org/api/miniconf/users/27281?format=json", "institution": null}, {"id": 27282, "fullname": "Keting Yang", "url": "http://mlsys.org/api/miniconf/users/27282?format=json", "institution": "Google"}, {"id": 27283, "fullname": "Kelly Peng", "url": "http://mlsys.org/api/miniconf/users/27283?format=json", "institution": "Stanford University"}, {"id": 12133, "fullname": "Song Han", "url": "http://mlsys.org/api/miniconf/users/12133?format=json", "institution": "MIT"}, {"id": 27284, "fullname": "Maneesh Agrawala", "url": "http://mlsys.org/api/miniconf/users/27284?format=json", "institution": "Stanford University"}, {"id": 11240, "fullname": "Kurt Keutzer", "url": "http://mlsys.org/api/miniconf/users/11240?format=json", "institution": "EECS, UC Berkeley"}, {"id": 27285, "fullname": "Akio Kodaira", "url": "http://mlsys.org/api/miniconf/users/27285?format=json", "institution": "Shizuku AI"}, {"id": 24298, "fullname": "Chenfeng Xu", "url": "http://mlsys.org/api/miniconf/users/24298?format=json", "institution": "Together AI/UT Austin"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3527", "url": null, "sourceid": 102, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=p9WALNBvc6", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 821, "modified": "2026-03-23T21:52:43.907988-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=p9WALNBvc6", "resourcetype": "UriEventmedia"}, {"id": 958, "file": "/media/PosterPDFs/MLSys%202026/3527-thumb.png", "modified": "2026-05-15T11:11:45.393959-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 957, "file": "/media/PosterPDFs/MLSys%202026/3527.png", "modified": "2026-05-15T11:06:15.133439-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "1", "related_events": ["http://mlsys.org/api/miniconf/events/3750?format=json"], "related_events_ids": [3750]}, {"id": 3750, "uid": "ec8956637a99787bd197eacd77acce5e", "name": "StreamDiffusionV2: A Streaming System for Dynamic and Interactive Video Generation", "authors": [{"id": 27276, "fullname": "Tianrui Feng", "url": "http://mlsys.org/api/miniconf/users/27276?format=json", "institution": "The University of Texas at Austin"}, {"id": 27277, "fullname": "Zhi Li", "url": "http://mlsys.org/api/miniconf/users/27277?format=json", "institution": "University of California, Berkeley"}, {"id": 27278, "fullname": "Shuo Yang", "url": "http://mlsys.org/api/miniconf/users/27278?format=json", "institution": "University of California, Berkeley"}, {"id": 27279, "fullname": "Haocheng Xi", "url": "http://mlsys.org/api/miniconf/users/27279?format=json", "institution": "University of California, Berkeley"}, {"id": 27280, "fullname": "Muyang Li", "url": "http://mlsys.org/api/miniconf/users/27280?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 24423, "fullname": "Xiuyu Li", "url": "http://mlsys.org/api/miniconf/users/24423?format=json", "institution": "UC Berkeley"}, {"id": 27281, "fullname": "Lvmin Zhang", "url": "http://mlsys.org/api/miniconf/users/27281?format=json", "institution": null}, {"id": 27282, "fullname": "Keting Yang", "url": "http://mlsys.org/api/miniconf/users/27282?format=json", "institution": "Google"}, {"id": 27283, "fullname": "Kelly Peng", "url": "http://mlsys.org/api/miniconf/users/27283?format=json", "institution": "Stanford University"}, {"id": 12133, "fullname": "Song Han", "url": "http://mlsys.org/api/miniconf/users/12133?format=json", "institution": "MIT"}, {"id": 27284, "fullname": "Maneesh Agrawala", "url": "http://mlsys.org/api/miniconf/users/27284?format=json", "institution": "Stanford University"}, {"id": 11240, "fullname": "Kurt Keutzer", "url": "http://mlsys.org/api/miniconf/users/11240?format=json", "institution": "EECS, UC Berkeley"}, {"id": 27285, "fullname": "Akio Kodaira", "url": "http://mlsys.org/api/miniconf/users/27285?format=json", "institution": "Shizuku AI"}, {"id": 24298, "fullname": "Chenfeng Xu", "url": "http://mlsys.org/api/miniconf/users/24298?format=json", "institution": "Together AI/UT Austin"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Best Paper Session", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3750", "url": null, "sourceid": -102, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T08:45:00-07:00", "endtime": "2026-05-19T09:05:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3659?format=json", "parent_id": 3659, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3527?format=json"], "related_events_ids": [3527]}, {"id": 3760, "uid": "b6d767d2f8ed5d21a44b0e5886680cb9", "name": "FlashAgents: Accelerating Multi-Agent LLM Systems via Streaming Prefill Overlap", "authors": [{"id": 25922, "fullname": "Taosong Fang", "url": "http://mlsys.org/api/miniconf/users/25922?format=json", "institution": "Institute of Software Chinese Academy of Sciences"}, {"id": 28440, "fullname": "Zhen Zheng", "url": "http://mlsys.org/api/miniconf/users/28440?format=json", "institution": "ByteDance Inc."}, {"id": 27342, "fullname": "Zhengzhao Ma", "url": "http://mlsys.org/api/miniconf/users/27342?format=json", "institution": "University of the Chinese Academy of Sciences"}, {"id": 25829, "fullname": "Yaojie Lu", "url": "http://mlsys.org/api/miniconf/users/25829?format=json", "institution": null}, {"id": 27343, "fullname": "Hongyu Lin", "url": "http://mlsys.org/api/miniconf/users/27343?format=json", "institution": "Institute of Software, Chinese Academy of Sciences"}, {"id": 27344, "fullname": "Xianpei Han", "url": "http://mlsys.org/api/miniconf/users/27344?format=json", "institution": "Institute of Software, CAS"}, {"id": 27345, "fullname": "Le Sun", "url": "http://mlsys.org/api/miniconf/users/27345?format=json", "institution": "Institute of Software, Chinese Academy of Sciences"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Agentic AI 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3760", "url": null, "sourceid": -22, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T15:30:00-07:00", "endtime": "2026-05-19T15:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3674?format=json", "parent_id": 3674, "eventmedia": [{"id": 1175, "modified": "2026-05-18T21:56:08.888655-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3760_dJT5ZOY.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3537?format=json"], "related_events_ids": [3537]}, {"id": 3834, "uid": "7647966b7343c29048673252e490f736", "name": "SHIP: SRAM-Based Huge Inference Pipelines for Fast LLM Serving", "authors": [{"id": 28469, "fullname": "Andrew Bitar", "url": "http://mlsys.org/api/miniconf/users/28469?format=json", "institution": "NVIDIA"}, {"id": 28499, "fullname": "Aravind Vayalapra", "url": "http://mlsys.org/api/miniconf/users/28499?format=json", "institution": null}, {"id": 28500, "fullname": "Baorui Zhou", "url": "http://mlsys.org/api/miniconf/users/28500?format=json", "institution": "Nvidia"}, {"id": 28501, "fullname": "Matthew Boyd", "url": "http://mlsys.org/api/miniconf/users/28501?format=json", "institution": "NVIDIA"}, {"id": 28502, "fullname": "Charlie Wang", "url": "http://mlsys.org/api/miniconf/users/28502?format=json", "institution": "Nvidia"}, {"id": 28503, "fullname": "Sahil Parmar", "url": "http://mlsys.org/api/miniconf/users/28503?format=json", "institution": null}, {"id": 28470, "fullname": "Eugene Sha", "url": "http://mlsys.org/api/miniconf/users/28470?format=json", "institution": "NVIDIA"}, {"id": 28504, "fullname": "Gautam Rayaprolu", "url": "http://mlsys.org/api/miniconf/users/28504?format=json", "institution": null}, {"id": 28505, "fullname": "Peter Hicks", "url": "http://mlsys.org/api/miniconf/users/28505?format=json", "institution": null}, {"id": 28506, "fullname": "Alex Bowe", "url": "http://mlsys.org/api/miniconf/users/28506?format=json", "institution": "NVIDIA"}, {"id": 28507, "fullname": "Roberto DiCecco", "url": "http://mlsys.org/api/miniconf/users/28507?format=json", "institution": null}, {"id": 28508, "fullname": "Santosh Raghavan", "url": "http://mlsys.org/api/miniconf/users/28508?format=json", "institution": "NVIDIA"}, {"id": 28509, "fullname": "Evan Patrick", "url": "http://mlsys.org/api/miniconf/users/28509?format=json", "institution": null}, {"id": 28510, "fullname": "Josip Smolcic", "url": "http://mlsys.org/api/miniconf/users/28510?format=json", "institution": null}, {"id": 28511, "fullname": "David Han", "url": "http://mlsys.org/api/miniconf/users/28511?format=json", "institution": null}, {"id": 28512, "fullname": "Kris Kang", "url": "http://mlsys.org/api/miniconf/users/28512?format=json", "institution": "Nvidia"}, {"id": 28513, "fullname": "Andy Rock", "url": "http://mlsys.org/api/miniconf/users/28513?format=json", "institution": null}, {"id": 28514, "fullname": "Josh Hay", "url": "http://mlsys.org/api/miniconf/users/28514?format=json", "institution": null}, {"id": 28515, "fullname": "Mohamed Eldafrawy", "url": "http://mlsys.org/api/miniconf/users/28515?format=json", "institution": "Nvidia"}, {"id": 28516, "fullname": "Mikhail Kandel", "url": "http://mlsys.org/api/miniconf/users/28516?format=json", "institution": null}, {"id": 28517, "fullname": "Daulet Zhanguzin", "url": "http://mlsys.org/api/miniconf/users/28517?format=json", "institution": null}, {"id": 28518, "fullname": "Omar Kilani", "url": "http://mlsys.org/api/miniconf/users/28518?format=json", "institution": null}, {"id": 28519, "fullname": "Liming Gong", "url": "http://mlsys.org/api/miniconf/users/28519?format=json", "institution": null}, {"id": 28520, "fullname": "Andrew Paprotskyi", "url": "http://mlsys.org/api/miniconf/users/28520?format=json", "institution": ""}, {"id": 28521, "fullname": "Arash Taheri-Dezfouli", "url": "http://mlsys.org/api/miniconf/users/28521?format=json", "institution": "Nvidia"}, {"id": 28522, "fullname": "Josh Fender", "url": "http://mlsys.org/api/miniconf/users/28522?format=json", "institution": null}, {"id": 28471, "fullname": "Andrew Ling", "url": "http://mlsys.org/api/miniconf/users/28471?format=json", "institution": "University of Toronto"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: LLM Serving 6", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3834", "url": null, "sourceid": -89, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T13:00:00-07:00", "endtime": "2026-05-21T13:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3709?format=json", "parent_id": 3709, "eventmedia": [{"id": 1224, "modified": "2026-05-20T14:32:18.045328-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3834_VmkjzHq.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3611?format=json"], "related_events_ids": [3611]}, {"id": 3590, "uid": "d2ddea18f00665ce8623e36bd4e3c7c5", "name": "PLayer-FL: A Principled Approach to Personalized Layer-wise Cross-Silo Federated Learning", "authors": [{"id": 27662, "fullname": "Ahmed Elhussein", "url": "http://mlsys.org/api/miniconf/users/27662?format=json", "institution": "Columbia University"}, {"id": 25923, "fullname": "Florent Pollet", "url": "http://mlsys.org/api/miniconf/users/25923?format=json", "institution": "Columbia University"}, {"id": 28492, "fullname": "Gamze Gursoy", "url": "http://mlsys.org/api/miniconf/users/28492?format=json", "institution": "University of Cambridge"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3590", "url": "https://github.com/G2Lab/PLayer-FL", "sourceid": 73, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=QBUy1HdKrZ", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 884, "modified": "2026-03-23T21:52:46.459439-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=QBUy1HdKrZ", "resourcetype": "UriEventmedia"}, {"id": 992, "file": "/media/PosterPDFs/MLSys%202026/3590.png", "modified": "2026-05-12T19:48:42.705617-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 993, "file": "/media/PosterPDFs/MLSys%202026/3590-thumb.png", "modified": "2026-05-12T19:48:42.829949-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 994, "modified": "2026-05-12T19:56:51.521808-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3590.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "33", "related_events": ["http://mlsys.org/api/miniconf/events/3813?format=json"], "related_events_ids": [3813]}, {"id": 3528, "uid": "67c6a1e7ce56d3d6fa748ab6d9af3fd7", "name": "TiDAR: Think in Diffusion, Talk in Autoregression", "authors": [{"id": 27286, "fullname": "Jingyu Liu", "url": "http://mlsys.org/api/miniconf/users/27286?format=json", "institution": "University of Chicago"}, {"id": 27287, "fullname": "Xin Dong", "url": "http://mlsys.org/api/miniconf/users/27287?format=json", "institution": "Seed"}, {"id": 27288, "fullname": "Zhifan Ye", "url": "http://mlsys.org/api/miniconf/users/27288?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27289, "fullname": "Rishabh Mehta", "url": "http://mlsys.org/api/miniconf/users/27289?format=json", "institution": null}, {"id": 27290, "fullname": "Yonggan Fu", "url": "http://mlsys.org/api/miniconf/users/27290?format=json", "institution": "NVIDIA"}, {"id": 27291, "fullname": "vartika singh", "url": "http://mlsys.org/api/miniconf/users/27291?format=json", "institution": "State University of New York, Buffalo"}, {"id": 18868, "fullname": "Ce Zhang", "url": "http://mlsys.org/api/miniconf/users/18868?format=json", "institution": null}, {"id": 27292, "fullname": "Pavlo Molchanov", "url": "http://mlsys.org/api/miniconf/users/27292?format=json", "institution": "NVIDIA Research"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3528", "url": null, "sourceid": 47, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=onfxEjoE4L", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 822, "modified": "2026-03-23T21:52:43.945409-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=onfxEjoE4L", "resourcetype": "UriEventmedia"}, {"id": 1222, "file": "/media/PosterPDFs/MLSys%202026/3528.png", "modified": "2026-05-18T22:23:57.514230-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "14", "related_events": ["http://mlsys.org/api/miniconf/events/3751?format=json"], "related_events_ids": [3751]}, {"id": 3580, "uid": "da4fb5c6e93e74d3df8527599fa62642", "name": "Zero redundancy distributed learning with differential privacy", "authors": [{"id": 27633, "fullname": "Zhiqi Bu", "url": "http://mlsys.org/api/miniconf/users/27633?format=json", "institution": "FAIR MSL"}, {"id": 27634, "fullname": "Justin Chiu", "url": "http://mlsys.org/api/miniconf/users/27634?format=json", "institution": "University of Washington"}, {"id": 27635, "fullname": "Ruixuan Liu", "url": "http://mlsys.org/api/miniconf/users/27635?format=json", "institution": "Emory University"}, {"id": 27636, "fullname": "Sheng Zha", "url": "http://mlsys.org/api/miniconf/users/27636?format=json", "institution": "Amazon"}, {"id": 27637, "fullname": "George Karypis", "url": "http://mlsys.org/api/miniconf/users/27637?format=json", "institution": "University of Minnesota, Minneapolis"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3580", "url": null, "sourceid": 120, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=VGacNNZfgo", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 874, "modified": "2026-03-23T21:52:46.076093-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=VGacNNZfgo", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "35", "related_events": ["http://mlsys.org/api/miniconf/events/3803?format=json"], "related_events_ids": [3803]}, {"id": 3537, "uid": "b6d767d2f8ed5d21a44b0e5886680cb9", "name": "FlashAgents: Accelerating Multi-Agent LLM Systems via Streaming Prefill Overlap", "authors": [{"id": 25922, "fullname": "Taosong Fang", "url": "http://mlsys.org/api/miniconf/users/25922?format=json", "institution": "Institute of Software Chinese Academy of Sciences"}, {"id": 28440, "fullname": "Zhen Zheng", "url": "http://mlsys.org/api/miniconf/users/28440?format=json", "institution": "ByteDance Inc."}, {"id": 27342, "fullname": "Zhengzhao Ma", "url": "http://mlsys.org/api/miniconf/users/27342?format=json", "institution": "University of the Chinese Academy of Sciences"}, {"id": 25829, "fullname": "Yaojie Lu", "url": "http://mlsys.org/api/miniconf/users/25829?format=json", "institution": null}, {"id": 27343, "fullname": "Hongyu Lin", "url": "http://mlsys.org/api/miniconf/users/27343?format=json", "institution": "Institute of Software, Chinese Academy of Sciences"}, {"id": 27344, "fullname": "Xianpei Han", "url": "http://mlsys.org/api/miniconf/users/27344?format=json", "institution": "Institute of Software, CAS"}, {"id": 27345, "fullname": "Le Sun", "url": "http://mlsys.org/api/miniconf/users/27345?format=json", "institution": "Institute of Software, Chinese Academy of Sciences"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3537", "url": null, "sourceid": 22, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=m14PPUfgEc", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 831, "modified": "2026-03-23T21:52:44.294163-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=m14PPUfgEc", "resourcetype": "UriEventmedia"}, {"id": 1171, "file": "/media/PosterPDFs/MLSys%202026/3537.png", "modified": "2026-05-17T07:51:55.765005-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1172, "file": "/media/PosterPDFs/MLSys%202026/3537-thumb.png", "modified": "2026-05-17T07:51:55.866421-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1176, "modified": "2026-05-18T21:56:46.667817-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3537_WMw6BYe.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "21", "related_events": ["http://mlsys.org/api/miniconf/events/3760?format=json"], "related_events_ids": [3760]}, {"id": 3840, "uid": "eccbc87e4b5ce2fe28308fd9f2a7baf3", "name": "FLoRIST: Singular Value Thresholding for Efficient and Accurate Federated Fine-Tuning of Large Language Models", "authors": [{"id": 27825, "fullname": "Hariharan Ramesh", "url": "http://mlsys.org/api/miniconf/users/27825?format=json", "institution": "University of Arizona"}, {"id": 23907, "fullname": "Jyotikrishna Dass", "url": "http://mlsys.org/api/miniconf/users/23907?format=json", "institution": "University of Arizona"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Federated Learning", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3840", "url": null, "sourceid": -3, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T17:00:00-07:00", "endtime": "2026-05-19T17:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3672?format=json", "parent_id": 3672, "eventmedia": [{"id": 1143, "modified": "2026-05-20T14:42:01.022017-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3840_BwPF7aI.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3617?format=json"], "related_events_ids": [3617]}, {"id": 3531, "uid": "93db85ed909c13838ff95ccfa94cebd9", "name": "Efficient Long-Context Language Model Training by Core Attention Disaggregation", "authors": [{"id": 28964, "fullname": "Yonghao Zhuang", "url": "http://mlsys.org/api/miniconf/users/28964?format=json", "institution": "CMU, Carnegie Mellon University"}, {"id": 17900, "fullname": "Junda Chen", "url": "http://mlsys.org/api/miniconf/users/17900?format=json", "institution": "University of California San Diego"}, {"id": 27317, "fullname": "Bo Pang", "url": "http://mlsys.org/api/miniconf/users/27317?format=json", "institution": null}, {"id": 27318, "fullname": "Yi Gu", "url": "http://mlsys.org/api/miniconf/users/27318?format=json", "institution": "University of California, San Diego"}, {"id": 27319, "fullname": "Yibo Zhu", "url": "http://mlsys.org/api/miniconf/users/27319?format=json", "institution": "StepFun"}, {"id": 27320, "fullname": "Yimin Jiang", "url": "http://mlsys.org/api/miniconf/users/27320?format=json", "institution": "Anuttacon"}, {"id": 11118, "fullname": "Ion Stoica", "url": "http://mlsys.org/api/miniconf/users/11118?format=json", "institution": "UC Berkeley"}, {"id": 27321, "fullname": "Hao Zhang", "url": "http://mlsys.org/api/miniconf/users/27321?format=json", "institution": "University of California, San Diego"}, {"id": 16300, "fullname": "Eric Xing", "url": "http://mlsys.org/api/miniconf/users/16300?format=json", "institution": "MBZUAI, CMU, and Petuum Inc."}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3531", "url": "https://github.com/hao-ai-lab/DistCA", "sourceid": 86, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=oIonqkc8hM", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 825, "modified": "2026-03-23T21:52:44.055719-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=oIonqkc8hM", "resourcetype": "UriEventmedia"}, {"id": 1048, "modified": "2026-05-14T14:00:54.802540-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3531.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "12", "related_events": ["http://mlsys.org/api/miniconf/events/3754?format=json"], "related_events_ids": [3754]}, {"id": 3617, "uid": "eccbc87e4b5ce2fe28308fd9f2a7baf3", "name": "FLoRIST: Singular Value Thresholding for Efficient and Accurate Federated Fine-Tuning of Large Language Models", "authors": [{"id": 27825, "fullname": "Hariharan Ramesh", "url": "http://mlsys.org/api/miniconf/users/27825?format=json", "institution": "University of Arizona"}, {"id": 23907, "fullname": "Jyotikrishna Dass", "url": "http://mlsys.org/api/miniconf/users/23907?format=json", "institution": "University of Arizona"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3617", "url": null, "sourceid": 3, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=GTZRs756YJ", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 911, "modified": "2026-03-23T21:52:47.495721-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=GTZRs756YJ", "resourcetype": "UriEventmedia"}, {"id": 1138, "file": "/media/PosterPDFs/MLSys%202026/3617.png", "modified": "2026-05-20T14:45:18.604078-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1139, "file": "/media/PosterPDFs/MLSys%202026/3617-thumb.png", "modified": "2026-05-20T14:47:24.685008-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "29", "related_events": ["http://mlsys.org/api/miniconf/events/3840?format=json"], "related_events_ids": [3840]}, {"id": 3742, "uid": "34173cb38f07f89ddbebc2ac9128303f", "name": "MLCommons Chakra: Advancing Performance Benchmarking and Co-design using Standardized Execution Traces", "authors": [{"id": 27214, "fullname": "Srinivas", "url": "http://mlsys.org/api/miniconf/users/27214?format=json", "institution": "NVIDIA"}, {"id": 27225, "fullname": "Andrey Balogh", "url": "http://mlsys.org/api/miniconf/users/27225?format=json", "institution": ""}, {"id": 27227, "fullname": "Brad B", "url": "http://mlsys.org/api/miniconf/users/27227?format=json", "institution": ""}, {"id": 27216, "fullname": "Brian Coutinho", "url": "http://mlsys.org/api/miniconf/users/27216?format=json", "institution": null}, {"id": 20878, "fullname": "Louis Feng", "url": "http://mlsys.org/api/miniconf/users/20878?format=json", "institution": "University of California, Davis"}, {"id": 27217, "fullname": "Sheng Fu", "url": "http://mlsys.org/api/miniconf/users/27217?format=json", "institution": null}, {"id": 27218, "fullname": "Sanshan Gao", "url": "http://mlsys.org/api/miniconf/users/27218?format=json", "institution": null}, {"id": 27231, "fullname": "Mehryar Garakani", "url": "http://mlsys.org/api/miniconf/users/27231?format=json", "institution": null}, {"id": 27215, "fullname": "Taekyung Heo", "url": "http://mlsys.org/api/miniconf/users/27215?format=json", "institution": null}, {"id": 14827, "fullname": "David Kanter", "url": "http://mlsys.org/api/miniconf/users/14827?format=json", "institution": "MLCommons"}, {"id": 27220, "fullname": "Josh Ladd", "url": "http://mlsys.org/api/miniconf/users/27220?format=json", "institution": null}, {"id": 27224, "fullname": "Ziwei Li", "url": "http://mlsys.org/api/miniconf/users/27224?format=json", "institution": null}, {"id": 28956, "fullname": "Winston Liu", "url": "http://mlsys.org/api/miniconf/users/28956?format=json", "institution": "Keysight Technologies"}, {"id": 16517, "fullname": "Changhai Man", "url": "http://mlsys.org/api/miniconf/users/16517?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27226, "fullname": "Dan Mihailescu", "url": "http://mlsys.org/api/miniconf/users/27226?format=json", "institution": "Keysight Technologies"}, {"id": 27228, "fullname": "Spandan More", "url": "http://mlsys.org/api/miniconf/users/27228?format=json", "institution": "AMD"}, {"id": 27221, "fullname": "Joongun Park", "url": "http://mlsys.org/api/miniconf/users/27221?format=json", "institution": null}, {"id": 27230, "fullname": "Ashwin Ramachandran", "url": "http://mlsys.org/api/miniconf/users/27230?format=json", "institution": ""}, {"id": 26285, "fullname": "Vinay Ramakrishnaiah", "url": "http://mlsys.org/api/miniconf/users/26285?format=json", "institution": "AMD"}, {"id": 27229, "fullname": "Saeed Rashidi", "url": "http://mlsys.org/api/miniconf/users/27229?format=json", "institution": "Meta"}, {"id": 10754, "fullname": "Vijay Janapa Reddi", "url": "http://mlsys.org/api/miniconf/users/10754?format=json", "institution": "Harvard University"}, {"id": 14774, "fullname": "Puneet Sharma", "url": "http://mlsys.org/api/miniconf/users/14774?format=json", "institution": "HP Labs"}, {"id": 27219, "fullname": "Phio Tian", "url": "http://mlsys.org/api/miniconf/users/27219?format=json", "institution": null}, {"id": 14298, "fullname": "William Won", "url": "http://mlsys.org/api/miniconf/users/14298?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27142, "fullname": "Hanjiang Wu", "url": "http://mlsys.org/api/miniconf/users/27142?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27223, "fullname": "Huan Xu", "url": "http://mlsys.org/api/miniconf/users/27223?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27222, "fullname": "Jinsun Yoo", "url": "http://mlsys.org/api/miniconf/users/27222?format=json", "institution": "Georgia Institute of Technology"}, {"id": 11662, "fullname": "Tushar Krishna", "url": "http://mlsys.org/api/miniconf/users/11662?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Benchmarks and Evaluation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3742", "url": null, "sourceid": -30, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T17:15:00-07:00", "endtime": "2026-05-21T17:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3717?format=json", "parent_id": 3717, "eventmedia": [{"id": 1168, "modified": "2026-05-20T15:51:06.343857-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3742_UFSQJ36.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3519?format=json"], "related_events_ids": [3519]}, {"id": 3577, "uid": "a3c65c2974270fd093ee8a9bf8ae7d0b", "name": "ProTrain: Efficient LLM Training via Automatic Memory Management", "authors": [{"id": 27620, "fullname": "Hanmei Yang", "url": "http://mlsys.org/api/miniconf/users/27620?format=json", "institution": "UMass Amherst"}, {"id": 28465, "fullname": "Jin Zhou", "url": "http://mlsys.org/api/miniconf/users/28465?format=json", "institution": "University of Massachusetts at Amherst"}, {"id": 27622, "fullname": "Yao Fu", "url": "http://mlsys.org/api/miniconf/users/27622?format=json", "institution": "Advanced Micro Devices"}, {"id": 28466, "fullname": "Xiaoqun Wang", "url": "http://mlsys.org/api/miniconf/users/28466?format=json", "institution": "Advanced Micro Devices"}, {"id": 27624, "fullname": "Ramine Roane", "url": "http://mlsys.org/api/miniconf/users/27624?format=json", "institution": "Advanced Micro Devices"}, {"id": 11878, "fullname": "Hui Guan", "url": "http://mlsys.org/api/miniconf/users/11878?format=json", "institution": "University of Massachusetts, Amherst; Amazon"}, {"id": 27625, "fullname": "Tongping Liu", "url": "http://mlsys.org/api/miniconf/users/27625?format=json", "institution": "XPeng Motors"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3577", "url": null, "sourceid": 108, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=XDkOn0iTiH", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 871, "modified": "2026-03-23T21:52:45.964855-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=XDkOn0iTiH", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "5", "related_events": ["http://mlsys.org/api/miniconf/events/3800?format=json"], "related_events_ids": [3800]}, {"id": 3572, "uid": "d9d4f495e875a2e075a1a4a6e1b9770f", "name": "BOute: Cost-Efficient LLM Serving with Heterogeneous LLMs and GPUs via Multi-Objective Bayesian Optimization", "authors": [{"id": 21099, "fullname": "YOUHE JIANG", "url": "http://mlsys.org/api/miniconf/users/21099?format=json", "institution": "University of Cambridge"}, {"id": 27606, "fullname": "Fangcheng Fu", "url": "http://mlsys.org/api/miniconf/users/27606?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 10630, "fullname": "Eiko Yoneki", "url": "http://mlsys.org/api/miniconf/users/10630?format=json", "institution": "University of Cambridge"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3572", "url": null, "sourceid": 46, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=ZVQb92umqX", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 866, "modified": "2026-03-23T21:52:45.770781-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=ZVQb92umqX", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "6", "related_events": ["http://mlsys.org/api/miniconf/events/3795?format=json"], "related_events_ids": [3795]}, {"id": 3605, "uid": "9a1158154dfa42caddbd0694a4e9bdc8", "name": "HexiScale: Facilitating Large Language Model Training over Heterogeneous Hardware", "authors": [{"id": 25937, "fullname": "Ran Yan", "url": "http://mlsys.org/api/miniconf/users/25937?format=json", "institution": "The Hong Kong University of Science and Technology"}, {"id": 21099, "fullname": "YOUHE JIANG", "url": "http://mlsys.org/api/miniconf/users/21099?format=json", "institution": "University of Cambridge"}, {"id": 27733, "fullname": "Xiaonan Nie", "url": "http://mlsys.org/api/miniconf/users/27733?format=json", "institution": "ByteDance Seed"}, {"id": 27606, "fullname": "Fangcheng Fu", "url": "http://mlsys.org/api/miniconf/users/27606?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 21049, "fullname": "Bin CUI", "url": "http://mlsys.org/api/miniconf/users/21049?format=json", "institution": "Peking University"}, {"id": 26259, "fullname": "Binhang Yuan", "url": "http://mlsys.org/api/miniconf/users/26259?format=json", "institution": "HKUST"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3605", "url": null, "sourceid": 52, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=KgcqSNio0U", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 899, "modified": "2026-03-23T21:52:47.001246-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=KgcqSNio0U", "resourcetype": "UriEventmedia"}, {"id": 1068, "file": "/media/PosterPDFs/MLSys%202026/3605.png", "modified": "2026-05-15T21:03:18.492764-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1069, "file": "/media/PosterPDFs/MLSys%202026/3605-thumb.png", "modified": "2026-05-15T21:03:18.577950-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "41", "related_events": ["http://mlsys.org/api/miniconf/events/3828?format=json"], "related_events_ids": [3828]}, {"id": 3532, "uid": "14bfa6bb14875e45bba028a21ed38046", "name": "SpecDiff-2: Scaling Diffusion Drafter Alignment For Faster Speculative Decoding", "authors": [{"id": 27322, "fullname": "Jameson Sandler", "url": "http://mlsys.org/api/miniconf/users/27322?format=json", "institution": "University of Virginia"}, {"id": 27323, "fullname": "Jacob K Christopher", "url": "http://mlsys.org/api/miniconf/users/27323?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27324, "fullname": "Tom Hartvigsen", "url": "http://mlsys.org/api/miniconf/users/27324?format=json", "institution": null}, {"id": 27325, "fullname": "Ferdinando Fioretto", "url": "http://mlsys.org/api/miniconf/users/27325?format=json", "institution": "University of Virginia"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3532", "url": null, "sourceid": 69, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=o42VU86ZsV", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 826, "modified": "2026-03-23T21:52:44.093141-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=o42VU86ZsV", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "8", "related_events": ["http://mlsys.org/api/miniconf/events/3755?format=json"], "related_events_ids": [3755]}, {"id": 3785, "uid": "7cbbc409ec990f19c78c75bd1e06f215", "name": "CDLM: Consistency Diffusion Language Models for Faster Sampling", "authors": [{"id": 25522, "fullname": "Minseo Kim", "url": "http://mlsys.org/api/miniconf/users/25522?format=json", "institution": "Seoul National University"}, {"id": 24298, "fullname": "Chenfeng Xu", "url": "http://mlsys.org/api/miniconf/users/24298?format=json", "institution": "Together AI/UT Austin"}, {"id": 17672, "fullname": "Coleman Hooper", "url": "http://mlsys.org/api/miniconf/users/17672?format=json", "institution": "University of California, Berkeley"}, {"id": 27566, "fullname": "Harman Singh", "url": "http://mlsys.org/api/miniconf/users/27566?format=json", "institution": "University of California, Berkeley"}, {"id": 18231, "fullname": "Ben Athiwaratkun", "url": "http://mlsys.org/api/miniconf/users/18231?format=json", "institution": null}, {"id": 18868, "fullname": "Ce Zhang", "url": "http://mlsys.org/api/miniconf/users/18868?format=json", "institution": null}, {"id": 11240, "fullname": "Kurt Keutzer", "url": "http://mlsys.org/api/miniconf/users/11240?format=json", "institution": "EECS, UC Berkeley"}, {"id": 11237, "fullname": "Amir Gholami", "url": "http://mlsys.org/api/miniconf/users/11237?format=json", "institution": "UC Berkeley"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 5", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3785", "url": null, "sourceid": -70, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T08:45:00-07:00", "endtime": "2026-05-21T09:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3701?format=json", "parent_id": 3701, "eventmedia": [{"id": 1022, "modified": "2026-05-18T22:24:09.932282-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3785_4lDloP6.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3562?format=json"], "related_events_ids": [3562]}, {"id": 3763, "uid": "b53b3a3d6ab90ce0268229151c9bde11", "name": "Flashlight: PyTorch Compiler Extensions to Accelerate Attention Variants", "authors": [{"id": 27353, "fullname": "Bozhi You", "url": "http://mlsys.org/api/miniconf/users/27353?format=json", "institution": ""}, {"id": 26264, "fullname": "Irene Wang", "url": "http://mlsys.org/api/miniconf/users/26264?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27354, "fullname": "Zelal Mustafaoglu", "url": "http://mlsys.org/api/miniconf/users/27354?format=json", "institution": null}, {"id": 27355, "fullname": "Abhinav Jangda", "url": "http://mlsys.org/api/miniconf/users/27355?format=json", "institution": "Microsoft"}, {"id": 27356, "fullname": "Ang\u00e9lica Moreira", "url": "http://mlsys.org/api/miniconf/users/27356?format=json", "institution": "Research, Microsoft"}, {"id": 27357, "fullname": "Roshan Dathathri", "url": "http://mlsys.org/api/miniconf/users/27357?format=json", "institution": "Microsoft Research"}, {"id": 27358, "fullname": "Divya Mahajan", "url": "http://mlsys.org/api/miniconf/users/27358?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27359, "fullname": "Keshav Pingali", "url": "http://mlsys.org/api/miniconf/users/27359?format=json", "institution": ", University of Texas, Austin"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Efficient Computation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3763", "url": "https://github.com/bozhiyou/flashlight/tree/mlsys26-ae", "sourceid": -55, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-22T08:45:00-07:00", "endtime": "2026-05-22T09:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3722?format=json", "parent_id": 3722, "eventmedia": [{"id": 1141, "modified": "2026-05-20T16:28:27.118354-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3763_pOXWfhT.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3540?format=json"], "related_events_ids": [3540]}, {"id": 3573, "uid": "a1d0c6e83f027327d8461063f4ac58a6", "name": "TeleRAG: Efficient Retrieval-Augmented Generation Inference with Lookahead Retrieval", "authors": [{"id": 27607, "fullname": "Chien-Yu Lin", "url": "http://mlsys.org/api/miniconf/users/27607?format=json", "institution": "Meta"}, {"id": 26295, "fullname": "Keisuke Kamahori", "url": "http://mlsys.org/api/miniconf/users/26295?format=json", "institution": "University of Washington"}, {"id": 27608, "fullname": "Yiyu Liu", "url": "http://mlsys.org/api/miniconf/users/27608?format=json", "institution": "Harvard University"}, {"id": 27609, "fullname": "Xiaoxiang Shi", "url": "http://mlsys.org/api/miniconf/users/27609?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 27610, "fullname": "Madhav Kashyap", "url": "http://mlsys.org/api/miniconf/users/27610?format=json", "institution": "University of Washington"}, {"id": 27416, "fullname": "Yile Gu", "url": "http://mlsys.org/api/miniconf/users/27416?format=json", "institution": "Department of Computer Science, University of Washington"}, {"id": 27611, "fullname": "Rulin Shao", "url": "http://mlsys.org/api/miniconf/users/27611?format=json", "institution": "University of Washington"}, {"id": 12026, "fullname": "Zihao Ye", "url": "http://mlsys.org/api/miniconf/users/12026?format=json", "institution": "NVIDIA"}, {"id": 17683, "fullname": "Kan Zhu", "url": "http://mlsys.org/api/miniconf/users/17683?format=json", "institution": "University of Washington"}, {"id": 27612, "fullname": "Rohan Kadekodi", "url": "http://mlsys.org/api/miniconf/users/27612?format=json", "institution": "University of Washington"}, {"id": 17972, "fullname": "Stephanie Wang", "url": "http://mlsys.org/api/miniconf/users/17972?format=json", "institution": "UW &amp; Anyscale"}, {"id": 11122, "fullname": "Arvind Krishnamurthy", "url": "http://mlsys.org/api/miniconf/users/11122?format=json", "institution": "University of Washington"}, {"id": 11020, "fullname": "Luis Ceze", "url": "http://mlsys.org/api/miniconf/users/11020?format=json", "institution": "University of Washington and NVIDIA"}, {"id": 17670, "fullname": "Baris Kasikci", "url": "http://mlsys.org/api/miniconf/users/17670?format=json", "institution": "University of Washington"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3573", "url": null, "sourceid": 42, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=YsOyCpMUYD", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 867, "modified": "2026-03-23T21:52:45.805417-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=YsOyCpMUYD", "resourcetype": "UriEventmedia"}, {"id": 1055, "file": "/media/PosterPDFs/MLSys%202026/3573.png", "modified": "2026-05-14T19:14:33.926341-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1056, "file": "/media/PosterPDFs/MLSys%202026/3573-thumb.png", "modified": "2026-05-14T19:14:33.998784-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "19", "related_events": ["http://mlsys.org/api/miniconf/events/3796?format=json"], "related_events_ids": [3796]}, {"id": 3533, "uid": "6974ce5ac660610b44d9b9fed0ff9548", "name": "TriInfer: Hybrid EPD Disaggregation for Efficient Multimodal Large Language Model Inference", "authors": [{"id": 27326, "fullname": "Xianzhe Dong", "url": "http://mlsys.org/api/miniconf/users/27326?format=json", "institution": "University of Science and Technology of China"}, {"id": 27327, "fullname": "Tongxuan Liu", "url": "http://mlsys.org/api/miniconf/users/27327?format=json", "institution": "JD.com"}, {"id": 27328, "fullname": "Yuting Zeng", "url": "http://mlsys.org/api/miniconf/users/27328?format=json", "institution": "University of Science and Technology of China"}, {"id": 27144, "fullname": "Weizhe Huang", "url": "http://mlsys.org/api/miniconf/users/27144?format=json", "institution": "University of Science and Technology of China"}, {"id": 25671, "fullname": "Xiaoyang Zhao", "url": "http://mlsys.org/api/miniconf/users/25671?format=json", "institution": null}, {"id": 27329, "fullname": "Siyu Wu", "url": "http://mlsys.org/api/miniconf/users/27329?format=json", "institution": "Beihang University"}, {"id": 27330, "fullname": "Liangyu Liu", "url": "http://mlsys.org/api/miniconf/users/27330?format=json", "institution": null}, {"id": 27331, "fullname": "Liu Yang", "url": "http://mlsys.org/api/miniconf/users/27331?format=json", "institution": ""}, {"id": 26165, "fullname": "Yu Wu", "url": "http://mlsys.org/api/miniconf/users/26165?format=json", "institution": "University of Science and Technology of China"}, {"id": 27332, "fullname": "Hailong Yang", "url": "http://mlsys.org/api/miniconf/users/27332?format=json", "institution": null}, {"id": 27333, "fullname": "Ke Zhang", "url": "http://mlsys.org/api/miniconf/users/27333?format=json", "institution": null}, {"id": 27334, "fullname": "Jing Li", "url": "http://mlsys.org/api/miniconf/users/27334?format=json", "institution": "University of Science and Technology of China"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3533", "url": null, "sourceid": 103, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=nNovi8fvGN", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 827, "modified": "2026-03-23T21:52:44.125266-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=nNovi8fvGN", "resourcetype": "UriEventmedia"}, {"id": 952, "file": "/media/PosterPDFs/MLSys%202026/3533.png", "modified": "2026-04-26T04:49:04.769910-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 953, "file": "/media/PosterPDFs/MLSys%202026/3533-thumb.png", "modified": "2026-04-26T04:49:04.863903-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "12", "related_events": ["http://mlsys.org/api/miniconf/events/3756?format=json"], "related_events_ids": [3756]}, {"id": 3770, "uid": "3ef815416f775098fe977004015c6193", "name": "Search Your Block Floating Point Scales!", "authors": [{"id": 27410, "fullname": "Tanmaey Gupta", "url": "http://mlsys.org/api/miniconf/users/27410?format=json", "institution": "Cornell University"}, {"id": 27411, "fullname": "Hayden Prairie", "url": "http://mlsys.org/api/miniconf/users/27411?format=json", "institution": "University of California, San Diego                    Together AI"}, {"id": 23865, "fullname": "Xiaoxia Wu", "url": "http://mlsys.org/api/miniconf/users/23865?format=json", "institution": "TogtherAI"}, {"id": 27412, "fullname": "Reyna Abhyankar", "url": "http://mlsys.org/api/miniconf/users/27412?format=json", "institution": "Together AI"}, {"id": 25635, "fullname": "Qingyang Wu", "url": "http://mlsys.org/api/miniconf/users/25635?format=json", "institution": "Together AI"}, {"id": 24490, "fullname": "Austin Silveria", "url": "http://mlsys.org/api/miniconf/users/24490?format=json", "institution": "University of California, San Diego"}, {"id": 27413, "fullname": "Pragaash Ponnusamy", "url": "http://mlsys.org/api/miniconf/users/27413?format=json", "institution": "Together AI"}, {"id": 27251, "fullname": "Jue Wang", "url": "http://mlsys.org/api/miniconf/users/27251?format=json", "institution": "Together AI"}, {"id": 18231, "fullname": "Ben Athiwaratkun", "url": "http://mlsys.org/api/miniconf/users/18231?format=json", "institution": null}, {"id": 14753, "fullname": "Shuaiwen Song", "url": "http://mlsys.org/api/miniconf/users/14753?format=json", "institution": "University of Sydney"}, {"id": 27414, "fullname": "Tri Dao", "url": "http://mlsys.org/api/miniconf/users/27414?format=json", "institution": "Princeton, TogetherAI"}, {"id": 27189, "fullname": "Daniel Fu", "url": "http://mlsys.org/api/miniconf/users/27189?format=json", "institution": "University of California, San Diego"}, {"id": 11289, "fullname": "Christopher De Sa", "url": "http://mlsys.org/api/miniconf/users/11289?format=json", "institution": "Cornell University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Model Compression", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3770", "url": null, "sourceid": -85, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T18:00:00-07:00", "endtime": "2026-05-20T18:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3696?format=json", "parent_id": 3696, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3547?format=json"], "related_events_ids": [3547]}, {"id": 3756, "uid": "6974ce5ac660610b44d9b9fed0ff9548", "name": "TriInfer: Hybrid EPD Disaggregation for Efficient Multimodal Large Language Model Inference", "authors": [{"id": 27326, "fullname": "Xianzhe Dong", "url": "http://mlsys.org/api/miniconf/users/27326?format=json", "institution": "University of Science and Technology of China"}, {"id": 27327, "fullname": "Tongxuan Liu", "url": "http://mlsys.org/api/miniconf/users/27327?format=json", "institution": "JD.com"}, {"id": 27328, "fullname": "Yuting Zeng", "url": "http://mlsys.org/api/miniconf/users/27328?format=json", "institution": "University of Science and Technology of China"}, {"id": 27144, "fullname": "Weizhe Huang", "url": "http://mlsys.org/api/miniconf/users/27144?format=json", "institution": "University of Science and Technology of China"}, {"id": 25671, "fullname": "Xiaoyang Zhao", "url": "http://mlsys.org/api/miniconf/users/25671?format=json", "institution": null}, {"id": 27329, "fullname": "Siyu Wu", "url": "http://mlsys.org/api/miniconf/users/27329?format=json", "institution": "Beihang University"}, {"id": 27330, "fullname": "Liangyu Liu", "url": "http://mlsys.org/api/miniconf/users/27330?format=json", "institution": null}, {"id": 27331, "fullname": "Liu Yang", "url": "http://mlsys.org/api/miniconf/users/27331?format=json", "institution": ""}, {"id": 26165, "fullname": "Yu Wu", "url": "http://mlsys.org/api/miniconf/users/26165?format=json", "institution": "University of Science and Technology of China"}, {"id": 27332, "fullname": "Hailong Yang", "url": "http://mlsys.org/api/miniconf/users/27332?format=json", "institution": null}, {"id": 27333, "fullname": "Ke Zhang", "url": "http://mlsys.org/api/miniconf/users/27333?format=json", "institution": null}, {"id": 27334, "fullname": "Jing Li", "url": "http://mlsys.org/api/miniconf/users/27334?format=json", "institution": "University of Science and Technology of China"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Multimodal and Generative Models", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3756", "url": null, "sourceid": -103, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T13:45:00-07:00", "endtime": "2026-05-19T14:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3669?format=json", "parent_id": 3669, "eventmedia": [{"id": 981, "modified": "2026-05-10T08:36:13.622313-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3756.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3533?format=json"], "related_events_ids": [3533]}, {"id": 3828, "uid": "9a1158154dfa42caddbd0694a4e9bdc8", "name": "HexiScale: Facilitating Large Language Model Training over Heterogeneous Hardware", "authors": [{"id": 25937, "fullname": "Ran Yan", "url": "http://mlsys.org/api/miniconf/users/25937?format=json", "institution": "The Hong Kong University of Science and Technology"}, {"id": 21099, "fullname": "YOUHE JIANG", "url": "http://mlsys.org/api/miniconf/users/21099?format=json", "institution": "University of Cambridge"}, {"id": 27733, "fullname": "Xiaonan Nie", "url": "http://mlsys.org/api/miniconf/users/27733?format=json", "institution": "ByteDance Seed"}, {"id": 27606, "fullname": "Fangcheng Fu", "url": "http://mlsys.org/api/miniconf/users/27606?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 21049, "fullname": "Bin CUI", "url": "http://mlsys.org/api/miniconf/users/21049?format=json", "institution": "Peking University"}, {"id": 26259, "fullname": "Binhang Yuan", "url": "http://mlsys.org/api/miniconf/users/26259?format=json", "institution": "HKUST"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 3", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3828", "url": null, "sourceid": -52, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T17:30:00-07:00", "endtime": "2026-05-20T17:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3695?format=json", "parent_id": 3695, "eventmedia": [{"id": 1070, "modified": "2026-05-15T21:08:11.933789-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3828_GyjCel6.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3605?format=json"], "related_events_ids": [3605]}, {"id": 3786, "uid": "093f65e080a295f8076b1c5722a46aa2", "name": "LEANN: A Low-Storage Overhead Vector Index", "authors": [{"id": 27567, "fullname": "Yichuan Wang", "url": "http://mlsys.org/api/miniconf/users/27567?format=json", "institution": "University of California, Berkeley"}, {"id": 27568, "fullname": "Zhifei Li", "url": "http://mlsys.org/api/miniconf/users/27568?format=json", "institution": "UC Berkeley, University of California, Berkeley"}, {"id": 21025, "fullname": "Shu Liu", "url": "http://mlsys.org/api/miniconf/users/21025?format=json", "institution": "University of California, Berkeley"}, {"id": 17645, "fullname": "Yongji Wu", "url": "http://mlsys.org/api/miniconf/users/17645?format=json", "institution": "Duke University"}, {"id": 27569, "fullname": "Ziming Mao", "url": "http://mlsys.org/api/miniconf/users/27569?format=json", "institution": "University of California, Berkeley"}, {"id": 20906, "fullname": "Yilong Zhao", "url": "http://mlsys.org/api/miniconf/users/20906?format=json", "institution": "University of California, Berkeley"}, {"id": 27570, "fullname": "Xiao Yan", "url": "http://mlsys.org/api/miniconf/users/27570?format=json", "institution": "Wuhan University"}, {"id": 20979, "fullname": "Zhiying Xu", "url": "http://mlsys.org/api/miniconf/users/20979?format=json", "institution": "Amazon"}, {"id": 19070, "fullname": "Yang Zhou", "url": "http://mlsys.org/api/miniconf/users/19070?format=json", "institution": "UC Davis"}, {"id": 11118, "fullname": "Ion Stoica", "url": "http://mlsys.org/api/miniconf/users/11118?format=json", "institution": "UC Berkeley"}, {"id": 27571, "fullname": "Sewon Min", "url": "http://mlsys.org/api/miniconf/users/27571?format=json", "institution": "University of California, Berkeley"}, {"id": 21014, "fullname": "Matei Zaharia", "url": "http://mlsys.org/api/miniconf/users/21014?format=json", "institution": "University of California, Berkeley"}, {"id": 11239, "fullname": "Joseph Gonzalez", "url": "http://mlsys.org/api/miniconf/users/11239?format=json", "institution": "UC Berkeley"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Best Paper Session", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3786", "url": "https://github.com/yichuan-w/LEANN", "sourceid": -59, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T09:05:00-07:00", "endtime": "2026-05-19T09:25:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3659?format=json", "parent_id": 3659, "eventmedia": [{"id": 1155, "modified": "2026-05-19T00:12:08.308782-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3786_vlIWXsd.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3563?format=json"], "related_events_ids": [3563]}, {"id": 3540, "uid": "b53b3a3d6ab90ce0268229151c9bde11", "name": "Flashlight: PyTorch Compiler Extensions to Accelerate Attention Variants", "authors": [{"id": 27353, "fullname": "Bozhi You", "url": "http://mlsys.org/api/miniconf/users/27353?format=json", "institution": ""}, {"id": 26264, "fullname": "Irene Wang", "url": "http://mlsys.org/api/miniconf/users/26264?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27354, "fullname": "Zelal Mustafaoglu", "url": "http://mlsys.org/api/miniconf/users/27354?format=json", "institution": null}, {"id": 27355, "fullname": "Abhinav Jangda", "url": "http://mlsys.org/api/miniconf/users/27355?format=json", "institution": "Microsoft"}, {"id": 27356, "fullname": "Ang\u00e9lica Moreira", "url": "http://mlsys.org/api/miniconf/users/27356?format=json", "institution": "Research, Microsoft"}, {"id": 27357, "fullname": "Roshan Dathathri", "url": "http://mlsys.org/api/miniconf/users/27357?format=json", "institution": "Microsoft Research"}, {"id": 27358, "fullname": "Divya Mahajan", "url": "http://mlsys.org/api/miniconf/users/27358?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27359, "fullname": "Keshav Pingali", "url": "http://mlsys.org/api/miniconf/users/27359?format=json", "institution": ", University of Texas, Austin"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3540", "url": "https://github.com/bozhiyou/flashlight/tree/mlsys26-ae", "sourceid": 55, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=lboOMA8XWr", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 834, "modified": "2026-03-23T21:52:44.426020-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=lboOMA8XWr", "resourcetype": "UriEventmedia"}, {"id": 1241, "file": "/media/PosterPDFs/MLSys%202026/3540.png", "modified": "2026-05-20T17:27:13.950658-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1242, "file": "/media/PosterPDFs/MLSys%202026/3540-thumb.png", "modified": "2026-05-20T17:27:14.044369-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1243, "modified": "2026-05-20T17:29:17.714474-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3540.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "50", "related_events": ["http://mlsys.org/api/miniconf/events/3763?format=json"], "related_events_ids": [3763]}, {"id": 3814, "uid": "aab3238922bcc25a6f606eb525ffdc56", "name": "Rethinking DVFS for Mobile LLMs: Unified Energy-Aware Scheduling with CORE", "authors": [{"id": 27664, "fullname": "Zongpu Zhang", "url": "http://mlsys.org/api/miniconf/users/27664?format=json", "institution": "Purdue University"}, {"id": 27665, "fullname": "Pranab Dash", "url": "http://mlsys.org/api/miniconf/users/27665?format=json", "institution": null}, {"id": 27667, "fullname": "Qiang Xu", "url": "http://mlsys.org/api/miniconf/users/27667?format=json", "institution": "Purdue University"}, {"id": 27666, "fullname": "Y. Charlie Hu", "url": "http://mlsys.org/api/miniconf/users/27666?format=json", "institution": "Purdue University"}, {"id": 27668, "fullname": "Jian Li", "url": "http://mlsys.org/api/miniconf/users/27668?format=json", "institution": "Shanghai Jiao Tong University"}, {"id": 27669, "fullname": "Haibing Guan", "url": "http://mlsys.org/api/miniconf/users/27669?format=json", "institution": "Shanghai Jiao Tong University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Efficient ML", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3814", "url": null, "sourceid": -14, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T13:45:00-07:00", "endtime": "2026-05-21T14:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3710?format=json", "parent_id": 3710, "eventmedia": [{"id": 1124, "modified": "2026-05-20T19:39:02.338030-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3814_0uuYG7Z.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3591?format=json"], "related_events_ids": [3591]}, {"id": 3615, "uid": "76dc611d6ebaafc66cc0879c71b5db5c", "name": "FlexiCache: Leveraging Temporal Stability of Attention Heads for Efficient KV Cache Management", "authors": [{"id": 26134, "fullname": "Nazmul Takbir", "url": "http://mlsys.org/api/miniconf/users/26134?format=json", "institution": "University of California Irvine"}, {"id": 27819, "fullname": "Hamidreza Alikhani Koshkak", "url": "http://mlsys.org/api/miniconf/users/27819?format=json", "institution": "University of California, Irvine"}, {"id": 27820, "fullname": "Nikil Dutt", "url": "http://mlsys.org/api/miniconf/users/27820?format=json", "institution": "University of California, Irvine"}, {"id": 11050, "fullname": "Sangeetha Abdu Jyothi", "url": "http://mlsys.org/api/miniconf/users/11050?format=json", "institution": "UC Irvine / Amazon"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3615", "url": null, "sourceid": 128, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=GgX6dPJx9M", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 909, "modified": "2026-03-23T21:52:47.421836-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=GgX6dPJx9M", "resourcetype": "UriEventmedia"}, {"id": 1032, "file": "/media/PosterPDFs/MLSys%202026/3615.png", "modified": "2026-05-14T06:56:00.980571-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1033, "file": "/media/PosterPDFs/MLSys%202026/3615-thumb.png", "modified": "2026-05-14T06:56:01.047803-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "17", "related_events": ["http://mlsys.org/api/miniconf/events/3838?format=json"], "related_events_ids": [3838]}, {"id": 3761, "uid": "9778d5d219c5080b9a6a17bef029331c", "name": "Unified LLM Model for Power, Performance, and Area Prediction from Hardware Code", "authors": [{"id": 25630, "fullname": "Armin Abdollahi", "url": "http://mlsys.org/api/miniconf/users/25630?format=json", "institution": "University of Southern California"}, {"id": 27346, "fullname": "Mehdi Kamal", "url": "http://mlsys.org/api/miniconf/users/27346?format=json", "institution": "University of Southern California"}, {"id": 27347, "fullname": "Massoud Pedram", "url": "http://mlsys.org/api/miniconf/users/27347?format=json", "institution": "University of Southern California"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: ML for Systems", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3761", "url": null, "sourceid": -82, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T14:30:00-07:00", "endtime": "2026-05-20T14:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3688?format=json", "parent_id": 3688, "eventmedia": [{"id": 1052, "modified": "2026-05-14T18:42:16.684329-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3761.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3538?format=json"], "related_events_ids": [3538]}, {"id": 3536, "uid": "72b32a1f754ba1c09b3695e0cb6cde7f", "name": "FlashAttention-4: Algorithm and Kernel Pipelining Co-Design for Asymmetric Hardware Scaling", "authors": [{"id": 27338, "fullname": "Ted Zadouri", "url": "http://mlsys.org/api/miniconf/users/27338?format=json", "institution": "University of California, Los Angeles"}, {"id": 27339, "fullname": "Markus Hoehnerbach", "url": "http://mlsys.org/api/miniconf/users/27339?format=json", "institution": "Meta"}, {"id": 25645, "fullname": "Jay Shah", "url": "http://mlsys.org/api/miniconf/users/25645?format=json", "institution": "Colfax Research"}, {"id": 27340, "fullname": "Vijay Thakkar", "url": "http://mlsys.org/api/miniconf/users/27340?format=json", "institution": null}, {"id": 27341, "fullname": "Tri Dao", "url": "http://mlsys.org/api/miniconf/users/27341?format=json", "institution": null}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3536", "url": null, "sourceid": 57, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=mN5RtvuYl3", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 830, "modified": "2026-03-23T21:52:44.253699-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=mN5RtvuYl3", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "52", "related_events": ["http://mlsys.org/api/miniconf/events/3759?format=json"], "related_events_ids": [3759]}, {"id": 3564, "uid": "ec5decca5ed3d6b8079e2e7e7bacc9f2", "name": "PLA-Serve: A Prefill-Length-Aware LLM Serving System", "authors": [{"id": 17078, "fullname": "Jianshu She", "url": "http://mlsys.org/api/miniconf/users/17078?format=json", "institution": "MBZUAI"}, {"id": 27572, "fullname": "Zonghang Li", "url": "http://mlsys.org/api/miniconf/users/27572?format=json", "institution": "Mohamed bin Zayed University of Artificial Intelligence"}, {"id": 27573, "fullname": "HONGCHAO DU", "url": "http://mlsys.org/api/miniconf/users/27573?format=json", "institution": ""}, {"id": 27574, "fullname": "Shangyu Wu", "url": "http://mlsys.org/api/miniconf/users/27574?format=json", "institution": "Mohamed bin Zayed University of Artificial Intelligence"}, {"id": 27575, "fullname": "Wenhao Zheng", "url": "http://mlsys.org/api/miniconf/users/27575?format=json", "institution": "University of North Carolina at Chapel Hill"}, {"id": 16300, "fullname": "Eric Xing", "url": "http://mlsys.org/api/miniconf/users/16300?format=json", "institution": "MBZUAI, CMU, and Petuum Inc."}, {"id": 27577, "fullname": "Zhengzhong Liu", "url": "http://mlsys.org/api/miniconf/users/27577?format=json", "institution": "Mohamed bin Zayed University of Artificial Intelligence"}, {"id": 27578, "fullname": "Huaxiu Yao", "url": "http://mlsys.org/api/miniconf/users/27578?format=json", "institution": ""}, {"id": 27579, "fullname": "Chun Jason Xue", "url": "http://mlsys.org/api/miniconf/users/27579?format=json", "institution": "Mohamed bin Zayed University of Artificial Intelligence"}, {"id": 16309, "fullname": "Qirong Ho", "url": "http://mlsys.org/api/miniconf/users/16309?format=json", "institution": "MBZUAI"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3564", "url": null, "sourceid": 127, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=dzjCkSEDyG", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 858, "modified": "2026-03-23T21:52:45.430681-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=dzjCkSEDyG", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "20", "related_events": ["http://mlsys.org/api/miniconf/events/3787?format=json"], "related_events_ids": [3787]}, {"id": 3538, "uid": "9778d5d219c5080b9a6a17bef029331c", "name": "Unified LLM Model for Power, Performance, and Area Prediction from Hardware Code", "authors": [{"id": 25630, "fullname": "Armin Abdollahi", "url": "http://mlsys.org/api/miniconf/users/25630?format=json", "institution": "University of Southern California"}, {"id": 27346, "fullname": "Mehdi Kamal", "url": "http://mlsys.org/api/miniconf/users/27346?format=json", "institution": "University of Southern California"}, {"id": 27347, "fullname": "Massoud Pedram", "url": "http://mlsys.org/api/miniconf/users/27347?format=json", "institution": "University of Southern California"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3538", "url": null, "sourceid": 82, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=lpO7kxiayb", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 832, "modified": "2026-03-23T21:52:44.335537-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=lpO7kxiayb", "resourcetype": "UriEventmedia"}, {"id": 966, "file": "/media/PosterPDFs/MLSys%202026/3538-thumb.png", "modified": "2026-05-16T17:31:58.661788-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 965, "file": "/media/PosterPDFs/MLSys%202026/3538.png", "modified": "2026-05-16T17:31:58.578737-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "21", "related_events": ["http://mlsys.org/api/miniconf/events/3761?format=json"], "related_events_ids": [3761]}, {"id": 3524, "uid": "3416a75f4cea9109507cacd8e2f2aefc", "name": "Using Span Queries to Optimize Cache and Attention Locality", "authors": [{"id": 27258, "fullname": "Paul Castro", "url": "http://mlsys.org/api/miniconf/users/27258?format=json", "institution": "International Business Machines"}, {"id": 25924, "fullname": "Nick Mitchell", "url": "http://mlsys.org/api/miniconf/users/25924?format=json", "institution": "IBM Research"}, {"id": 27989, "fullname": "Nathan Ordonez", "url": "http://mlsys.org/api/miniconf/users/27989?format=json", "institution": "IBM Research"}, {"id": 27260, "fullname": "Thomas Parnell", "url": "http://mlsys.org/api/miniconf/users/27260?format=json", "institution": "IBM Research"}, {"id": 27261, "fullname": "Mudhakar Srivatsa", "url": "http://mlsys.org/api/miniconf/users/27261?format=json", "institution": "International Business Machines"}, {"id": 27262, "fullname": "Antoni Viros i Martin", "url": "http://mlsys.org/api/miniconf/users/27262?format=json", "institution": "International Business Machines"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3524", "url": null, "sourceid": 41, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=qcGGSXpFcM", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 818, "modified": "2026-03-23T21:52:43.795108-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=qcGGSXpFcM", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "22", "related_events": ["http://mlsys.org/api/miniconf/events/3747?format=json"], "related_events_ids": [3747]}, {"id": 3525, "uid": "a3f390d88e4c41f2747bfa2f1b5f87db", "name": "Automated Algorithm Design for Auto-Tuning Optimizers", "authors": [{"id": 27263, "fullname": "Floris-Jan Willemsen", "url": "http://mlsys.org/api/miniconf/users/27263?format=json", "institution": "Leiden University LIACS"}, {"id": 27264, "fullname": "Niki van Stein", "url": "http://mlsys.org/api/miniconf/users/27264?format=json", "institution": "LIACS, Leiden University"}, {"id": 27143, "fullname": "Ben van Werkhoven", "url": "http://mlsys.org/api/miniconf/users/27143?format=json", "institution": "Leiden University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3525", "url": null, "sourceid": 68, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=qKlHJCbY6m", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 819, "modified": "2026-03-23T21:52:43.828851-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=qKlHJCbY6m", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "23", "related_events": ["http://mlsys.org/api/miniconf/events/3748?format=json"], "related_events_ids": [3748]}, {"id": 3746, "uid": "e369853df766fa44e1ed0ff613f563bd", "name": "Kitty: Accurate and Efficient 2-bit KV Cache Quantization with Dynamic Channel-wise Precision Boost", "authors": [{"id": 27248, "fullname": "Haojun Xia", "url": "http://mlsys.org/api/miniconf/users/27248?format=json", "institution": "Google Research (Australia)"}, {"id": 23865, "fullname": "Xiaoxia Wu", "url": "http://mlsys.org/api/miniconf/users/23865?format=json", "institution": "TogtherAI"}, {"id": 25960, "fullname": "Jisen Li", "url": "http://mlsys.org/api/miniconf/users/25960?format=json", "institution": "Together AI"}, {"id": 27249, "fullname": "Tsai-chuan Wu", "url": "http://mlsys.org/api/miniconf/users/27249?format=json", "institution": "AMD"}, {"id": 27250, "fullname": "Junxiong Wang", "url": "http://mlsys.org/api/miniconf/users/27250?format=json", "institution": "TogetherAI"}, {"id": 27251, "fullname": "Jue Wang", "url": "http://mlsys.org/api/miniconf/users/27251?format=json", "institution": "Together AI"}, {"id": 27252, "fullname": "Chenxi Li", "url": "http://mlsys.org/api/miniconf/users/27252?format=json", "institution": "Together AI"}, {"id": 27253, "fullname": "Aman Singhal", "url": "http://mlsys.org/api/miniconf/users/27253?format=json", "institution": "Together AI"}, {"id": 24132, "fullname": "Alay Dilipbhai Shah", "url": "http://mlsys.org/api/miniconf/users/24132?format=json", "institution": "Together AI"}, {"id": 28439, "fullname": "Alpay Ariyak", "url": "http://mlsys.org/api/miniconf/users/28439?format=json", "institution": "TogetherAI"}, {"id": 27255, "fullname": "Donglin Zhuang", "url": "http://mlsys.org/api/miniconf/users/27255?format=json", "institution": "The University of Sydney"}, {"id": 27256, "fullname": "Zhongzhu Zhou", "url": "http://mlsys.org/api/miniconf/users/27256?format=json", "institution": "Together.AI &amp; University of Sydney"}, {"id": 18231, "fullname": "Ben Athiwaratkun", "url": "http://mlsys.org/api/miniconf/users/18231?format=json", "institution": null}, {"id": 28440, "fullname": "Zhen Zheng", "url": "http://mlsys.org/api/miniconf/users/28440?format=json", "institution": "ByteDance Inc."}, {"id": 14753, "fullname": "Shuaiwen Song", "url": "http://mlsys.org/api/miniconf/users/14753?format=json", "institution": "University of Sydney"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 3", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3746", "url": "https://github.com/Summer-Summer/Kitty", "sourceid": -34, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T14:45:00-07:00", "endtime": "2026-05-20T15:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3687?format=json", "parent_id": 3687, "eventmedia": [{"id": 998, "modified": "2026-05-13T06:38:19.231659-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3746.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3523?format=json"], "related_events_ids": [3523]}, {"id": 3759, "uid": "72b32a1f754ba1c09b3695e0cb6cde7f", "name": "FlashAttention-4: Algorithm and Kernel Pipelining Co-Design for Asymmetric Hardware Scaling", "authors": [{"id": 27338, "fullname": "Ted Zadouri", "url": "http://mlsys.org/api/miniconf/users/27338?format=json", "institution": "University of California, Los Angeles"}, {"id": 27339, "fullname": "Markus Hoehnerbach", "url": "http://mlsys.org/api/miniconf/users/27339?format=json", "institution": "Meta"}, {"id": 25645, "fullname": "Jay Shah", "url": "http://mlsys.org/api/miniconf/users/25645?format=json", "institution": "Colfax Research"}, {"id": 27340, "fullname": "Vijay Thakkar", "url": "http://mlsys.org/api/miniconf/users/27340?format=json", "institution": null}, {"id": 27341, "fullname": "Tri Dao", "url": "http://mlsys.org/api/miniconf/users/27341?format=json", "institution": null}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Efficient Computation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3759", "url": null, "sourceid": -57, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-22T09:00:00-07:00", "endtime": "2026-05-22T09:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3722?format=json", "parent_id": 3722, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3536?format=json"], "related_events_ids": [3536]}, {"id": 3523, "uid": "e369853df766fa44e1ed0ff613f563bd", "name": "Kitty: Accurate and Efficient 2-bit KV Cache Quantization with Dynamic Channel-wise Precision Boost", "authors": [{"id": 27248, "fullname": "Haojun Xia", "url": "http://mlsys.org/api/miniconf/users/27248?format=json", "institution": "Google Research (Australia)"}, {"id": 23865, "fullname": "Xiaoxia Wu", "url": "http://mlsys.org/api/miniconf/users/23865?format=json", "institution": "TogtherAI"}, {"id": 25960, "fullname": "Jisen Li", "url": "http://mlsys.org/api/miniconf/users/25960?format=json", "institution": "Together AI"}, {"id": 27249, "fullname": "Tsai-chuan Wu", "url": "http://mlsys.org/api/miniconf/users/27249?format=json", "institution": "AMD"}, {"id": 27250, "fullname": "Junxiong Wang", "url": "http://mlsys.org/api/miniconf/users/27250?format=json", "institution": "TogetherAI"}, {"id": 27251, "fullname": "Jue Wang", "url": "http://mlsys.org/api/miniconf/users/27251?format=json", "institution": "Together AI"}, {"id": 27252, "fullname": "Chenxi Li", "url": "http://mlsys.org/api/miniconf/users/27252?format=json", "institution": "Together AI"}, {"id": 27253, "fullname": "Aman Singhal", "url": "http://mlsys.org/api/miniconf/users/27253?format=json", "institution": "Together AI"}, {"id": 24132, "fullname": "Alay Dilipbhai Shah", "url": "http://mlsys.org/api/miniconf/users/24132?format=json", "institution": "Together AI"}, {"id": 28439, "fullname": "Alpay Ariyak", "url": "http://mlsys.org/api/miniconf/users/28439?format=json", "institution": "TogetherAI"}, {"id": 27255, "fullname": "Donglin Zhuang", "url": "http://mlsys.org/api/miniconf/users/27255?format=json", "institution": "The University of Sydney"}, {"id": 27256, "fullname": "Zhongzhu Zhou", "url": "http://mlsys.org/api/miniconf/users/27256?format=json", "institution": "Together.AI &amp; University of Sydney"}, {"id": 18231, "fullname": "Ben Athiwaratkun", "url": "http://mlsys.org/api/miniconf/users/18231?format=json", "institution": null}, {"id": 28440, "fullname": "Zhen Zheng", "url": "http://mlsys.org/api/miniconf/users/28440?format=json", "institution": "ByteDance Inc."}, {"id": 14753, "fullname": "Shuaiwen Song", "url": "http://mlsys.org/api/miniconf/users/14753?format=json", "institution": "University of Sydney"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3523", "url": "https://github.com/Summer-Summer/Kitty", "sourceid": 34, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=r3mQiuYKIN", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 817, "modified": "2026-03-23T21:52:43.761494-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=r3mQiuYKIN", "resourcetype": "UriEventmedia"}, {"id": 1252, "file": "/media/PosterPDFs/MLSys%202026/3523.png", "modified": "2026-07-02T06:04:25.872900-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1253, "file": "/media/PosterPDFs/MLSys%202026/3523-thumb.png", "modified": "2026-07-07T06:23:20.775090-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "24", "related_events": ["http://mlsys.org/api/miniconf/events/3746?format=json"], "related_events_ids": [3746]}, {"id": 3633, "uid": "f033ab37c30201f73f142449d037028d", "name": "RaidServe: High-performance Resilient Serving", "authors": [{"id": 20912, "fullname": "Ziyi Xu", "url": "http://mlsys.org/api/miniconf/users/20912?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 20911, "fullname": "Zhiqiang Xie", "url": "http://mlsys.org/api/miniconf/users/20911?format=json", "institution": "Stanford University"}, {"id": 23398, "fullname": "Swapnil Gandhi", "url": "http://mlsys.org/api/miniconf/users/23398?format=json", "institution": "Stanford"}, {"id": 20928, "fullname": "Christos Kozyrakis", "url": "http://mlsys.org/api/miniconf/users/20928?format=json", "institution": "Computer Science Department, Stanford University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3633", "url": null, "sourceid": 80, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=5pl9fdbEkq", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 927, "modified": "2026-03-23T21:52:48.141148-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=5pl9fdbEkq", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "25", "related_events": ["http://mlsys.org/api/miniconf/events/3856?format=json"], "related_events_ids": [3856]}, {"id": 3584, "uid": "c51ce410c124a10e0db5e4b97fc2af39", "name": "fabric-lib: RDMA Point-to-Point Communication for LLM Systems", "authors": [{"id": 27645, "fullname": "Nandor Licker", "url": "http://mlsys.org/api/miniconf/users/27645?format=json", "institution": "Perplexity AI"}, {"id": 23368, "fullname": "Kevin Hu", "url": "http://mlsys.org/api/miniconf/users/23368?format=json", "institution": "Perplexity AI"}, {"id": 23407, "fullname": "Vladimir Zaytsev", "url": "http://mlsys.org/api/miniconf/users/23407?format=json", "institution": "Perplexity AI"}, {"id": 21008, "fullname": "Lequn Chen", "url": "http://mlsys.org/api/miniconf/users/21008?format=json", "institution": "Perplexity AI"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3584", "url": null, "sourceid": 13, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=SjVa05wEiY", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 878, "modified": "2026-03-23T21:52:46.236179-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=SjVa05wEiY", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "28", "related_events": ["http://mlsys.org/api/miniconf/events/3807?format=json"], "related_events_ids": [3807]}, {"id": 3856, "uid": "f033ab37c30201f73f142449d037028d", "name": "RaidServe: High-performance Resilient Serving", "authors": [{"id": 20912, "fullname": "Ziyi Xu", "url": "http://mlsys.org/api/miniconf/users/20912?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 20911, "fullname": "Zhiqiang Xie", "url": "http://mlsys.org/api/miniconf/users/20911?format=json", "institution": "Stanford University"}, {"id": 23398, "fullname": "Swapnil Gandhi", "url": "http://mlsys.org/api/miniconf/users/23398?format=json", "institution": "Stanford"}, {"id": 20928, "fullname": "Christos Kozyrakis", "url": "http://mlsys.org/api/miniconf/users/20928?format=json", "institution": "Computer Science Department, Stanford University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 4", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3856", "url": null, "sourceid": -80, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T15:15:00-07:00", "endtime": "2026-05-20T15:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3691?format=json", "parent_id": 3691, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3633?format=json"], "related_events_ids": [3633]}, {"id": 3827, "uid": "c74d97b01eae257e44aa9d5bade97baf", "name": "XProf: An Open, Scalable, and Extensible Profiling System for the Modern ML Stack", "authors": [{"id": 28962, "fullname": "Robert Hundt", "url": "http://mlsys.org/api/miniconf/users/28962?format=json", "institution": "Google"}, {"id": 11194, "fullname": "Naveen Kumar", "url": "http://mlsys.org/api/miniconf/users/11194?format=json", "institution": "Google"}, {"id": 27182, "fullname": "Jose Baiocchi Paredes", "url": "http://mlsys.org/api/miniconf/users/27182?format=json", "institution": "Google"}, {"id": 27766, "fullname": "Scott Goodson", "url": "http://mlsys.org/api/miniconf/users/27766?format=json", "institution": null}, {"id": 27160, "fullname": "Clive Verghese", "url": "http://mlsys.org/api/miniconf/users/27160?format=json", "institution": "Google"}, {"id": 26196, "fullname": "Prasanna Rengasamy", "url": "http://mlsys.org/api/miniconf/users/26196?format=json", "institution": "google"}, {"id": 27761, "fullname": "Kelvin Le", "url": "http://mlsys.org/api/miniconf/users/27761?format=json", "institution": null}, {"id": 25661, "fullname": "Jiya Zhang", "url": "http://mlsys.org/api/miniconf/users/25661?format=json", "institution": "Google"}, {"id": 26205, "fullname": "Charles Alaras", "url": "http://mlsys.org/api/miniconf/users/26205?format=json", "institution": "Google"}, {"id": 26287, "fullname": "Yin Zhang", "url": "http://mlsys.org/api/miniconf/users/26287?format=json", "institution": "Google"}, {"id": 27754, "fullname": "Kan Cai", "url": "http://mlsys.org/api/miniconf/users/27754?format=json", "institution": null}, {"id": 27753, "fullname": "Jiten Thakkar", "url": "http://mlsys.org/api/miniconf/users/27753?format=json", "institution": null}, {"id": 27759, "fullname": "Sai Ganesh Bandiatmakuri", "url": "http://mlsys.org/api/miniconf/users/27759?format=json", "institution": "Google"}, {"id": 27769, "fullname": "Yogesh SY", "url": "http://mlsys.org/api/miniconf/users/27769?format=json", "institution": null}, {"id": 23805, "fullname": "Ani Udipi", "url": "http://mlsys.org/api/miniconf/users/23805?format=json", "institution": "Google"}, {"id": 27760, "fullname": "Vikas Agarwal", "url": "http://mlsys.org/api/miniconf/users/27760?format=json", "institution": null}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Benchmarks and Evaluation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3827", "url": "https://openxla.org/xprof", "sourceid": -16, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T16:30:00-07:00", "endtime": "2026-05-21T16:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3717?format=json", "parent_id": 3717, "eventmedia": [{"id": 1085, "modified": "2026-05-15T09:57:27.625082-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3827.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3604?format=json"], "related_events_ids": [3604]}, {"id": 3736, "uid": "1c383cd30b7c298ab50293adfecb7b18", "name": "GhostServe: A Lightweight Checkpointing System in the Shadow for Fault-Tolerant LLM Serving", "authors": [{"id": 25189, "fullname": "Shakya Jayakody", "url": "http://mlsys.org/api/miniconf/users/25189?format=json", "institution": "University of Central Florida"}, {"id": 17878, "fullname": "Youpeng Zhao", "url": "http://mlsys.org/api/miniconf/users/17878?format=json", "institution": "University of Central Florida"}, {"id": 27193, "fullname": "Chinmay Dhanraj Nehate", "url": "http://mlsys.org/api/miniconf/users/27193?format=json", "institution": "University of Central Florida"}, {"id": 26288, "fullname": "Jun Wang", "url": "http://mlsys.org/api/miniconf/users/26288?format=json", "institution": "University of Central Florida"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 4", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3736", "url": "https://github.com/project-ghostserve/26mlsys-AE-GhostServe", "sourceid": -35, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T16:15:00-07:00", "endtime": "2026-05-20T16:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3691?format=json", "parent_id": 3691, "eventmedia": [{"id": 989, "modified": "2026-05-15T06:51:48.791631-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3736_8a0AKFA.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3513?format=json"], "related_events_ids": [3513]}, {"id": 3539, "uid": "9b8619251a19057cff70779273e95aa6", "name": "Practical Adversarial Multi-Armed Bandits with Sublinear Runtime", "authors": [{"id": 21072, "fullname": "Kasper Overgaard Mortensen", "url": "http://mlsys.org/api/miniconf/users/21072?format=json", "institution": "Aarhus University"}, {"id": 27348, "fullname": "Ama Bembua Bainson", "url": "http://mlsys.org/api/miniconf/users/27348?format=json", "institution": "Aarhus University"}, {"id": 27349, "fullname": "Mathias Tversted", "url": "http://mlsys.org/api/miniconf/users/27349?format=json", "institution": null}, {"id": 27350, "fullname": "Kristoffer Strube", "url": "http://mlsys.org/api/miniconf/users/27350?format=json", "institution": "Kristoffer Strube Consulting"}, {"id": 27351, "fullname": "Renata Borovica-Gajic", "url": "http://mlsys.org/api/miniconf/users/27351?format=json", "institution": "University of Melbourne"}, {"id": 27352, "fullname": "Andrea Paudice", "url": "http://mlsys.org/api/miniconf/users/27352?format=json", "institution": "Aarhus University"}, {"id": 21058, "fullname": "Davide Mottin", "url": "http://mlsys.org/api/miniconf/users/21058?format=json", "institution": "Aarhus University"}, {"id": 21084, "fullname": "Panagiotis Karras", "url": "http://mlsys.org/api/miniconf/users/21084?format=json", "institution": "Copenhagen University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3539", "url": null, "sourceid": 130, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=lfHvcstuo2", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 833, "modified": "2026-03-23T21:52:44.377815-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=lfHvcstuo2", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "20", "related_events": ["http://mlsys.org/api/miniconf/events/3762?format=json"], "related_events_ids": [3762]}, {"id": 3601, "uid": "c45147dee729311ef5b5c3003946c48f", "name": "Pylo: Towards Accessible Learned Optimizers in PyTorch", "authors": [{"id": 27741, "fullname": "Paul Janson", "url": "http://mlsys.org/api/miniconf/users/27741?format=json", "institution": "Concordia University"}, {"id": 27742, "fullname": "Benjamin Th\u00e9rien", "url": "http://mlsys.org/api/miniconf/users/27742?format=json", "institution": "Mila / Universit\u00e9 de Montr\u00e9al"}, {"id": 27743, "fullname": "Quentin Anthony", "url": "http://mlsys.org/api/miniconf/users/27743?format=json", "institution": "EleutherAI"}, {"id": 27744, "fullname": "Xiaolong Huang", "url": "http://mlsys.org/api/miniconf/users/27744?format=json", "institution": "Concordia University"}, {"id": 27745, "fullname": "Abhinav Moudgil", "url": "http://mlsys.org/api/miniconf/users/27745?format=json", "institution": "Concordia University"}, {"id": 27746, "fullname": "Eugene Belilovsky", "url": "http://mlsys.org/api/miniconf/users/27746?format=json", "institution": "Concordia University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3601", "url": "https://belilovsky-lab.github.io/pylo/", "sourceid": 116, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=M9V1n4KxSd", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 895, "modified": "2026-03-23T21:52:46.873684-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=M9V1n4KxSd", "resourcetype": "UriEventmedia"}, {"id": 1004, "file": "/media/PosterPDFs/MLSys%202026/3601-thumb.png", "modified": "2026-05-13T08:40:38.841225-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1011, "file": "/media/PosterPDFs/MLSys%202026/3601.png", "modified": "2026-05-13T14:50:52.734099-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "29", "related_events": ["http://mlsys.org/api/miniconf/events/3824?format=json"], "related_events_ids": [3824]}, {"id": 3604, "uid": "c74d97b01eae257e44aa9d5bade97baf", "name": "XProf: An Open, Scalable, and Extensible Profiling System for the Modern ML Stack", "authors": [{"id": 28962, "fullname": "Robert Hundt", "url": "http://mlsys.org/api/miniconf/users/28962?format=json", "institution": "Google"}, {"id": 11194, "fullname": "Naveen Kumar", "url": "http://mlsys.org/api/miniconf/users/11194?format=json", "institution": "Google"}, {"id": 27182, "fullname": "Jose Baiocchi Paredes", "url": "http://mlsys.org/api/miniconf/users/27182?format=json", "institution": "Google"}, {"id": 27766, "fullname": "Scott Goodson", "url": "http://mlsys.org/api/miniconf/users/27766?format=json", "institution": null}, {"id": 27160, "fullname": "Clive Verghese", "url": "http://mlsys.org/api/miniconf/users/27160?format=json", "institution": "Google"}, {"id": 26196, "fullname": "Prasanna Rengasamy", "url": "http://mlsys.org/api/miniconf/users/26196?format=json", "institution": "google"}, {"id": 27761, "fullname": "Kelvin Le", "url": "http://mlsys.org/api/miniconf/users/27761?format=json", "institution": null}, {"id": 25661, "fullname": "Jiya Zhang", "url": "http://mlsys.org/api/miniconf/users/25661?format=json", "institution": "Google"}, {"id": 26205, "fullname": "Charles Alaras", "url": "http://mlsys.org/api/miniconf/users/26205?format=json", "institution": "Google"}, {"id": 26287, "fullname": "Yin Zhang", "url": "http://mlsys.org/api/miniconf/users/26287?format=json", "institution": "Google"}, {"id": 27754, "fullname": "Kan Cai", "url": "http://mlsys.org/api/miniconf/users/27754?format=json", "institution": null}, {"id": 27753, "fullname": "Jiten Thakkar", "url": "http://mlsys.org/api/miniconf/users/27753?format=json", "institution": null}, {"id": 27759, "fullname": "Sai Ganesh Bandiatmakuri", "url": "http://mlsys.org/api/miniconf/users/27759?format=json", "institution": "Google"}, {"id": 27769, "fullname": "Yogesh SY", "url": "http://mlsys.org/api/miniconf/users/27769?format=json", "institution": null}, {"id": 23805, "fullname": "Ani Udipi", "url": "http://mlsys.org/api/miniconf/users/23805?format=json", "institution": "Google"}, {"id": 27760, "fullname": "Vikas Agarwal", "url": "http://mlsys.org/api/miniconf/users/27760?format=json", "institution": null}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3604", "url": "https://openxla.org/xprof", "sourceid": 16, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=KqRLAdGK6C", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 898, "modified": "2026-03-23T21:52:46.968487-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=KqRLAdGK6C", "resourcetype": "UriEventmedia"}, {"id": 1013, "file": "/media/PosterPDFs/MLSys%202026/3604.png", "modified": "2026-05-13T15:14:28.074166-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1014, "file": "/media/PosterPDFs/MLSys%202026/3604-thumb.png", "modified": "2026-05-13T15:14:28.159848-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1086, "modified": "2026-05-15T10:18:33.046744-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3604_M1UoXGo.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "34", "related_events": ["http://mlsys.org/api/miniconf/events/3827?format=json"], "related_events_ids": [3827]}, {"id": 3815, "uid": "07e1cd7dca89a1678042477183b7ac3f", "name": "Event Tensor: A Unified Abstraction for Compiling Dynamic Megakernel", "authors": [{"id": 16930, "fullname": "Hongyi Jin", "url": "http://mlsys.org/api/miniconf/users/16930?format=json", "institution": "Carnegie Mellon University"}, {"id": 15229, "fullname": "Bohan Hou", "url": "http://mlsys.org/api/miniconf/users/15229?format=json", "institution": "Carnegie Mellon University"}, {"id": 27670, "fullname": "Guanjie Wang", "url": "http://mlsys.org/api/miniconf/users/27670?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 16412, "fullname": "Ruihang Lai", "url": "http://mlsys.org/api/miniconf/users/16412?format=json", "institution": "Carnegie Mellon University"}, {"id": 27671, "fullname": "Jinqi Chen", "url": "http://mlsys.org/api/miniconf/users/27671?format=json", "institution": "School of Computer Science, Carnegie Mellon University"}, {"id": 12026, "fullname": "Zihao Ye", "url": "http://mlsys.org/api/miniconf/users/12026?format=json", "institution": "NVIDIA"}, {"id": 20904, "fullname": "Yaxing Cai", "url": "http://mlsys.org/api/miniconf/users/20904?format=json", "institution": "NVIDIA"}, {"id": 23351, "fullname": "Yixin Dong", "url": "http://mlsys.org/api/miniconf/users/23351?format=json", "institution": "Carnegie Mellon University"}, {"id": 27672, "fullname": "Xinhao Cheng", "url": "http://mlsys.org/api/miniconf/users/27672?format=json", "institution": "Carnegie Mellon University"}, {"id": 25596, "fullname": "Zhihao Zhang", "url": "http://mlsys.org/api/miniconf/users/25596?format=json", "institution": "Carnegie Mellon University"}, {"id": 20906, "fullname": "Yilong Zhao", "url": "http://mlsys.org/api/miniconf/users/20906?format=json", "institution": "University of California, Berkeley"}, {"id": 28960, "fullname": "Yingyi Huang", "url": "http://mlsys.org/api/miniconf/users/28960?format=json", "institution": "NVIDIA"}, {"id": 27674, "fullname": "Lijie Yang", "url": "http://mlsys.org/api/miniconf/users/27674?format=json", "institution": "Princeton University"}, {"id": 27675, "fullname": "Jinchen Jiang", "url": "http://mlsys.org/api/miniconf/users/27675?format=json", "institution": "Tsinghua University"}, {"id": 27676, "fullname": "Gabriele Oliaro", "url": "http://mlsys.org/api/miniconf/users/27676?format=json", "institution": "Carnegie Mellon University"}, {"id": 27677, "fullname": "Jianan Ji", "url": "http://mlsys.org/api/miniconf/users/27677?format=json", "institution": null}, {"id": 27678, "fullname": "Xupeng Miao", "url": "http://mlsys.org/api/miniconf/users/27678?format=json", "institution": "Purdue University"}, {"id": 12410, "fullname": "Vinod Grover", "url": "http://mlsys.org/api/miniconf/users/12410?format=json", "institution": "NVIDIA"}, {"id": 12052, "fullname": "Todd Mowry", "url": "http://mlsys.org/api/miniconf/users/12052?format=json", "institution": "Carnegie Mellon University"}, {"id": 16147, "fullname": "Zhihao Jia", "url": "http://mlsys.org/api/miniconf/users/16147?format=json", "institution": "Carnegie Mellon University and LithosAI"}, {"id": 11984, "fullname": "Tianqi Chen", "url": "http://mlsys.org/api/miniconf/users/11984?format=json", "institution": "CMU"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Compilers and Kernels", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3815", "url": null, "sourceid": -119, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T16:45:00-07:00", "endtime": "2026-05-21T17:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3718?format=json", "parent_id": 3718, "eventmedia": [{"id": 1135, "modified": "2026-05-15T22:07:55.580286-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3815.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3592?format=json"], "related_events_ids": [3592]}, {"id": 3800, "uid": "a3c65c2974270fd093ee8a9bf8ae7d0b", "name": "ProTrain: Efficient LLM Training via Automatic Memory Management", "authors": [{"id": 27620, "fullname": "Hanmei Yang", "url": "http://mlsys.org/api/miniconf/users/27620?format=json", "institution": "UMass Amherst"}, {"id": 28465, "fullname": "Jin Zhou", "url": "http://mlsys.org/api/miniconf/users/28465?format=json", "institution": "University of Massachusetts at Amherst"}, {"id": 27622, "fullname": "Yao Fu", "url": "http://mlsys.org/api/miniconf/users/27622?format=json", "institution": "Advanced Micro Devices"}, {"id": 28466, "fullname": "Xiaoqun Wang", "url": "http://mlsys.org/api/miniconf/users/28466?format=json", "institution": "Advanced Micro Devices"}, {"id": 27624, "fullname": "Ramine Roane", "url": "http://mlsys.org/api/miniconf/users/27624?format=json", "institution": "Advanced Micro Devices"}, {"id": 11878, "fullname": "Hui Guan", "url": "http://mlsys.org/api/miniconf/users/11878?format=json", "institution": "University of Massachusetts, Amherst; Amazon"}, {"id": 27625, "fullname": "Tongping Liu", "url": "http://mlsys.org/api/miniconf/users/27625?format=json", "institution": "XPeng Motors"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3800", "url": null, "sourceid": -108, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T09:00:00-07:00", "endtime": "2026-05-20T09:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3679?format=json", "parent_id": 3679, "eventmedia": [{"id": 1061, "modified": "2026-05-19T22:17:46.629965-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3800_lv912MR.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3577?format=json"], "related_events_ids": [3577]}, {"id": 3511, "uid": "d1fe173d08e959397adf34b1d77e88d7", "name": "Machine Learning Fleet Efficiency: Improving TPU Systems at Scale with ML Productivity Goodput", "authors": [{"id": 27181, "fullname": "Arissa Wongpanich", "url": "http://mlsys.org/api/miniconf/users/27181?format=json", "institution": "Google"}, {"id": 11197, "fullname": "Tayo Oguntebi", "url": "http://mlsys.org/api/miniconf/users/11197?format=json", "institution": "Google LLC"}, {"id": 27182, "fullname": "Jose Baiocchi Paredes", "url": "http://mlsys.org/api/miniconf/users/27182?format=json", "institution": "Google"}, {"id": 11105, "fullname": "Yu Wang", "url": "http://mlsys.org/api/miniconf/users/11105?format=json", "institution": "Harvard University"}, {"id": 27183, "fullname": "Phitchaya Phothilimthana", "url": "http://mlsys.org/api/miniconf/users/27183?format=json", "institution": "OpenAI"}, {"id": 27184, "fullname": "Ritwika Mitra", "url": "http://mlsys.org/api/miniconf/users/27184?format=json", "institution": "Google"}, {"id": 27185, "fullname": "Zongwei Zhou", "url": "http://mlsys.org/api/miniconf/users/27185?format=json", "institution": null}, {"id": 11194, "fullname": "Naveen Kumar", "url": "http://mlsys.org/api/miniconf/users/11194?format=json", "institution": "Google"}, {"id": 10754, "fullname": "Vijay Janapa Reddi", "url": "http://mlsys.org/api/miniconf/users/10754?format=json", "institution": "Harvard University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3511", "url": null, "sourceid": 79, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=y31QSL9yMG", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 805, "modified": "2026-03-23T21:52:43.351317-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=y31QSL9yMG", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "44", "related_events": ["http://mlsys.org/api/miniconf/events/3734?format=json"], "related_events_ids": [3734]}, {"id": 3560, "uid": "7f1de29e6da19d22b51c68001e7e0e54", "name": "Learning from Less: Measuring the Effectiveness of RLVR in Low Data and Compute Regimes", "authors": [{"id": 27558, "fullname": "Justin Bauer", "url": "http://mlsys.org/api/miniconf/users/27558?format=json", "institution": "Snorkel AI"}, {"id": 27559, "fullname": "Thomas Walshe", "url": "http://mlsys.org/api/miniconf/users/27559?format=json", "institution": "Reflection AI"}, {"id": 27560, "fullname": "Derek Pham", "url": "http://mlsys.org/api/miniconf/users/27560?format=json", "institution": "Snorkel AI"}, {"id": 27561, "fullname": "Harit Vishwakarma", "url": "http://mlsys.org/api/miniconf/users/27561?format=json", "institution": "University of Wisconsin, Madison"}, {"id": 27562, "fullname": "Armin Parchami", "url": "http://mlsys.org/api/miniconf/users/27562?format=json", "institution": "Snorkel AI"}, {"id": 27563, "fullname": "Frederic Sala", "url": "http://mlsys.org/api/miniconf/users/27563?format=json", "institution": "University of Wisconsin, Madison"}, {"id": 27564, "fullname": "Paroma Varma", "url": "http://mlsys.org/api/miniconf/users/27564?format=json", "institution": "Snorkel AI"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3560", "url": null, "sourceid": 135, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=fV4t4kYvgi", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 854, "modified": "2026-03-23T21:52:45.251890-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=fV4t4kYvgi", "resourcetype": "UriEventmedia"}, {"id": 1044, "file": "/media/PosterPDFs/MLSys%202026/3560.png", "modified": "2026-05-14T11:10:24.265581-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1045, "file": "/media/PosterPDFs/MLSys%202026/3560-thumb.png", "modified": "2026-05-14T11:10:24.380700-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "31", "related_events": ["http://mlsys.org/api/miniconf/events/3783?format=json"], "related_events_ids": [3783]}, {"id": 3626, "uid": "43ec517d68b6edd3015b3edc9a11367b", "name": "BEAM: Joint Resource\u2013Power Optimization for Energy-Efficient LLM Inference under SLO contraints", "authors": [{"id": 27852, "fullname": "Hyunjae Lee", "url": "http://mlsys.org/api/miniconf/users/27852?format=json", "institution": "Korea Advanced Institute of Science and Technology"}, {"id": 27853, "fullname": "Sangjin Choi", "url": "http://mlsys.org/api/miniconf/users/27853?format=json", "institution": "Korea Advanced Institute of Science &amp; Technology"}, {"id": 27854, "fullname": "Seungjae Lim", "url": "http://mlsys.org/api/miniconf/users/27854?format=json", "institution": "Korea Advanced Institute of Science &amp; Technology"}, {"id": 27855, "fullname": "Youngjin Kwon", "url": "http://mlsys.org/api/miniconf/users/27855?format=json", "institution": "Korea Advanced Institute of Science &amp; Technology"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3626", "url": null, "sourceid": 81, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=BfNBXM8CCT", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 920, "modified": "2026-03-23T21:52:47.855700-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=BfNBXM8CCT", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "1", "related_events": ["http://mlsys.org/api/miniconf/events/3849?format=json"], "related_events_ids": [3849]}, {"id": 3551, "uid": "ac627ab1ccbdb62ec96e702f07f6425b", "name": "CATWILD: Compiler Autotuning for TPU workloads in the Wild", "authors": [{"id": 28452, "fullname": "Ignacio Cano", "url": "http://mlsys.org/api/miniconf/users/28452?format=json", "institution": "Google"}, {"id": 11105, "fullname": "Yu Wang", "url": "http://mlsys.org/api/miniconf/users/11105?format=json", "institution": "Harvard University"}, {"id": 12264, "fullname": "Mike Burrows", "url": "http://mlsys.org/api/miniconf/users/12264?format=json", "institution": "Google Brain"}, {"id": 27433, "fullname": "Ziqiang Feng", "url": "http://mlsys.org/api/miniconf/users/27433?format=json", "institution": null}, {"id": 27434, "fullname": "Matheus Camargo", "url": "http://mlsys.org/api/miniconf/users/27434?format=json", "institution": "Google"}, {"id": 27436, "fullname": "Chao Wang", "url": "http://mlsys.org/api/miniconf/users/27436?format=json", "institution": ""}, {"id": 27437, "fullname": "David Liu", "url": "http://mlsys.org/api/miniconf/users/27437?format=json", "institution": "Google"}, {"id": 27438, "fullname": "Tengyu Sun", "url": "http://mlsys.org/api/miniconf/users/27438?format=json", "institution": "Google"}, {"id": 27435, "fullname": "Alexander Wertheim", "url": "http://mlsys.org/api/miniconf/users/27435?format=json", "institution": "Google"}, {"id": 27181, "fullname": "Arissa Wongpanich", "url": "http://mlsys.org/api/miniconf/users/27181?format=json", "institution": "Google"}, {"id": 27439, "fullname": "Christof Angermueller", "url": "http://mlsys.org/api/miniconf/users/27439?format=json", "institution": "Google"}, {"id": 27440, "fullname": "Hyojun Kim", "url": "http://mlsys.org/api/miniconf/users/27440?format=json", "institution": null}, {"id": 27441, "fullname": "Wenqi Cao", "url": "http://mlsys.org/api/miniconf/users/27441?format=json", "institution": null}, {"id": 27453, "fullname": "Aleksey Orekhov", "url": "http://mlsys.org/api/miniconf/users/27453?format=json", "institution": null}, {"id": 12263, "fullname": "Amit Sabne", "url": "http://mlsys.org/api/miniconf/users/12263?format=json", "institution": "Google"}, {"id": 27442, "fullname": "Emma Sevastian", "url": "http://mlsys.org/api/miniconf/users/27442?format=json", "institution": null}, {"id": 27446, "fullname": "Mehrdad Khani", "url": "http://mlsys.org/api/miniconf/users/27446?format=json", "institution": "Google"}, {"id": 27443, "fullname": "Karthik Murthy", "url": "http://mlsys.org/api/miniconf/users/27443?format=json", "institution": null}, {"id": 27444, "fullname": "Berkin Ilbeyi", "url": "http://mlsys.org/api/miniconf/users/27444?format=json", "institution": "Google"}, {"id": 28453, "fullname": "Subhankar Shah", "url": "http://mlsys.org/api/miniconf/users/28453?format=json", "institution": "Google"}, {"id": 27445, "fullname": "Ryan Lefever", "url": "http://mlsys.org/api/miniconf/users/27445?format=json", "institution": "Google"}, {"id": 28454, "fullname": "Arjun Khare", "url": "http://mlsys.org/api/miniconf/users/28454?format=json", "institution": "Google"}, {"id": 27448, "fullname": "Ankit Sinha", "url": "http://mlsys.org/api/miniconf/users/27448?format=json", "institution": "Google"}, {"id": 27449, "fullname": "Peter Ma", "url": "http://mlsys.org/api/miniconf/users/27449?format=json", "institution": null}, {"id": 27450, "fullname": "Matt Bierbaum", "url": "http://mlsys.org/api/miniconf/users/27450?format=json", "institution": null}, {"id": 27451, "fullname": "Jeremiah Wilke", "url": "http://mlsys.org/api/miniconf/users/27451?format=json", "institution": null}, {"id": 27456, "fullname": "Emily Donahue", "url": "http://mlsys.org/api/miniconf/users/27456?format=json", "institution": "Cornell University"}, {"id": 27457, "fullname": "Sami Abu-El-Haija", "url": "http://mlsys.org/api/miniconf/users/27457?format=json", "institution": "Research, Google"}, {"id": 27452, "fullname": "Nikhil Sarda", "url": "http://mlsys.org/api/miniconf/users/27452?format=json", "institution": "Research, Google"}, {"id": 27146, "fullname": "Vineetha Govindaraj", "url": "http://mlsys.org/api/miniconf/users/27146?format=json", "institution": "Deepmind"}, {"id": 27459, "fullname": "Shobha Vasudevan", "url": "http://mlsys.org/api/miniconf/users/27459?format=json", "institution": null}, {"id": 27455, "fullname": "Kirill Gugaev", "url": "http://mlsys.org/api/miniconf/users/27455?format=json", "institution": null}, {"id": 27460, "fullname": "Idan Nachman", "url": "http://mlsys.org/api/miniconf/users/27460?format=json", "institution": null}, {"id": 27454, "fullname": "Jie Sun", "url": "http://mlsys.org/api/miniconf/users/27454?format=json", "institution": null}, {"id": 27182, "fullname": "Jose Baiocchi Paredes", "url": "http://mlsys.org/api/miniconf/users/27182?format=json", "institution": "Google"}, {"id": 27461, "fullname": "Samrat Ghosh", "url": "http://mlsys.org/api/miniconf/users/27461?format=json", "institution": null}, {"id": 27462, "fullname": "Domagoj Babic", "url": "http://mlsys.org/api/miniconf/users/27462?format=json", "institution": null}, {"id": 27463, "fullname": "Zongwei Zhou", "url": "http://mlsys.org/api/miniconf/users/27463?format=json", "institution": null}, {"id": 11194, "fullname": "Naveen Kumar", "url": "http://mlsys.org/api/miniconf/users/11194?format=json", "institution": "Google"}, {"id": 27183, "fullname": "Phitchaya Phothilimthana", "url": "http://mlsys.org/api/miniconf/users/27183?format=json", "institution": "OpenAI"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3551", "url": null, "sourceid": 99, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=hB3nov3gIP", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 845, "modified": "2026-03-23T21:52:44.871029-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=hB3nov3gIP", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "51", "related_events": ["http://mlsys.org/api/miniconf/events/3774?format=json"], "related_events_ids": [3774]}, {"id": 3849, "uid": "43ec517d68b6edd3015b3edc9a11367b", "name": "BEAM: Joint Resource\u2013Power Optimization for Energy-Efficient LLM Inference under SLO contraints", "authors": [{"id": 27852, "fullname": "Hyunjae Lee", "url": "http://mlsys.org/api/miniconf/users/27852?format=json", "institution": "Korea Advanced Institute of Science and Technology"}, {"id": 27853, "fullname": "Sangjin Choi", "url": "http://mlsys.org/api/miniconf/users/27853?format=json", "institution": "Korea Advanced Institute of Science &amp; Technology"}, {"id": 27854, "fullname": "Seungjae Lim", "url": "http://mlsys.org/api/miniconf/users/27854?format=json", "institution": "Korea Advanced Institute of Science &amp; Technology"}, {"id": 27855, "fullname": "Youngjin Kwon", "url": "http://mlsys.org/api/miniconf/users/27855?format=json", "institution": "Korea Advanced Institute of Science &amp; Technology"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3849", "url": "https://github.com/jlee335/BEAM-artifact", "sourceid": -81, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T08:30:00-07:00", "endtime": "2026-05-20T08:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3678?format=json", "parent_id": 3678, "eventmedia": [{"id": 1144, "modified": "2026-05-19T07:50:33.916352-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3849_mCVfQGX.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3626?format=json"], "related_events_ids": [3626]}, {"id": 3774, "uid": "ac627ab1ccbdb62ec96e702f07f6425b", "name": "CATWILD: Compiler Autotuning for TPU workloads in the Wild", "authors": [{"id": 28452, "fullname": "Ignacio Cano", "url": "http://mlsys.org/api/miniconf/users/28452?format=json", "institution": "Google"}, {"id": 11105, "fullname": "Yu Wang", "url": "http://mlsys.org/api/miniconf/users/11105?format=json", "institution": "Harvard University"}, {"id": 12264, "fullname": "Mike Burrows", "url": "http://mlsys.org/api/miniconf/users/12264?format=json", "institution": "Google Brain"}, {"id": 27433, "fullname": "Ziqiang Feng", "url": "http://mlsys.org/api/miniconf/users/27433?format=json", "institution": null}, {"id": 27434, "fullname": "Matheus Camargo", "url": "http://mlsys.org/api/miniconf/users/27434?format=json", "institution": "Google"}, {"id": 27436, "fullname": "Chao Wang", "url": "http://mlsys.org/api/miniconf/users/27436?format=json", "institution": ""}, {"id": 27437, "fullname": "David Liu", "url": "http://mlsys.org/api/miniconf/users/27437?format=json", "institution": "Google"}, {"id": 27438, "fullname": "Tengyu Sun", "url": "http://mlsys.org/api/miniconf/users/27438?format=json", "institution": "Google"}, {"id": 27435, "fullname": "Alexander Wertheim", "url": "http://mlsys.org/api/miniconf/users/27435?format=json", "institution": "Google"}, {"id": 27181, "fullname": "Arissa Wongpanich", "url": "http://mlsys.org/api/miniconf/users/27181?format=json", "institution": "Google"}, {"id": 27439, "fullname": "Christof Angermueller", "url": "http://mlsys.org/api/miniconf/users/27439?format=json", "institution": "Google"}, {"id": 27440, "fullname": "Hyojun Kim", "url": "http://mlsys.org/api/miniconf/users/27440?format=json", "institution": null}, {"id": 27441, "fullname": "Wenqi Cao", "url": "http://mlsys.org/api/miniconf/users/27441?format=json", "institution": null}, {"id": 27453, "fullname": "Aleksey Orekhov", "url": "http://mlsys.org/api/miniconf/users/27453?format=json", "institution": null}, {"id": 12263, "fullname": "Amit Sabne", "url": "http://mlsys.org/api/miniconf/users/12263?format=json", "institution": "Google"}, {"id": 27442, "fullname": "Emma Sevastian", "url": "http://mlsys.org/api/miniconf/users/27442?format=json", "institution": null}, {"id": 27446, "fullname": "Mehrdad Khani", "url": "http://mlsys.org/api/miniconf/users/27446?format=json", "institution": "Google"}, {"id": 27443, "fullname": "Karthik Murthy", "url": "http://mlsys.org/api/miniconf/users/27443?format=json", "institution": null}, {"id": 27444, "fullname": "Berkin Ilbeyi", "url": "http://mlsys.org/api/miniconf/users/27444?format=json", "institution": "Google"}, {"id": 28453, "fullname": "Subhankar Shah", "url": "http://mlsys.org/api/miniconf/users/28453?format=json", "institution": "Google"}, {"id": 27445, "fullname": "Ryan Lefever", "url": "http://mlsys.org/api/miniconf/users/27445?format=json", "institution": "Google"}, {"id": 28454, "fullname": "Arjun Khare", "url": "http://mlsys.org/api/miniconf/users/28454?format=json", "institution": "Google"}, {"id": 27448, "fullname": "Ankit Sinha", "url": "http://mlsys.org/api/miniconf/users/27448?format=json", "institution": "Google"}, {"id": 27449, "fullname": "Peter Ma", "url": "http://mlsys.org/api/miniconf/users/27449?format=json", "institution": null}, {"id": 27450, "fullname": "Matt Bierbaum", "url": "http://mlsys.org/api/miniconf/users/27450?format=json", "institution": null}, {"id": 27451, "fullname": "Jeremiah Wilke", "url": "http://mlsys.org/api/miniconf/users/27451?format=json", "institution": null}, {"id": 27456, "fullname": "Emily Donahue", "url": "http://mlsys.org/api/miniconf/users/27456?format=json", "institution": "Cornell University"}, {"id": 27457, "fullname": "Sami Abu-El-Haija", "url": "http://mlsys.org/api/miniconf/users/27457?format=json", "institution": "Research, Google"}, {"id": 27452, "fullname": "Nikhil Sarda", "url": "http://mlsys.org/api/miniconf/users/27452?format=json", "institution": "Research, Google"}, {"id": 27146, "fullname": "Vineetha Govindaraj", "url": "http://mlsys.org/api/miniconf/users/27146?format=json", "institution": "Deepmind"}, {"id": 27459, "fullname": "Shobha Vasudevan", "url": "http://mlsys.org/api/miniconf/users/27459?format=json", "institution": null}, {"id": 27455, "fullname": "Kirill Gugaev", "url": "http://mlsys.org/api/miniconf/users/27455?format=json", "institution": null}, {"id": 27460, "fullname": "Idan Nachman", "url": "http://mlsys.org/api/miniconf/users/27460?format=json", "institution": null}, {"id": 27454, "fullname": "Jie Sun", "url": "http://mlsys.org/api/miniconf/users/27454?format=json", "institution": null}, {"id": 27182, "fullname": "Jose Baiocchi Paredes", "url": "http://mlsys.org/api/miniconf/users/27182?format=json", "institution": "Google"}, {"id": 27461, "fullname": "Samrat Ghosh", "url": "http://mlsys.org/api/miniconf/users/27461?format=json", "institution": null}, {"id": 27462, "fullname": "Domagoj Babic", "url": "http://mlsys.org/api/miniconf/users/27462?format=json", "institution": null}, {"id": 27463, "fullname": "Zongwei Zhou", "url": "http://mlsys.org/api/miniconf/users/27463?format=json", "institution": null}, {"id": 11194, "fullname": "Naveen Kumar", "url": "http://mlsys.org/api/miniconf/users/11194?format=json", "institution": "Google"}, {"id": 27183, "fullname": "Phitchaya Phothilimthana", "url": "http://mlsys.org/api/miniconf/users/27183?format=json", "institution": "OpenAI"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Compilers/HW", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3774", "url": null, "sourceid": -99, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-22T09:00:00-07:00", "endtime": "2026-05-22T09:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3721?format=json", "parent_id": 3721, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3551?format=json"], "related_events_ids": [3551]}, {"id": 3635, "uid": "28dd2c7955ce926456240b2ff0100bde", "name": "AXLearn: Modular, Hardware-Agnostic Large Model Training", "authors": [{"id": 27168, "fullname": "Mark Lee", "url": "http://mlsys.org/api/miniconf/users/27168?format=json", "institution": "Meta"}, {"id": 25935, "fullname": "Chang Lan", "url": "http://mlsys.org/api/miniconf/users/25935?format=json", "institution": ""}, {"id": 27918, "fullname": "Tom Gunter", "url": "http://mlsys.org/api/miniconf/users/27918?format=json", "institution": "Apple"}, {"id": 28476, "fullname": "John Peebles", "url": "http://mlsys.org/api/miniconf/users/28476?format=json", "institution": "Apple"}, {"id": 28477, "fullname": "Hanzhi Zhou", "url": "http://mlsys.org/api/miniconf/users/28477?format=json", "institution": "OpenAI"}, {"id": 27921, "fullname": "Xuan Zou", "url": "http://mlsys.org/api/miniconf/users/27921?format=json", "institution": null}, {"id": 27922, "fullname": "Sneha Bangalore", "url": "http://mlsys.org/api/miniconf/users/27922?format=json", "institution": ""}, {"id": 27923, "fullname": "Chung-Cheng Chiu", "url": "http://mlsys.org/api/miniconf/users/27923?format=json", "institution": null}, {"id": 27924, "fullname": "Nan Du", "url": "http://mlsys.org/api/miniconf/users/27924?format=json", "institution": null}, {"id": 27925, "fullname": "Xianzhi Du", "url": "http://mlsys.org/api/miniconf/users/27925?format=json", "institution": "Apple"}, {"id": 27926, "fullname": "Philipp Dufter", "url": "http://mlsys.org/api/miniconf/users/27926?format=json", "institution": "Apple"}, {"id": 27927, "fullname": "Liang He", "url": "http://mlsys.org/api/miniconf/users/27927?format=json", "institution": null}, {"id": 27928, "fullname": "Ruixuan Hou", "url": "http://mlsys.org/api/miniconf/users/27928?format=json", "institution": "Apple Inc"}, {"id": 27929, "fullname": "Haoshuo Huang", "url": "http://mlsys.org/api/miniconf/users/27929?format=json", "institution": "Apple"}, {"id": 27930, "fullname": "Dongseong Hwang", "url": "http://mlsys.org/api/miniconf/users/27930?format=json", "institution": null}, {"id": 27931, "fullname": "Xiang Kong", "url": "http://mlsys.org/api/miniconf/users/27931?format=json", "institution": "Apple"}, {"id": 27932, "fullname": "Jinhao Lei", "url": "http://mlsys.org/api/miniconf/users/27932?format=json", "institution": ", Columbia University"}, {"id": 27933, "fullname": "Tao Lei", "url": "http://mlsys.org/api/miniconf/users/27933?format=json", "institution": "Apple"}, {"id": 27934, "fullname": "Meng Li", "url": "http://mlsys.org/api/miniconf/users/27934?format=json", "institution": "Apple"}, {"id": 15067, "fullname": "Li Li", "url": "http://mlsys.org/api/miniconf/users/15067?format=json", "institution": "Apple"}, {"id": 27935, "fullname": "Jiarui Lu", "url": "http://mlsys.org/api/miniconf/users/27935?format=json", "institution": "Apple"}, {"id": 27936, "fullname": "Zhiyun Lu", "url": "http://mlsys.org/api/miniconf/users/27936?format=json", "institution": "Apple"}, {"id": 27937, "fullname": "Yiping Ma", "url": "http://mlsys.org/api/miniconf/users/27937?format=json", "institution": null}, {"id": 27938, "fullname": "David Qiu", "url": "http://mlsys.org/api/miniconf/users/27938?format=json", "institution": null}, {"id": 27939, "fullname": "Vivek Rathod", "url": "http://mlsys.org/api/miniconf/users/27939?format=json", "institution": null}, {"id": 27940, "fullname": "Senyu Tong", "url": "http://mlsys.org/api/miniconf/users/27940?format=json", "institution": null}, {"id": 27941, "fullname": "Zhucheng Tu", "url": "http://mlsys.org/api/miniconf/users/27941?format=json", "institution": "Apple"}, {"id": 27942, "fullname": "Chong Wang", "url": "http://mlsys.org/api/miniconf/users/27942?format=json", "institution": "Meta"}, {"id": 27943, "fullname": "Jianyu Wang", "url": "http://mlsys.org/api/miniconf/users/27943?format=json", "institution": "Apple"}, {"id": 27944, "fullname": "Yongqiang Wang", "url": "http://mlsys.org/api/miniconf/users/27944?format=json", "institution": null}, {"id": 27945, "fullname": "Zirui Wang", "url": "http://mlsys.org/api/miniconf/users/27945?format=json", "institution": "Google Deepmind"}, {"id": 27946, "fullname": "Floris Weers", "url": "http://mlsys.org/api/miniconf/users/27946?format=json", "institution": null}, {"id": 27947, "fullname": "Sam Wiseman", "url": "http://mlsys.org/api/miniconf/users/27947?format=json", "institution": "Apple"}, {"id": 27948, "fullname": "Guoli Yin", "url": "http://mlsys.org/api/miniconf/users/27948?format=json", "institution": "Apple"}, {"id": 27949, "fullname": "Bowen Zhang", "url": "http://mlsys.org/api/miniconf/users/27949?format=json", "institution": null}, {"id": 12530, "fullname": "Xiyou Zhou", "url": "http://mlsys.org/api/miniconf/users/12530?format=json", "institution": "Apple"}, {"id": 17608, "fullname": "Danyang Zhuo", "url": "http://mlsys.org/api/miniconf/users/17608?format=json", "institution": "Duke University"}, {"id": 27950, "fullname": "Cheng Leong", "url": "http://mlsys.org/api/miniconf/users/27950?format=json", "institution": null}, {"id": 27951, "fullname": "Ruoming Pang", "url": "http://mlsys.org/api/miniconf/users/27951?format=json", "institution": "OpenAI"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3635", "url": "https://github.com/apple/axlearn", "sourceid": 77, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=41x11EB3bc", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 929, "modified": "2026-03-23T21:52:48.241206-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=41x11EB3bc", "resourcetype": "UriEventmedia"}, {"id": 1116, "modified": "2026-05-15T15:55:49.475974-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3635.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "26", "related_events": ["http://mlsys.org/api/miniconf/events/3858?format=json"], "related_events_ids": [3858]}, {"id": 3818, "uid": "6512bd43d9caa6e02c990b0a82652dca", "name": "Once-for-All Channel Mixers (HyperTinyPW): Generative Compression for TinyML", "authors": [{"id": 25666, "fullname": "Yassien Shaalan", "url": "http://mlsys.org/api/miniconf/users/25666?format=json", "institution": "Independent"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Model Compression", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3818", "url": "https://github.com/yassienshaalan/tinyml-gen", "sourceid": -11, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T17:30:00-07:00", "endtime": "2026-05-20T17:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3696?format=json", "parent_id": 3696, "eventmedia": [{"id": 956, "modified": "2026-05-19T07:38:18.761090-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3818_UaGcJ0C.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3595?format=json"], "related_events_ids": [3595]}, {"id": 3740, "uid": "6ea9ab1baa0efb9e19094440c317e21b", "name": "ProfInfer: An eBPF-based Fine-Grained LLM Inference Profiler", "authors": [{"id": 26249, "fullname": "Bohua Zou", "url": "http://mlsys.org/api/miniconf/users/26249?format=json", "institution": "Technical University of Munich"}, {"id": 27201, "fullname": "Debayan Roy", "url": "http://mlsys.org/api/miniconf/users/27201?format=json", "institution": null}, {"id": 27202, "fullname": "Dhimankumar Airao", "url": "http://mlsys.org/api/miniconf/users/27202?format=json", "institution": null}, {"id": 27203, "fullname": "Weihao Xu", "url": "http://mlsys.org/api/miniconf/users/27203?format=json", "institution": "TUM"}, {"id": 25570, "fullname": "Binqi Sun", "url": "http://mlsys.org/api/miniconf/users/25570?format=json", "institution": "Technical University of Munich"}, {"id": 27204, "fullname": "Yutao Liu", "url": "http://mlsys.org/api/miniconf/users/27204?format=json", "institution": null}, {"id": 27205, "fullname": "Haibo Chen", "url": "http://mlsys.org/api/miniconf/users/27205?format=json", "institution": null}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Benchmarks and Evaluation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3740", "url": "https://gitcode.com/openharmony-robot/oh-llama.cpp/tree/main/profinfer", "sourceid": -29, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T17:30:00-07:00", "endtime": "2026-05-21T17:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3717?format=json", "parent_id": 3717, "eventmedia": [{"id": 1042, "modified": "2026-05-21T08:19:32.754581-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3740_fDdgYfm.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3517?format=json"], "related_events_ids": [3517]}, {"id": 3513, "uid": "1c383cd30b7c298ab50293adfecb7b18", "name": "GhostServe: A Lightweight Checkpointing System in the Shadow for Fault-Tolerant LLM Serving", "authors": [{"id": 25189, "fullname": "Shakya Jayakody", "url": "http://mlsys.org/api/miniconf/users/25189?format=json", "institution": "University of Central Florida"}, {"id": 17878, "fullname": "Youpeng Zhao", "url": "http://mlsys.org/api/miniconf/users/17878?format=json", "institution": "University of Central Florida"}, {"id": 27193, "fullname": "Chinmay Dhanraj Nehate", "url": "http://mlsys.org/api/miniconf/users/27193?format=json", "institution": "University of Central Florida"}, {"id": 26288, "fullname": "Jun Wang", "url": "http://mlsys.org/api/miniconf/users/26288?format=json", "institution": "University of Central Florida"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3513", "url": null, "sourceid": 35, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=xKjYiUgeOK", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 807, "modified": "2026-03-23T21:52:43.414974-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=xKjYiUgeOK", "resourcetype": "UriEventmedia"}, {"id": 990, "file": "/media/PosterPDFs/MLSys%202026/3513.png", "modified": "2026-05-15T07:05:30.806277-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 991, "file": "/media/PosterPDFs/MLSys%202026/3513-thumb.png", "modified": "2026-05-17T07:31:33.140051-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "34", "related_events": ["http://mlsys.org/api/miniconf/events/3736?format=json"], "related_events_ids": [3736]}, {"id": 3788, "uid": "44f683a84163b3523afe57c2e008bc8c", "name": "Locality-Aware Beam Scheduling for Efficient Test-Time Compute with a Consumer-grade GPU", "authors": [{"id": 25535, "fullname": "Hsing-Ti Wang", "url": "http://mlsys.org/api/miniconf/users/25535?format=json", "institution": "NTU ECLab"}, {"id": 26242, "fullname": "Hung-Tso Shiao", "url": "http://mlsys.org/api/miniconf/users/26242?format=json", "institution": "National Taiwan University"}, {"id": 27580, "fullname": "Chia-Lin Yang", "url": "http://mlsys.org/api/miniconf/users/27580?format=json", "institution": "Department of computer science and informational engineering, National Taiwan University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3788", "url": null, "sourceid": -62, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T09:15:00-07:00", "endtime": "2026-05-20T09:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3678?format=json", "parent_id": 3678, "eventmedia": [{"id": 1136, "modified": "2026-05-16T02:42:53.915094-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3788_AVkP8ig.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3565?format=json"], "related_events_ids": [3565]}, {"id": 3630, "uid": "c0c7c76d30bd3dcaefc96f40275bdc0a", "name": "ADR: AN AGENTIC DETECTION SYSTEMFORENTERPRISE AGENTIC AI SECURITY", "authors": [{"id": 27880, "fullname": "Chenning Li", "url": "http://mlsys.org/api/miniconf/users/27880?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 17735, "fullname": "Pan Hu", "url": "http://mlsys.org/api/miniconf/users/17735?format=json", "institution": "Uber"}, {"id": 28472, "fullname": "Justin Xu", "url": "http://mlsys.org/api/miniconf/users/28472?format=json", "institution": "University of Oxford"}, {"id": 27882, "fullname": "Baris Ozbas", "url": "http://mlsys.org/api/miniconf/users/27882?format=json", "institution": "Uber"}, {"id": 27883, "fullname": "Olivia Liu", "url": "http://mlsys.org/api/miniconf/users/27883?format=json", "institution": ""}, {"id": 25578, "fullname": "Caroline Van", "url": "http://mlsys.org/api/miniconf/users/25578?format=json", "institution": "Uber Technologies"}, {"id": 27884, "fullname": "Manxue Li", "url": "http://mlsys.org/api/miniconf/users/27884?format=json", "institution": null}, {"id": 27885, "fullname": "Wei Zhou", "url": "http://mlsys.org/api/miniconf/users/27885?format=json", "institution": "Uber"}, {"id": 12450, "fullname": "Mohammad Alizadeh", "url": "http://mlsys.org/api/miniconf/users/12450?format=json", "institution": "MIT CSAIL"}, {"id": 27886, "fullname": "Pengyu Zhang", "url": "http://mlsys.org/api/miniconf/users/27886?format=json", "institution": "Uber"}, {"id": 28966, "fullname": "KK Sriramadhesikan", "url": "http://mlsys.org/api/miniconf/users/28966?format=json", "institution": null}, {"id": 28967, "fullname": "Ming Zhang", "url": "http://mlsys.org/api/miniconf/users/28967?format=json", "institution": null}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3630", "url": null, "sourceid": 50, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=7B91Naeszw", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 924, "modified": "2026-03-23T21:52:48.031481-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=7B91Naeszw", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "1", "related_events": ["http://mlsys.org/api/miniconf/events/3853?format=json"], "related_events_ids": [3853]}, {"id": 3553, "uid": "069059b7ef840f0c74a814ec9237b6ec", "name": "FlexTrain: Scalable Hybrid-Parallel Training with Elastic Resource Utilization and Consistent Accuracy", "authors": [{"id": 25944, "fullname": "Weilin Cai", "url": "http://mlsys.org/api/miniconf/users/25944?format=json", "institution": "The Hong Kong University of Science and Technology (Guangzhou)"}, {"id": 27470, "fullname": "Diandian Gu", "url": "http://mlsys.org/api/miniconf/users/27470?format=json", "institution": "Bytedance Seed"}, {"id": 28455, "fullname": "Baoquan Zhong", "url": "http://mlsys.org/api/miniconf/users/28455?format=json", "institution": "Zhejiang University"}, {"id": 27471, "fullname": "Jun Wang", "url": "http://mlsys.org/api/miniconf/users/27471?format=json", "institution": "ByteDance Inc."}, {"id": 28456, "fullname": "Zhuolin Zheng", "url": "http://mlsys.org/api/miniconf/users/28456?format=json", "institution": "ByteDance Inc."}, {"id": 28457, "fullname": "Gaohong Liu", "url": "http://mlsys.org/api/miniconf/users/28457?format=json", "institution": "ByteDance Inc."}, {"id": 28458, "fullname": "Jiang Kaihua", "url": "http://mlsys.org/api/miniconf/users/28458?format=json", "institution": "University of Chinese Academy of Sciences"}, {"id": 28459, "fullname": "Shuguang Wang", "url": "http://mlsys.org/api/miniconf/users/28459?format=json", "institution": "Huazhong University of Science and Technology"}, {"id": 27472, "fullname": "Wencong Xiao", "url": "http://mlsys.org/api/miniconf/users/27472?format=json", "institution": null}, {"id": 19049, "fullname": "Jiayi Huang", "url": "http://mlsys.org/api/miniconf/users/19049?format=json", "institution": "HKUST(GZ)"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3553", "url": null, "sourceid": 126, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=h2yhNcbwSL", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 847, "modified": "2026-03-23T21:52:44.957563-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=h2yhNcbwSL", "resourcetype": "UriEventmedia"}, {"id": 973, "file": "/media/PosterPDFs/MLSys%202026/3553.png", "modified": "2026-05-07T21:14:28.850417-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 974, "file": "/media/PosterPDFs/MLSys%202026/3553-thumb.png", "modified": "2026-05-07T21:14:28.943499-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "33", "related_events": ["http://mlsys.org/api/miniconf/events/3776?format=json"], "related_events_ids": [3776]}, {"id": 3755, "uid": "14bfa6bb14875e45bba028a21ed38046", "name": "SpecDiff-2: Scaling Diffusion Drafter Alignment For Faster Speculative Decoding", "authors": [{"id": 27322, "fullname": "Jameson Sandler", "url": "http://mlsys.org/api/miniconf/users/27322?format=json", "institution": "University of Virginia"}, {"id": 27323, "fullname": "Jacob K Christopher", "url": "http://mlsys.org/api/miniconf/users/27323?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27324, "fullname": "Tom Hartvigsen", "url": "http://mlsys.org/api/miniconf/users/27324?format=json", "institution": null}, {"id": 27325, "fullname": "Ferdinando Fioretto", "url": "http://mlsys.org/api/miniconf/users/27325?format=json", "institution": "University of Virginia"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 5", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3755", "url": null, "sourceid": -69, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T09:15:00-07:00", "endtime": "2026-05-21T09:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3701?format=json", "parent_id": 3701, "eventmedia": [{"id": 1244, "modified": "2026-05-21T08:23:01.921110-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3755.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3532?format=json"], "related_events_ids": [3532]}, {"id": 3636, "uid": "26657d5ff9020d2abefe558796b99584", "name": "Zorse: Optimizing LLM Training Efficiency on Heterogeneous GPU Clusters", "authors": [{"id": 14867, "fullname": "Runsheng Guo", "url": "http://mlsys.org/api/miniconf/users/14867?format=json", "institution": "OpenAI"}, {"id": 27952, "fullname": "Utkarsh Anand", "url": "http://mlsys.org/api/miniconf/users/27952?format=json", "institution": "University of Waterloo"}, {"id": 14868, "fullname": "Khuzaima Daudjee", "url": "http://mlsys.org/api/miniconf/users/14868?format=json", "institution": "University of Waterloo"}, {"id": 27953, "fullname": "Rathijit Sen", "url": "http://mlsys.org/api/miniconf/users/27953?format=json", "institution": "Microsoft"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3636", "url": null, "sourceid": 96, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=40leuGH3iO", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 930, "modified": "2026-03-23T21:52:48.292004-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=40leuGH3iO", "resourcetype": "UriEventmedia"}, {"id": 1027, "file": "/media/PosterPDFs/MLSys%202026/3636.png", "modified": "2026-05-14T02:20:11.668923-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1028, "file": "/media/PosterPDFs/MLSys%202026/3636-thumb.png", "modified": "2026-05-14T02:20:11.756101-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "37", "related_events": ["http://mlsys.org/api/miniconf/events/3859?format=json"], "related_events_ids": [3859]}, {"id": 3784, "uid": "32bb90e8976aab5298d5da10fe66f21d", "name": "Breaking the Ice: Analyzing Cold Start Latency in vLLM", "authors": [{"id": 25925, "fullname": "Huzaifa Shaaban Kabakibo", "url": "http://mlsys.org/api/miniconf/users/25925?format=json", "institution": "Paderborn University"}, {"id": 27154, "fullname": "Animesh Trivedi", "url": "http://mlsys.org/api/miniconf/users/27154?format=json", "institution": "International Business Machines"}, {"id": 27565, "fullname": "Lin Wang", "url": "http://mlsys.org/api/miniconf/users/27565?format=json", "institution": "Paderborn University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3784", "url": "https://github.com/upb-cn/vllm-startup-profiler", "sourceid": -72, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T09:30:00-07:00", "endtime": "2026-05-20T09:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3678?format=json", "parent_id": 3678, "eventmedia": [{"id": 1223, "modified": "2026-05-19T09:35:47.364159-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3784.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3561?format=json"], "related_events_ids": [3561]}, {"id": 3733, "uid": "6f4922f45568161a8cdf4ad2299f6d23", "name": "Accelerating Large-Scale Reasoning Model Inference with Sparse Self-Speculative Decoding", "authors": [{"id": 20906, "fullname": "Yilong Zhao", "url": "http://mlsys.org/api/miniconf/users/20906?format=json", "institution": "University of California, Berkeley"}, {"id": 21005, "fullname": "Jiaming Tang", "url": "http://mlsys.org/api/miniconf/users/21005?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 17683, "fullname": "Kan Zhu", "url": "http://mlsys.org/api/miniconf/users/17683?format=json", "institution": "University of Washington"}, {"id": 12026, "fullname": "Zihao Ye", "url": "http://mlsys.org/api/miniconf/users/12026?format=json", "institution": "NVIDIA"}, {"id": 27178, "fullname": "Chi-Chih Chang", "url": "http://mlsys.org/api/miniconf/users/27178?format=json", "institution": "Cornell University"}, {"id": 27179, "fullname": "Chaofan Lin", "url": "http://mlsys.org/api/miniconf/users/27179?format=json", "institution": "Tsinghua University"}, {"id": 27180, "fullname": "Jongseok Park", "url": "http://mlsys.org/api/miniconf/users/27180?format=json", "institution": "University of California, Berkeley"}, {"id": 17675, "fullname": "Guangxuan Xiao", "url": "http://mlsys.org/api/miniconf/users/17675?format=json", "institution": "MIT"}, {"id": 17625, "fullname": "Mohamed Abdelfattah", "url": "http://mlsys.org/api/miniconf/users/17625?format=json", "institution": "Cornell University"}, {"id": 11143, "fullname": "Mingyu Gao", "url": "http://mlsys.org/api/miniconf/users/11143?format=json", "institution": "Tsinghua University"}, {"id": 17670, "fullname": "Baris Kasikci", "url": "http://mlsys.org/api/miniconf/users/17670?format=json", "institution": "University of Washington"}, {"id": 12133, "fullname": "Song Han", "url": "http://mlsys.org/api/miniconf/users/12133?format=json", "institution": "MIT"}, {"id": 11118, "fullname": "Ion Stoica", "url": "http://mlsys.org/api/miniconf/users/11118?format=json", "institution": "UC Berkeley"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 5", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3733", "url": null, "sourceid": -18, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T09:30:00-07:00", "endtime": "2026-05-21T09:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3701?format=json", "parent_id": 3701, "eventmedia": [{"id": 1127, "modified": "2026-05-21T08:30:19.793622-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3733_usZ8H1U.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3510?format=json"], "related_events_ids": [3510]}, {"id": 3779, "uid": "c9e1074f5b3f9fc8ea15d152add07294", "name": "Attribution-based Sparse Activation in Large Language Models", "authors": [{"id": 27495, "fullname": "Jifeng Song", "url": "http://mlsys.org/api/miniconf/users/27495?format=json", "institution": "University of Pittsburgh"}, {"id": 27496, "fullname": "Xiangyu Yin", "url": "http://mlsys.org/api/miniconf/users/27496?format=json", "institution": "University of Pittsburgh"}, {"id": 27497, "fullname": "Boyuan Yang", "url": "http://mlsys.org/api/miniconf/users/27497?format=json", "institution": "University of Pittsburgh"}, {"id": 27498, "fullname": "Kai Huang", "url": "http://mlsys.org/api/miniconf/users/27498?format=json", "institution": "University of Pittsburgh"}, {"id": 27499, "fullname": "Weichen Liu", "url": "http://mlsys.org/api/miniconf/users/27499?format=json", "institution": "University of Pittsburgh"}, {"id": 27500, "fullname": "Wei Gao", "url": "http://mlsys.org/api/miniconf/users/27500?format=json", "institution": "University of Pittsburgh"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Efficient Computation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3779", "url": null, "sourceid": -104, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-22T08:30:00-07:00", "endtime": "2026-05-22T08:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3722?format=json", "parent_id": 3722, "eventmedia": [{"id": 1107, "modified": "2026-05-21T09:16:00.928281-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3779_uKmthRH.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3556?format=json"], "related_events_ids": [3556]}, {"id": 3597, "uid": "98dce83da57b0395e163467c9dae521b", "name": "Shannonic: Efficient Entropy-Optimal Compression for ML Workloads", "authors": [{"id": 17719, "fullname": "Kareem Ibrahim", "url": "http://mlsys.org/api/miniconf/users/17719?format=json", "institution": "University of Toronto"}, {"id": 28467, "fullname": "Mohammadjavad Maheronnaghsh", "url": "http://mlsys.org/api/miniconf/users/28467?format=json", "institution": "University of Toronto"}, {"id": 17666, "fullname": "Andreas Moshovos", "url": "http://mlsys.org/api/miniconf/users/17666?format=json", "institution": "University of Toronto"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3597", "url": null, "sourceid": 93, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=NhMxI0GbB8", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 891, "modified": "2026-03-23T21:52:46.716165-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=NhMxI0GbB8", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "40", "related_events": ["http://mlsys.org/api/miniconf/events/3820?format=json"], "related_events_ids": [3820]}, {"id": 3544, "uid": "37693cfc748049e45d87b8c7d8b9aacd", "name": "NEST: Network- and Memory-Aware Device Placement for Distributed Deep Learning", "authors": [{"id": 26264, "fullname": "Irene Wang", "url": "http://mlsys.org/api/miniconf/users/26264?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27364, "fullname": "Vishnu Venkata", "url": "http://mlsys.org/api/miniconf/users/27364?format=json", "institution": null}, {"id": 11122, "fullname": "Arvind Krishnamurthy", "url": "http://mlsys.org/api/miniconf/users/11122?format=json", "institution": "University of Washington"}, {"id": 27358, "fullname": "Divya Mahajan", "url": "http://mlsys.org/api/miniconf/users/27358?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3544", "url": "https://github.com/scai-tech/Nest", "sourceid": 23, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=jpIoO2zSKA", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 838, "modified": "2026-03-23T21:52:44.568592-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=jpIoO2zSKA", "resourcetype": "UriEventmedia"}, {"id": 1084, "file": "/media/PosterPDFs/MLSys%202026/3544.png", "modified": "2026-05-15T09:21:16.699503-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1065, "modified": "2026-05-14T22:35:39.219776-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3544.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "10", "related_events": ["http://mlsys.org/api/miniconf/events/3767?format=json"], "related_events_ids": [3767]}, {"id": 3595, "uid": "6512bd43d9caa6e02c990b0a82652dca", "name": "Once-for-All Channel Mixers (HyperTinyPW): Generative Compression for TinyML", "authors": [{"id": 25666, "fullname": "Yassien Shaalan", "url": "http://mlsys.org/api/miniconf/users/25666?format=json", "institution": "Independent"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3595", "url": "https://github.com/yassienshaalan/tinyml-gen", "sourceid": 11, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=NrDa5Fu10D", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 889, "modified": "2026-03-23T21:52:46.652716-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=NrDa5Fu10D", "resourcetype": "UriEventmedia"}, {"id": 944, "file": "/media/PosterPDFs/MLSys%202026/3595.png", "modified": "2026-04-22T00:20:47.426113-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 945, "file": "/media/PosterPDFs/MLSys%202026/3595-thumb.png", "modified": "2026-04-22T00:20:47.497900-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "42", "related_events": ["http://mlsys.org/api/miniconf/events/3818?format=json"], "related_events_ids": [3818]}, {"id": 3582, "uid": "2723d092b63885e0d7c260cc007e8b9d", "name": "MixLLM: LLM Quantization with Global Mixed-precision between Output-features and Highly-efficient System Design", "authors": [{"id": 28440, "fullname": "Zhen Zheng", "url": "http://mlsys.org/api/miniconf/users/28440?format=json", "institution": "ByteDance Inc."}, {"id": 27641, "fullname": "Xiaonan Song", "url": "http://mlsys.org/api/miniconf/users/27641?format=json", "institution": "Microsoft"}, {"id": 27642, "fullname": "Chuanjie Liu", "url": "http://mlsys.org/api/miniconf/users/27642?format=json", "institution": "Microsoft"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3582", "url": null, "sourceid": 109, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=VBbMRQ4VOc", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 876, "modified": "2026-03-23T21:52:46.162606-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=VBbMRQ4VOc", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "43", "related_events": ["http://mlsys.org/api/miniconf/events/3805?format=json"], "related_events_ids": [3805]}, {"id": 3845, "uid": "3295c76acbf4caaed33c36b1b5fc2cb1", "name": "ParallelKittens: Systematic and Practical Simplification of Multi-GPU AI Kernels", "authors": [{"id": 27842, "fullname": "Stuart H. Sul", "url": "http://mlsys.org/api/miniconf/users/27842?format=json", "institution": "Stanford University"}, {"id": 27192, "fullname": "Simran Arora", "url": "http://mlsys.org/api/miniconf/users/27192?format=json", "institution": "Computer Science Department, Stanford University"}, {"id": 27843, "fullname": "Benjamin Spector", "url": "http://mlsys.org/api/miniconf/users/27843?format=json", "institution": "Stanford University"}, {"id": 11444, "fullname": "Christopher R\u00e9", "url": "http://mlsys.org/api/miniconf/users/11444?format=json", "institution": "Stanford University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Compilers and Kernels", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3845", "url": "https://github.com/HazyResearch/ThunderKittens", "sourceid": -66, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T16:30:00-07:00", "endtime": "2026-05-21T16:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3718?format=json", "parent_id": 3718, "eventmedia": [{"id": 1245, "modified": "2026-05-21T11:07:17.202151-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3845.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3622?format=json"], "related_events_ids": [3622]}, {"id": 3547, "uid": "3ef815416f775098fe977004015c6193", "name": "Search Your Block Floating Point Scales!", "authors": [{"id": 27410, "fullname": "Tanmaey Gupta", "url": "http://mlsys.org/api/miniconf/users/27410?format=json", "institution": "Cornell University"}, {"id": 27411, "fullname": "Hayden Prairie", "url": "http://mlsys.org/api/miniconf/users/27411?format=json", "institution": "University of California, San Diego                    Together AI"}, {"id": 23865, "fullname": "Xiaoxia Wu", "url": "http://mlsys.org/api/miniconf/users/23865?format=json", "institution": "TogtherAI"}, {"id": 27412, "fullname": "Reyna Abhyankar", "url": "http://mlsys.org/api/miniconf/users/27412?format=json", "institution": "Together AI"}, {"id": 25635, "fullname": "Qingyang Wu", "url": "http://mlsys.org/api/miniconf/users/25635?format=json", "institution": "Together AI"}, {"id": 24490, "fullname": "Austin Silveria", "url": "http://mlsys.org/api/miniconf/users/24490?format=json", "institution": "University of California, San Diego"}, {"id": 27413, "fullname": "Pragaash Ponnusamy", "url": "http://mlsys.org/api/miniconf/users/27413?format=json", "institution": "Together AI"}, {"id": 27251, "fullname": "Jue Wang", "url": "http://mlsys.org/api/miniconf/users/27251?format=json", "institution": "Together AI"}, {"id": 18231, "fullname": "Ben Athiwaratkun", "url": "http://mlsys.org/api/miniconf/users/18231?format=json", "institution": null}, {"id": 14753, "fullname": "Shuaiwen Song", "url": "http://mlsys.org/api/miniconf/users/14753?format=json", "institution": "University of Sydney"}, {"id": 27414, "fullname": "Tri Dao", "url": "http://mlsys.org/api/miniconf/users/27414?format=json", "institution": "Princeton, TogetherAI"}, {"id": 27189, "fullname": "Daniel Fu", "url": "http://mlsys.org/api/miniconf/users/27189?format=json", "institution": "University of California, San Diego"}, {"id": 11289, "fullname": "Christopher De Sa", "url": "http://mlsys.org/api/miniconf/users/11289?format=json", "institution": "Cornell University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3547", "url": null, "sourceid": 85, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=innqECyZPK", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 841, "modified": "2026-03-23T21:52:44.701711-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=innqECyZPK", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "46", "related_events": ["http://mlsys.org/api/miniconf/events/3770?format=json"], "related_events_ids": [3770]}, {"id": 3566, "uid": "65ded5353c5ee48d0b7d48c591b8f430", "name": "PRISM: Parametrically Refactor Inference for Speculative Decoding Draft Models", "authors": [{"id": 28462, "fullname": "Xuliang Wang", "url": "http://mlsys.org/api/miniconf/users/28462?format=json", "institution": "University of Waterloo"}, {"id": 27581, "fullname": "Yuetao Chen", "url": "http://mlsys.org/api/miniconf/users/27581?format=json", "institution": "The Chinese University of Hong Kong"}, {"id": 27582, "fullname": "Maochan Zhen", "url": "http://mlsys.org/api/miniconf/users/27582?format=json", "institution": "Central China Institute of Artificial Intelligence"}, {"id": 27583, "fullname": "Fang LIU", "url": "http://mlsys.org/api/miniconf/users/27583?format=json", "institution": "CIAI"}, {"id": 27584, "fullname": "Xinzhou Zheng", "url": "http://mlsys.org/api/miniconf/users/27584?format=json", "institution": "University of Science and Technology of China"}, {"id": 27585, "fullname": "Xingwu Liu", "url": "http://mlsys.org/api/miniconf/users/27585?format=json", "institution": "Dalian University of Technology"}, {"id": 27586, "fullname": "Hong Xu", "url": "http://mlsys.org/api/miniconf/users/27586?format=json", "institution": "The Chinese University of Hong Kong"}, {"id": 27587, "fullname": "Ming Li", "url": "http://mlsys.org/api/miniconf/users/27587?format=json", "institution": "University of Waterloo"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3566", "url": null, "sourceid": 132, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=cvU2HuuxEf", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 860, "modified": "2026-03-23T21:52:45.514870-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=cvU2HuuxEf", "resourcetype": "UriEventmedia"}, {"id": 1126, "file": "/media/PosterPDFs/MLSys%202026/3566-thumb.png", "modified": "2026-05-15T19:48:46.471142-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1125, "file": "/media/PosterPDFs/MLSys%202026/3566.png", "modified": "2026-05-15T19:48:46.378542-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "2", "related_events": ["http://mlsys.org/api/miniconf/events/3789?format=json"], "related_events_ids": [3789]}, {"id": 3620, "uid": "03afdbd66e7929b125f8597834fa83a4", "name": "PROMPTS: PeRformance Optimization via Multi-Agent Planning for LLM Training and Serving", "authors": [{"id": 27835, "fullname": "Yuran Ding", "url": "http://mlsys.org/api/miniconf/users/27835?format=json", "institution": "Google"}, {"id": 27836, "fullname": "Ruobing Han", "url": "http://mlsys.org/api/miniconf/users/27836?format=json", "institution": "Google DeepMind"}, {"id": 27837, "fullname": "Xiaofan Zhang", "url": "http://mlsys.org/api/miniconf/users/27837?format=json", "institution": "Google"}, {"id": 27838, "fullname": "Xinwei Chen", "url": "http://mlsys.org/api/miniconf/users/27838?format=json", "institution": "Waymo"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3620", "url": null, "sourceid": 63, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=FTOfgVHcZn", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 914, "modified": "2026-03-23T21:52:47.624044-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=FTOfgVHcZn", "resourcetype": "UriEventmedia"}, {"id": 1015, "file": "/media/PosterPDFs/MLSys%202026/3620.png", "modified": "2026-05-13T19:43:52.364003-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1016, "file": "/media/PosterPDFs/MLSys%202026/3620-thumb.png", "modified": "2026-05-13T19:56:20.931260-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "3", "related_events": ["http://mlsys.org/api/miniconf/events/3843?format=json"], "related_events_ids": [3843]}, {"id": 3562, "uid": "7cbbc409ec990f19c78c75bd1e06f215", "name": "CDLM: Consistency Diffusion Language Models for Faster Sampling", "authors": [{"id": 25522, "fullname": "Minseo Kim", "url": "http://mlsys.org/api/miniconf/users/25522?format=json", "institution": "Seoul National University"}, {"id": 24298, "fullname": "Chenfeng Xu", "url": "http://mlsys.org/api/miniconf/users/24298?format=json", "institution": "Together AI/UT Austin"}, {"id": 17672, "fullname": "Coleman Hooper", "url": "http://mlsys.org/api/miniconf/users/17672?format=json", "institution": "University of California, Berkeley"}, {"id": 27566, "fullname": "Harman Singh", "url": "http://mlsys.org/api/miniconf/users/27566?format=json", "institution": "University of California, Berkeley"}, {"id": 18231, "fullname": "Ben Athiwaratkun", "url": "http://mlsys.org/api/miniconf/users/18231?format=json", "institution": null}, {"id": 18868, "fullname": "Ce Zhang", "url": "http://mlsys.org/api/miniconf/users/18868?format=json", "institution": null}, {"id": 11240, "fullname": "Kurt Keutzer", "url": "http://mlsys.org/api/miniconf/users/11240?format=json", "institution": "EECS, UC Berkeley"}, {"id": 11237, "fullname": "Amir Gholami", "url": "http://mlsys.org/api/miniconf/users/11237?format=json", "institution": "UC Berkeley"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3562", "url": null, "sourceid": 70, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=eB8yjR6alL", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 856, "modified": "2026-03-23T21:52:45.337875-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=eB8yjR6alL", "resourcetype": "UriEventmedia"}, {"id": 982, "file": "/media/PosterPDFs/MLSys%202026/3562-thumb.png", "modified": "2026-05-10T09:49:27.348071-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 983, "file": "/media/PosterPDFs/MLSys%202026/3562.png", "modified": "2026-05-10T09:53:10.282746-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "4", "related_events": ["http://mlsys.org/api/miniconf/events/3785?format=json"], "related_events_ids": [3785]}, {"id": 3559, "uid": "f0935e4cd5920aa6c7c996a5ee53a70f", "name": "Speculative Decoding: Performance or Illusion?", "authors": [{"id": 28490, "fullname": "Xiaoxuan Liu", "url": "http://mlsys.org/api/miniconf/users/28490?format=json", "institution": "OpenAI"}, {"id": 25915, "fullname": "Jiaxiang Yu", "url": "http://mlsys.org/api/miniconf/users/25915?format=json", "institution": "UC Berkeley"}, {"id": 27180, "fullname": "Jongseok Park", "url": "http://mlsys.org/api/miniconf/users/27180?format=json", "institution": "University of California, Berkeley"}, {"id": 11118, "fullname": "Ion Stoica", "url": "http://mlsys.org/api/miniconf/users/11118?format=json", "institution": "UC Berkeley"}, {"id": 27557, "fullname": "Alvin Cheung", "url": "http://mlsys.org/api/miniconf/users/27557?format=json", "institution": "University of California, Berkeley"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3559", "url": null, "sourceid": 106, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=fzkqtezFEi", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 853, "modified": "2026-03-23T21:52:45.206502-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=fzkqtezFEi", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "6", "related_events": ["http://mlsys.org/api/miniconf/events/3782?format=json"], "related_events_ids": [3782]}, {"id": 3863, "uid": "d645920e395fedad7bbbed0eca3fe2e0", "name": "Hippocampus: An Efficient and Scalable Memory Module for Agentic AI", "authors": [{"id": 27978, "fullname": "Yi Li", "url": "http://mlsys.org/api/miniconf/users/27978?format=json", "institution": "University of Texas at Dallas"}, {"id": 12896, "fullname": "Lianjie Cao", "url": "http://mlsys.org/api/miniconf/users/12896?format=json", "institution": "HPE Labs"}, {"id": 15334, "fullname": "Faraz Ahmed", "url": "http://mlsys.org/api/miniconf/users/15334?format=json", "institution": "Hewlett Packard Labs"}, {"id": 14774, "fullname": "Puneet Sharma", "url": "http://mlsys.org/api/miniconf/users/14774?format=json", "institution": "HP Labs"}, {"id": 23337, "fullname": "Bingzhe Li", "url": "http://mlsys.org/api/miniconf/users/23337?format=json", "institution": "University of Texas at Dallas"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Agentic AI 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3863", "url": null, "sourceid": -40, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T14:45:00-07:00", "endtime": "2026-05-19T15:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3674?format=json", "parent_id": 3674, "eventmedia": [{"id": 1225, "modified": "2026-05-19T12:51:18.201572-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3863.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3640?format=json"], "related_events_ids": [3640]}, {"id": 3623, "uid": "1f0e3dad99908345f7439f8ffabdffc4", "name": "HELIOS : Adaptive Model And Early-Exit Selection for Efficient LLM Inference Serving", "authors": [{"id": 25962, "fullname": "Avinash Kumar", "url": "http://mlsys.org/api/miniconf/users/25962?format=json", "institution": "The University of Texas at Austin"}, {"id": 19188, "fullname": "Shashank Nag", "url": "http://mlsys.org/api/miniconf/users/19188?format=json", "institution": "The University of Texas at Austin"}, {"id": 27844, "fullname": "Jason Clemons", "url": "http://mlsys.org/api/miniconf/users/27844?format=json", "institution": "NVIDIA"}, {"id": 12633, "fullname": "LIZY JOHn", "url": "http://mlsys.org/api/miniconf/users/12633?format=json", "institution": "UT-Austin"}, {"id": 27845, "fullname": "Poulami Das", "url": "http://mlsys.org/api/miniconf/users/27845?format=json", "institution": "University of Texas at Austin"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3623", "url": null, "sourceid": 19, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=CV52m9NJFK", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 917, "modified": "2026-03-23T21:52:47.742568-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=CV52m9NJFK", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "11", "related_events": ["http://mlsys.org/api/miniconf/events/3846?format=json"], "related_events_ids": [3846]}, {"id": 3751, "uid": "67c6a1e7ce56d3d6fa748ab6d9af3fd7", "name": "TiDAR: Think in Diffusion, Talk in Autoregression", "authors": [{"id": 27286, "fullname": "Jingyu Liu", "url": "http://mlsys.org/api/miniconf/users/27286?format=json", "institution": "University of Chicago"}, {"id": 27287, "fullname": "Xin Dong", "url": "http://mlsys.org/api/miniconf/users/27287?format=json", "institution": "Seed"}, {"id": 27288, "fullname": "Zhifan Ye", "url": "http://mlsys.org/api/miniconf/users/27288?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27289, "fullname": "Rishabh Mehta", "url": "http://mlsys.org/api/miniconf/users/27289?format=json", "institution": null}, {"id": 27290, "fullname": "Yonggan Fu", "url": "http://mlsys.org/api/miniconf/users/27290?format=json", "institution": "NVIDIA"}, {"id": 27291, "fullname": "vartika singh", "url": "http://mlsys.org/api/miniconf/users/27291?format=json", "institution": "State University of New York, Buffalo"}, {"id": 18868, "fullname": "Ce Zhang", "url": "http://mlsys.org/api/miniconf/users/18868?format=json", "institution": null}, {"id": 27292, "fullname": "Pavlo Molchanov", "url": "http://mlsys.org/api/miniconf/users/27292?format=json", "institution": "NVIDIA Research"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Multimodal and Generative Models", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3751", "url": "https://tidarlm.github.io", "sourceid": -47, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T14:00:00-07:00", "endtime": "2026-05-19T14:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3669?format=json", "parent_id": 3669, "eventmedia": [{"id": 984, "modified": "2026-05-19T12:58:29.083310-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3751_1jPpJd3.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3528?format=json"], "related_events_ids": [3528]}, {"id": 3616, "uid": "65b9eea6e1cc6bb9f0cd2a47751a186f", "name": "REPARO: LOSS-RESILIENT GENERATIVE CODEC FOR VIDEO CONFERENCING", "authors": [{"id": 27821, "fullname": "Tianhong Li", "url": "http://mlsys.org/api/miniconf/users/27821?format=json", "institution": "Meta"}, {"id": 27822, "fullname": "Vibhaalakshmi Sivaraman", "url": "http://mlsys.org/api/miniconf/users/27822?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 27823, "fullname": "Pantea Karimi", "url": "http://mlsys.org/api/miniconf/users/27823?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 27824, "fullname": "Lijie Fan", "url": "http://mlsys.org/api/miniconf/users/27824?format=json", "institution": "Google DeepMind"}, {"id": 12450, "fullname": "Mohammad Alizadeh", "url": "http://mlsys.org/api/miniconf/users/12450?format=json", "institution": "MIT CSAIL"}, {"id": 13201, "fullname": "Dina Katabi", "url": "http://mlsys.org/api/miniconf/users/13201?format=json", "institution": "MIT"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3616", "url": null, "sourceid": 105, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=GaBGzA7fpe", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 910, "modified": "2026-03-23T21:52:47.459053-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=GaBGzA7fpe", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "15", "related_events": ["http://mlsys.org/api/miniconf/events/3839?format=json"], "related_events_ids": [3839]}, {"id": 3775, "uid": "e2c420d928d4bf8ce0ff2ec19b371514", "name": "MTraining: Distributed Dynamic Sparse Attention for Efficient Ultra-Long Context Training", "authors": [{"id": 27464, "fullname": "Wenxuan Li", "url": "http://mlsys.org/api/miniconf/users/27464?format=json", "institution": "Microsoft Research Asia"}, {"id": 27465, "fullname": "Chengruidong Zhang", "url": "http://mlsys.org/api/miniconf/users/27465?format=json", "institution": "Alibaba Group"}, {"id": 27466, "fullname": "Huiqiang Jiang", "url": "http://mlsys.org/api/miniconf/users/27466?format=json", "institution": "Qwen"}, {"id": 27467, "fullname": "Yucheng Li", "url": "http://mlsys.org/api/miniconf/users/27467?format=json", "institution": "Alibaba Group"}, {"id": 27468, "fullname": "Yuqing Yang", "url": "http://mlsys.org/api/miniconf/users/27468?format=json", "institution": null}, {"id": 27469, "fullname": "Lili Qiu", "url": "http://mlsys.org/api/miniconf/users/27469?format=json", "institution": "Microsoft Research Asia"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3775", "url": null, "sourceid": -71, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T09:15:00-07:00", "endtime": "2026-05-20T09:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3679?format=json", "parent_id": 3679, "eventmedia": [{"id": 1142, "modified": "2026-05-15T23:58:31.953566-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3775_6HYrxML.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3552?format=json"], "related_events_ids": [3552]}, {"id": 3569, "uid": "9bf31c7ff062936a96d3c8bd1f8f2ff3", "name": "EarthSight: A Distributed Framework for Low-Latency Satellite Intelligence", "authors": [{"id": 27599, "fullname": "Ansel Erol", "url": "http://mlsys.org/api/miniconf/users/27599?format=json", "institution": "Georgia Institute of Technology"}, {"id": 28491, "fullname": "Seungjun Lee", "url": "http://mlsys.org/api/miniconf/users/28491?format=json", "institution": "Korea Advanced Institute of Science &amp; Technology"}, {"id": 27358, "fullname": "Divya Mahajan", "url": "http://mlsys.org/api/miniconf/users/27358?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3569", "url": "https://www.github.com/scai-tech/earthsight", "sourceid": 15, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=c3O6DnhUYm", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 863, "modified": "2026-03-23T21:52:45.635713-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=c3O6DnhUYm", "resourcetype": "UriEventmedia"}, {"id": 939, "file": "/media/PosterPDFs/MLSys%202026/3569.png", "modified": "2026-04-18T09:03:06.586917-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 940, "file": "/media/PosterPDFs/MLSys%202026/3569-thumb.png", "modified": "2026-04-18T09:04:45.045034-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "19", "related_events": ["http://mlsys.org/api/miniconf/events/3792?format=json"], "related_events_ids": [3792]}, {"id": 3624, "uid": "5f93f983524def3dca464469d2cf9f3e", "name": "Massive-Scale Out-Of-Core UMAP on the GPU", "authors": [{"id": 27164, "fullname": "Jinsol Park", "url": "http://mlsys.org/api/miniconf/users/27164?format=json", "institution": "NVIDIA"}, {"id": 11859, "fullname": "Corey Nolet", "url": "http://mlsys.org/api/miniconf/users/11859?format=json", "institution": "NVIDIA"}, {"id": 14733, "fullname": "Edward Raff", "url": "http://mlsys.org/api/miniconf/users/14733?format=json", "institution": "Booz Allen Hamilton"}, {"id": 27846, "fullname": "Tim Oates", "url": "http://mlsys.org/api/miniconf/users/27846?format=json", "institution": "University of Maryland, Baltimore County"}, {"id": 27847, "fullname": "Akira Naruse", "url": "http://mlsys.org/api/miniconf/users/27847?format=json", "institution": "NVIDIA"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3624", "url": null, "sourceid": 110, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=CR35IJQD2J", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 918, "modified": "2026-03-23T21:52:47.789624-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=CR35IJQD2J", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "23", "related_events": ["http://mlsys.org/api/miniconf/events/3847?format=json"], "related_events_ids": [3847]}, {"id": 3638, "uid": "c9f0f895fb98ab9159f51fd0297e236d", "name": "Charon: A Unified and Fine-Grained Simulator for Large-Scale LLM Training and Inference", "authors": [{"id": 25502, "fullname": "Mengtian Yang", "url": "http://mlsys.org/api/miniconf/users/25502?format=json", "institution": "ByteDance Seed"}, {"id": 27169, "fullname": "Zhekun Zhang", "url": "http://mlsys.org/api/miniconf/users/27169?format=json", "institution": "ByteDance Inc."}, {"id": 25517, "fullname": "Mingheng Wu", "url": "http://mlsys.org/api/miniconf/users/25517?format=json", "institution": "ByteDance Seed"}, {"id": 27965, "fullname": "jianwen yan", "url": "http://mlsys.org/api/miniconf/users/27965?format=json", "institution": ""}, {"id": 27966, "fullname": "Hanshi Sun", "url": "http://mlsys.org/api/miniconf/users/27966?format=json", "institution": "ByteDance Seed"}, {"id": 20944, "fullname": "Li-Wen Chang", "url": "http://mlsys.org/api/miniconf/users/20944?format=json", "institution": "ByteDance Inc."}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3638", "url": null, "sourceid": 8, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=19O6GAS7Su", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 932, "modified": "2026-03-23T21:52:48.378560-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=19O6GAS7Su", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "24", "related_events": ["http://mlsys.org/api/miniconf/events/3861?format=json"], "related_events_ids": [3861]}, {"id": 3576, "uid": "4c56ff4ce4aaf9573aa5dff913df997a", "name": "DriftBench: Measuring and Predicting Infrastructure Drift in LLM Serving Systems", "authors": [{"id": 25492, "fullname": "Gianluigi Vitale", "url": "http://mlsys.org/api/miniconf/users/25492?format=json", "institution": "Universitas Mercatorum"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3576", "url": null, "sourceid": 121, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=Xfzzp6grRP", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 870, "modified": "2026-03-23T21:52:45.920644-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=Xfzzp6grRP", "resourcetype": "UriEventmedia"}, {"id": 1000, "file": "/media/PosterPDFs/MLSys%202026/3576.png", "modified": "2026-05-13T07:20:21.477299-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1001, "file": "/media/PosterPDFs/MLSys%202026/3576-thumb.png", "modified": "2026-05-13T07:20:21.569078-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1002, "modified": "2026-05-13T07:34:12.377412-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3576_1JOoaYa.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "29", "related_events": ["http://mlsys.org/api/miniconf/events/3799?format=json"], "related_events_ids": [3799]}, {"id": 3743, "uid": "698d51a19d8a121ce581499d7b701668", "name": "FarSkip-Collective: Unhobbling Blocking Communication in Mixture of Experts Models", "authors": [{"id": 26274, "fullname": "Yonatan Dukler", "url": "http://mlsys.org/api/miniconf/users/26274?format=json", "institution": "AMD"}, {"id": 27232, "fullname": "Guihong Li", "url": "http://mlsys.org/api/miniconf/users/27232?format=json", "institution": null}, {"id": 27233, "fullname": "Deval Shah", "url": "http://mlsys.org/api/miniconf/users/27233?format=json", "institution": null}, {"id": 28438, "fullname": "Jiang Liu", "url": "http://mlsys.org/api/miniconf/users/28438?format=json", "institution": "Advanced Micro Devices"}, {"id": 27234, "fullname": "Vikram Appia", "url": "http://mlsys.org/api/miniconf/users/27234?format=json", "institution": "Advanced Micro Devices"}, {"id": 12648, "fullname": "Emad Barsoum", "url": "http://mlsys.org/api/miniconf/users/12648?format=json", "institution": "Cerebras"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 4", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3743", "url": null, "sourceid": -111, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T16:00:00-07:00", "endtime": "2026-05-20T16:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3691?format=json", "parent_id": 3691, "eventmedia": [{"id": 1165, "modified": "2026-05-16T19:24:10.256120-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3743.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3520?format=json"], "related_events_ids": [3520]}, {"id": 3520, "uid": "698d51a19d8a121ce581499d7b701668", "name": "FarSkip-Collective: Unhobbling Blocking Communication in Mixture of Experts Models", "authors": [{"id": 26274, "fullname": "Yonatan Dukler", "url": "http://mlsys.org/api/miniconf/users/26274?format=json", "institution": "AMD"}, {"id": 27232, "fullname": "Guihong Li", "url": "http://mlsys.org/api/miniconf/users/27232?format=json", "institution": null}, {"id": 27233, "fullname": "Deval Shah", "url": "http://mlsys.org/api/miniconf/users/27233?format=json", "institution": null}, {"id": 28438, "fullname": "Jiang Liu", "url": "http://mlsys.org/api/miniconf/users/28438?format=json", "institution": "Advanced Micro Devices"}, {"id": 27234, "fullname": "Vikram Appia", "url": "http://mlsys.org/api/miniconf/users/27234?format=json", "institution": "Advanced Micro Devices"}, {"id": 12648, "fullname": "Emad Barsoum", "url": "http://mlsys.org/api/miniconf/users/12648?format=json", "institution": "Cerebras"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3520", "url": null, "sourceid": 111, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=ruOpvLzsGV", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 814, "modified": "2026-03-23T21:52:43.667545-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=ruOpvLzsGV", "resourcetype": "UriEventmedia"}, {"id": 1166, "file": "/media/PosterPDFs/MLSys%202026/3520.png", "modified": "2026-05-16T19:30:24.730571-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "32", "related_events": ["http://mlsys.org/api/miniconf/events/3743?format=json"], "related_events_ids": [3743]}, {"id": 3546, "uid": "1ff1de774005f8da13f42943881c655f", "name": "FaaScale: Unlocking Fast LLM Scaling for Serverless Inference", "authors": [{"id": 27398, "fullname": "Minchen Yu", "url": "http://mlsys.org/api/miniconf/users/27398?format=json", "institution": "The Chinese University of Hong Kong, Shenzhen"}, {"id": 27399, "fullname": "Rui Yang", "url": "http://mlsys.org/api/miniconf/users/27399?format=json", "institution": "University of Virginia"}, {"id": 27400, "fullname": "Chaobo Jia", "url": "http://mlsys.org/api/miniconf/users/27400?format=json", "institution": null}, {"id": 27401, "fullname": "Zhaoyuan Su", "url": "http://mlsys.org/api/miniconf/users/27401?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27402, "fullname": "Sheng Yao", "url": "http://mlsys.org/api/miniconf/users/27402?format=json", "institution": "The Hong Kong University of Science and Technology"}, {"id": 27403, "fullname": "Tingfeng Lan", "url": "http://mlsys.org/api/miniconf/users/27403?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27404, "fullname": "Yuchen Yang", "url": "http://mlsys.org/api/miniconf/users/27404?format=json", "institution": null}, {"id": 27405, "fullname": "Zirui Wang", "url": "http://mlsys.org/api/miniconf/users/27405?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27406, "fullname": "Yue Cheng", "url": "http://mlsys.org/api/miniconf/users/27406?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27407, "fullname": "Wei Wang", "url": "http://mlsys.org/api/miniconf/users/27407?format=json", "institution": "HKUST"}, {"id": 27408, "fullname": "Ao Wang", "url": "http://mlsys.org/api/miniconf/users/27408?format=json", "institution": null}, {"id": 27409, "fullname": "Ruichuan Chen", "url": "http://mlsys.org/api/miniconf/users/27409?format=json", "institution": "Nokia Bell Labs"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3546", "url": null, "sourceid": 24, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=jgL8LuOVyT", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 840, "modified": "2026-03-23T21:52:44.651887-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=jgL8LuOVyT", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "11", "related_events": ["http://mlsys.org/api/miniconf/events/3769?format=json"], "related_events_ids": [3769]}, {"id": 3769, "uid": "1ff1de774005f8da13f42943881c655f", "name": "FaaScale: Unlocking Fast LLM Scaling for Serverless Inference", "authors": [{"id": 27398, "fullname": "Minchen Yu", "url": "http://mlsys.org/api/miniconf/users/27398?format=json", "institution": "The Chinese University of Hong Kong, Shenzhen"}, {"id": 27399, "fullname": "Rui Yang", "url": "http://mlsys.org/api/miniconf/users/27399?format=json", "institution": "University of Virginia"}, {"id": 27400, "fullname": "Chaobo Jia", "url": "http://mlsys.org/api/miniconf/users/27400?format=json", "institution": null}, {"id": 27401, "fullname": "Zhaoyuan Su", "url": "http://mlsys.org/api/miniconf/users/27401?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27402, "fullname": "Sheng Yao", "url": "http://mlsys.org/api/miniconf/users/27402?format=json", "institution": "The Hong Kong University of Science and Technology"}, {"id": 27403, "fullname": "Tingfeng Lan", "url": "http://mlsys.org/api/miniconf/users/27403?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27404, "fullname": "Yuchen Yang", "url": "http://mlsys.org/api/miniconf/users/27404?format=json", "institution": null}, {"id": 27405, "fullname": "Zirui Wang", "url": "http://mlsys.org/api/miniconf/users/27405?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27406, "fullname": "Yue Cheng", "url": "http://mlsys.org/api/miniconf/users/27406?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27407, "fullname": "Wei Wang", "url": "http://mlsys.org/api/miniconf/users/27407?format=json", "institution": "HKUST"}, {"id": 27408, "fullname": "Ao Wang", "url": "http://mlsys.org/api/miniconf/users/27408?format=json", "institution": null}, {"id": 27409, "fullname": "Ruichuan Chen", "url": "http://mlsys.org/api/miniconf/users/27409?format=json", "institution": "Nokia Bell Labs"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 2", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3769", "url": null, "sourceid": -24, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T09:45:00-07:00", "endtime": "2026-05-20T10:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3678?format=json", "parent_id": 3678, "eventmedia": [{"id": 1035, "modified": "2026-05-14T07:43:18.404441-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3769.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3546?format=json"], "related_events_ids": [3546]}, {"id": 3548, "uid": "f7177163c833dff4b38fc8d2872f1ec6", "name": "DynaFlow: Transparent and Flexible Intra-Device Parallelism via Programmable Operator Scheduling", "authors": [{"id": 27415, "fullname": "Yi Pan", "url": "http://mlsys.org/api/miniconf/users/27415?format=json", "institution": "Shanghai Jiao Tong University"}, {"id": 27416, "fullname": "Yile Gu", "url": "http://mlsys.org/api/miniconf/users/27416?format=json", "institution": "Department of Computer Science, University of Washington"}, {"id": 25662, "fullname": "Luo Jinbin", "url": "http://mlsys.org/api/miniconf/users/25662?format=json", "institution": "Shanghai Jiao Tong University"}, {"id": 27417, "fullname": "Yibo Wu", "url": "http://mlsys.org/api/miniconf/users/27417?format=json", "institution": "University of Washington; University of Wisconsin Madison"}, {"id": 27418, "fullname": "Ziren Wang", "url": "http://mlsys.org/api/miniconf/users/27418?format=json", "institution": "Tsinghua University"}, {"id": 27419, "fullname": "Hongtao Zhang", "url": "http://mlsys.org/api/miniconf/users/27419?format=json", "institution": null}, {"id": 20912, "fullname": "Ziyi Xu", "url": "http://mlsys.org/api/miniconf/users/20912?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 27420, "fullname": "Shengkai Lin", "url": "http://mlsys.org/api/miniconf/users/27420?format=json", "institution": "Shanghai Jiao Tong University"}, {"id": 17670, "fullname": "Baris Kasikci", "url": "http://mlsys.org/api/miniconf/users/17670?format=json", "institution": "University of Washington"}, {"id": 17972, "fullname": "Stephanie Wang", "url": "http://mlsys.org/api/miniconf/users/17972?format=json", "institution": "UW &amp; Anyscale"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3548", "url": null, "sourceid": 44, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=i0yqC9954S", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 842, "modified": "2026-03-23T21:52:44.736245-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=i0yqC9954S", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "39", "related_events": ["http://mlsys.org/api/miniconf/events/3771?format=json"], "related_events_ids": [3771]}, {"id": 3771, "uid": "f7177163c833dff4b38fc8d2872f1ec6", "name": "DynaFlow: Transparent and Flexible Intra-Device Parallelism via Programmable Operator Scheduling", "authors": [{"id": 27415, "fullname": "Yi Pan", "url": "http://mlsys.org/api/miniconf/users/27415?format=json", "institution": "Shanghai Jiao Tong University"}, {"id": 27416, "fullname": "Yile Gu", "url": "http://mlsys.org/api/miniconf/users/27416?format=json", "institution": "Department of Computer Science, University of Washington"}, {"id": 25662, "fullname": "Luo Jinbin", "url": "http://mlsys.org/api/miniconf/users/25662?format=json", "institution": "Shanghai Jiao Tong University"}, {"id": 27417, "fullname": "Yibo Wu", "url": "http://mlsys.org/api/miniconf/users/27417?format=json", "institution": "University of Washington; University of Wisconsin Madison"}, {"id": 27418, "fullname": "Ziren Wang", "url": "http://mlsys.org/api/miniconf/users/27418?format=json", "institution": "Tsinghua University"}, {"id": 27419, "fullname": "Hongtao Zhang", "url": "http://mlsys.org/api/miniconf/users/27419?format=json", "institution": null}, {"id": 20912, "fullname": "Ziyi Xu", "url": "http://mlsys.org/api/miniconf/users/20912?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 27420, "fullname": "Shengkai Lin", "url": "http://mlsys.org/api/miniconf/users/27420?format=json", "institution": "Shanghai Jiao Tong University"}, {"id": 17670, "fullname": "Baris Kasikci", "url": "http://mlsys.org/api/miniconf/users/17670?format=json", "institution": "University of Washington"}, {"id": 17972, "fullname": "Stephanie Wang", "url": "http://mlsys.org/api/miniconf/users/17972?format=json", "institution": "UW &amp; Anyscale"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Compilers and Kernels", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3771", "url": "https://github.com/uw-syfi/DynaFlow", "sourceid": -44, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T17:15:00-07:00", "endtime": "2026-05-21T17:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3718?format=json", "parent_id": 3718, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3548?format=json"], "related_events_ids": [3548]}, {"id": 3833, "uid": "a97da629b098b75c294dffdc3e463904", "name": "BatchLLM: Optimizing Large Batched LLM Inference with Global Prefix Sharing and Throughput-oriented Token Batching", "authors": [{"id": 28440, "fullname": "Zhen Zheng", "url": "http://mlsys.org/api/miniconf/users/28440?format=json", "institution": "ByteDance Inc."}, {"id": 28468, "fullname": "Xin Ji", "url": "http://mlsys.org/api/miniconf/users/28468?format=json", "institution": "Microsoft"}, {"id": 25922, "fullname": "Taosong Fang", "url": "http://mlsys.org/api/miniconf/users/25922?format=json", "institution": "Institute of Software Chinese Academy of Sciences"}, {"id": 27794, "fullname": "Fanghao Zhou", "url": "http://mlsys.org/api/miniconf/users/27794?format=json", "institution": "Microsoft Corp."}, {"id": 27642, "fullname": "Chuanjie Liu", "url": "http://mlsys.org/api/miniconf/users/27642?format=json", "institution": "Microsoft"}, {"id": 27795, "fullname": "Gang Peng", "url": "http://mlsys.org/api/miniconf/users/27795?format=json", "institution": null}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Agentic AI/MLSys", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3833", "url": null, "sourceid": -107, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T09:45:00-07:00", "endtime": "2026-05-21T10:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3700?format=json", "parent_id": 3700, "eventmedia": [{"id": 1170, "modified": "2026-05-16T23:59:06.579743-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3833.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3610?format=json"], "related_events_ids": [3610]}, {"id": 3610, "uid": "a97da629b098b75c294dffdc3e463904", "name": "BatchLLM: Optimizing Large Batched LLM Inference with Global Prefix Sharing and Throughput-oriented Token Batching", "authors": [{"id": 28440, "fullname": "Zhen Zheng", "url": "http://mlsys.org/api/miniconf/users/28440?format=json", "institution": "ByteDance Inc."}, {"id": 28468, "fullname": "Xin Ji", "url": "http://mlsys.org/api/miniconf/users/28468?format=json", "institution": "Microsoft"}, {"id": 25922, "fullname": "Taosong Fang", "url": "http://mlsys.org/api/miniconf/users/25922?format=json", "institution": "Institute of Software Chinese Academy of Sciences"}, {"id": 27794, "fullname": "Fanghao Zhou", "url": "http://mlsys.org/api/miniconf/users/27794?format=json", "institution": "Microsoft Corp."}, {"id": 27642, "fullname": "Chuanjie Liu", "url": "http://mlsys.org/api/miniconf/users/27642?format=json", "institution": "Microsoft"}, {"id": 27795, "fullname": "Gang Peng", "url": "http://mlsys.org/api/miniconf/users/27795?format=json", "institution": null}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3610", "url": null, "sourceid": 107, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=IuVHde07l6", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 904, "modified": "2026-03-23T21:52:47.187677-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=IuVHde07l6", "resourcetype": "UriEventmedia"}, {"id": 1173, "file": "/media/PosterPDFs/MLSys%202026/3610.png", "modified": "2026-05-17T07:52:15.373246-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1174, "file": "/media/PosterPDFs/MLSys%202026/3610-thumb.png", "modified": "2026-05-17T07:52:15.507443-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "14", "related_events": ["http://mlsys.org/api/miniconf/events/3833?format=json"], "related_events_ids": [3833]}, {"id": 3865, "uid": "6364d3f0f495b6ab9dcf8d3b5c6e0b01", "name": "OSWorld-Human: Benchmarking the Efficiency of Computer-Use Agents", "authors": [{"id": 27412, "fullname": "Reyna Abhyankar", "url": "http://mlsys.org/api/miniconf/users/27412?format=json", "institution": "Together AI"}, {"id": 27985, "fullname": "Qi Qi", "url": "http://mlsys.org/api/miniconf/users/27985?format=json", "institution": "University of California, San Diego"}, {"id": 26292, "fullname": "Yiying Zhang", "url": "http://mlsys.org/api/miniconf/users/26292?format=json", "institution": "UCSD and GenseeAI"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Agentic AI 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3865", "url": null, "sourceid": -32, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T13:00:00-07:00", "endtime": "2026-05-19T13:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3668?format=json", "parent_id": 3668, "eventmedia": [{"id": 1177, "modified": "2026-05-17T11:45:37.011855-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3865.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3642?format=json"], "related_events_ids": [3642]}, {"id": 3552, "uid": "e2c420d928d4bf8ce0ff2ec19b371514", "name": "MTraining: Distributed Dynamic Sparse Attention for Efficient Ultra-Long Context Training", "authors": [{"id": 27464, "fullname": "Wenxuan Li", "url": "http://mlsys.org/api/miniconf/users/27464?format=json", "institution": "Microsoft Research Asia"}, {"id": 27465, "fullname": "Chengruidong Zhang", "url": "http://mlsys.org/api/miniconf/users/27465?format=json", "institution": "Alibaba Group"}, {"id": 27466, "fullname": "Huiqiang Jiang", "url": "http://mlsys.org/api/miniconf/users/27466?format=json", "institution": "Qwen"}, {"id": 27467, "fullname": "Yucheng Li", "url": "http://mlsys.org/api/miniconf/users/27467?format=json", "institution": "Alibaba Group"}, {"id": 27468, "fullname": "Yuqing Yang", "url": "http://mlsys.org/api/miniconf/users/27468?format=json", "institution": null}, {"id": 27469, "fullname": "Lili Qiu", "url": "http://mlsys.org/api/miniconf/users/27469?format=json", "institution": "Microsoft Research Asia"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3552", "url": null, "sourceid": 71, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=h6SD2zgwGq", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 846, "modified": "2026-03-23T21:52:44.915489-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=h6SD2zgwGq", "resourcetype": "UriEventmedia"}, {"id": 999, "file": "/media/PosterPDFs/MLSys%202026/3552.png", "modified": "2026-05-13T06:45:17.970039-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "8", "related_events": ["http://mlsys.org/api/miniconf/events/3775?format=json"], "related_events_ids": [3775]}, {"id": 3778, "uid": "68d30a9594728bc39aa24be94b319d21", "name": "Wave: A Symbolic Python DSL And Compiler for High-Performance Machine Learning", "authors": [{"id": 18549, "fullname": "Harsh Menon", "url": "http://mlsys.org/api/miniconf/users/18549?format=json", "institution": "AMD"}, {"id": 28460, "fullname": "Oleksandr Zinenko", "url": "http://mlsys.org/api/miniconf/users/28460?format=json", "institution": "Advanced Micro Devices"}, {"id": 25620, "fullname": "Gaurav Verma", "url": "http://mlsys.org/api/miniconf/users/25620?format=json", "institution": "Advanced Micro Devices, Inc. (AMD) and Stony Brook University, NY"}, {"id": 27188, "fullname": "Stanley Winata", "url": "http://mlsys.org/api/miniconf/users/27188?format=json", "institution": null}, {"id": 27487, "fullname": "Ivan Butygin", "url": "http://mlsys.org/api/miniconf/users/27487?format=json", "institution": null}, {"id": 27488, "fullname": "Nithin Meganathan", "url": "http://mlsys.org/api/miniconf/users/27488?format=json", "institution": "AMD"}, {"id": 27147, "fullname": "Sanket Pandit", "url": "http://mlsys.org/api/miniconf/users/27147?format=json", "institution": "Advanced Micro Devices"}, {"id": 27489, "fullname": "William Gallard Hatch", "url": "http://mlsys.org/api/miniconf/users/27489?format=json", "institution": "AMD"}, {"id": 27490, "fullname": "Surya Jasper", "url": "http://mlsys.org/api/miniconf/users/27490?format=json", "institution": null}, {"id": 27491, "fullname": "Megan Kuo", "url": "http://mlsys.org/api/miniconf/users/27491?format=json", "institution": null}, {"id": 27492, "fullname": "Sahil FAIZAL", "url": "http://mlsys.org/api/miniconf/users/27492?format=json", "institution": "AMD"}, {"id": 27493, "fullname": "Ashay Rane", "url": "http://mlsys.org/api/miniconf/users/27493?format=json", "institution": null}, {"id": 27494, "fullname": "Aurore De Spirlet", "url": "http://mlsys.org/api/miniconf/users/27494?format=json", "institution": null}, {"id": 26125, "fullname": "Martin P. L\u00fccke", "url": "http://mlsys.org/api/miniconf/users/26125?format=json", "institution": "AMD"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Compilers/HW", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3778", "url": null, "sourceid": -84, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-22T08:45:00-07:00", "endtime": "2026-05-22T09:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3721?format=json", "parent_id": 3721, "eventmedia": [{"id": 1040, "modified": "2026-05-15T10:34:50.587584-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3778_wPh602N.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3555?format=json"], "related_events_ids": [3555]}, {"id": 3571, "uid": "5ef059938ba799aaa845e1c2e8a762bd", "name": "MAC-Attention: a Match--Amend--Complete scheme for fast and accurate attention computation", "authors": [{"id": 19233, "fullname": "Jinghan Yao", "url": "http://mlsys.org/api/miniconf/users/19233?format=json", "institution": "The Ohio State University"}, {"id": 21021, "fullname": "Sam Jacobs", "url": "http://mlsys.org/api/miniconf/users/21021?format=json", "institution": "Microsoft"}, {"id": 27604, "fullname": "Walid Krichene", "url": "http://mlsys.org/api/miniconf/users/27604?format=json", "institution": "Microsoft"}, {"id": 27605, "fullname": "Masahiro Tanaka", "url": "http://mlsys.org/api/miniconf/users/27605?format=json", "institution": "Anyscale"}, {"id": 20998, "fullname": "Dhabaleswar Panda", "url": "http://mlsys.org/api/miniconf/users/20998?format=json", "institution": "Ohio State University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3571", "url": null, "sourceid": 118, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=b6HBRCejb7", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 865, "modified": "2026-03-23T21:52:45.719722-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=b6HBRCejb7", "resourcetype": "UriEventmedia"}, {"id": 948, "file": "/media/PosterPDFs/MLSys%202026/3571.png", "modified": "2026-04-25T09:50:27.715829-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 949, "file": "/media/PosterPDFs/MLSys%202026/3571-thumb.png", "modified": "2026-04-25T09:50:27.817827-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "19", "related_events": ["http://mlsys.org/api/miniconf/events/3794?format=json"], "related_events_ids": [3794]}, {"id": 3864, "uid": "92cc227532d17e56e07902b254dfad10", "name": "SkipKV: Selective Skipping of KV Generation and Storage for Efficient Inference with Large Reasoning Models", "authors": [{"id": 27979, "fullname": "Jiayi Tian", "url": "http://mlsys.org/api/miniconf/users/27979?format=json", "institution": "University of California, Santa Barbara"}, {"id": 27980, "fullname": "Seyedarmin Azizi", "url": "http://mlsys.org/api/miniconf/users/27980?format=json", "institution": "University of Southern California"}, {"id": 24084, "fullname": "Yequan Zhao", "url": "http://mlsys.org/api/miniconf/users/24084?format=json", "institution": "University of California Santa Barbara"}, {"id": 27981, "fullname": "Erfan Potraghloo", "url": "http://mlsys.org/api/miniconf/users/27981?format=json", "institution": "University of Southern California"}, {"id": 27982, "fullname": "Sean McPherson", "url": "http://mlsys.org/api/miniconf/users/27982?format=json", "institution": "Intel"}, {"id": 27983, "fullname": "Sharath Nittur Sridhar", "url": "http://mlsys.org/api/miniconf/users/27983?format=json", "institution": "Intel Labs"}, {"id": 23955, "fullname": "Zhengyang Wang", "url": "http://mlsys.org/api/miniconf/users/23955?format=json", "institution": "University of California, Santa Barbara"}, {"id": 24510, "fullname": "zheng Zhang", "url": "http://mlsys.org/api/miniconf/users/24510?format=json", "institution": "University of California, Santa Barbara"}, {"id": 27347, "fullname": "Massoud Pedram", "url": "http://mlsys.org/api/miniconf/users/27347?format=json", "institution": "University of Southern California"}, {"id": 27984, "fullname": "Souvik Kundu", "url": "http://mlsys.org/api/miniconf/users/27984?format=json", "institution": "Intel"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 3", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3864", "url": null, "sourceid": -92, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T13:30:00-07:00", "endtime": "2026-05-20T13:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3687?format=json", "parent_id": 3687, "eventmedia": [{"id": 1163, "modified": "2026-05-17T15:58:42.143232-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3864_lxfVaNQ.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3641?format=json"], "related_events_ids": [3641]}, {"id": 3641, "uid": "92cc227532d17e56e07902b254dfad10", "name": "SkipKV: Selective Skipping of KV Generation and Storage for Efficient Inference with Large Reasoning Models", "authors": [{"id": 27979, "fullname": "Jiayi Tian", "url": "http://mlsys.org/api/miniconf/users/27979?format=json", "institution": "University of California, Santa Barbara"}, {"id": 27980, "fullname": "Seyedarmin Azizi", "url": "http://mlsys.org/api/miniconf/users/27980?format=json", "institution": "University of Southern California"}, {"id": 24084, "fullname": "Yequan Zhao", "url": "http://mlsys.org/api/miniconf/users/24084?format=json", "institution": "University of California Santa Barbara"}, {"id": 27981, "fullname": "Erfan Potraghloo", "url": "http://mlsys.org/api/miniconf/users/27981?format=json", "institution": "University of Southern California"}, {"id": 27982, "fullname": "Sean McPherson", "url": "http://mlsys.org/api/miniconf/users/27982?format=json", "institution": "Intel"}, {"id": 27983, "fullname": "Sharath Nittur Sridhar", "url": "http://mlsys.org/api/miniconf/users/27983?format=json", "institution": "Intel Labs"}, {"id": 23955, "fullname": "Zhengyang Wang", "url": "http://mlsys.org/api/miniconf/users/23955?format=json", "institution": "University of California, Santa Barbara"}, {"id": 24510, "fullname": "zheng Zhang", "url": "http://mlsys.org/api/miniconf/users/24510?format=json", "institution": "University of California, Santa Barbara"}, {"id": 27347, "fullname": "Massoud Pedram", "url": "http://mlsys.org/api/miniconf/users/27347?format=json", "institution": "University of Southern California"}, {"id": 27984, "fullname": "Souvik Kundu", "url": "http://mlsys.org/api/miniconf/users/27984?format=json", "institution": "Intel"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3641", "url": null, "sourceid": 92, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=0EsV9SIm8p", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 935, "modified": "2026-03-23T21:52:48.481281-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=0EsV9SIm8p", "resourcetype": "UriEventmedia"}, {"id": 1167, "file": "/media/PosterPDFs/MLSys%202026/3641.png", "modified": "2026-05-17T16:48:28.289774-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1191, "modified": "2026-05-17T16:26:38.737817-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3641.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "13", "related_events": ["http://mlsys.org/api/miniconf/events/3864?format=json"], "related_events_ids": [3864]}, {"id": 3780, "uid": "c7e1249ffc03eb9ded908c236bd1996d", "name": "Optimizing Deployment Configurations for LLM Inference", "authors": [{"id": 27501, "fullname": "Sungmin Cho", "url": "http://mlsys.org/api/miniconf/users/27501?format=json", "institution": "Meta"}, {"id": 27148, "fullname": "Jaewon Lee", "url": "http://mlsys.org/api/miniconf/users/27148?format=json", "institution": "Meta"}, {"id": 28959, "fullname": "Chunqiang Tang", "url": "http://mlsys.org/api/miniconf/users/28959?format=json", "institution": "Facebook"}, {"id": 27503, "fullname": "Yejin Lee", "url": "http://mlsys.org/api/miniconf/users/27503?format=json", "institution": "META"}, {"id": 13318, "fullname": "Geonhwa Jeong", "url": "http://mlsys.org/api/miniconf/users/13318?format=json", "institution": "Meta"}, {"id": 27504, "fullname": "Anca Agape", "url": "http://mlsys.org/api/miniconf/users/27504?format=json", "institution": null}, {"id": 27505, "fullname": "Scott Batura", "url": "http://mlsys.org/api/miniconf/users/27505?format=json", "institution": null}, {"id": 27506, "fullname": "Vincent Boivin", "url": "http://mlsys.org/api/miniconf/users/27506?format=json", "institution": null}, {"id": 27507, "fullname": "Stephen Chen", "url": "http://mlsys.org/api/miniconf/users/27507?format=json", "institution": null}, {"id": 27508, "fullname": "Renfei Chen", "url": "http://mlsys.org/api/miniconf/users/27508?format=json", "institution": null}, {"id": 27509, "fullname": "Sijia Chen", "url": "http://mlsys.org/api/miniconf/users/27509?format=json", "institution": "Facebook"}, {"id": 27510, "fullname": "Yan Cui", "url": "http://mlsys.org/api/miniconf/users/27510?format=json", "institution": null}, {"id": 27511, "fullname": "Bradley Davis", "url": "http://mlsys.org/api/miniconf/users/27511?format=json", "institution": null}, {"id": 27512, "fullname": "Summer Deng", "url": "http://mlsys.org/api/miniconf/users/27512?format=json", "institution": "Facebook"}, {"id": 27513, "fullname": "Nick Egebo", "url": "http://mlsys.org/api/miniconf/users/27513?format=json", "institution": null}, {"id": 27149, "fullname": "Emad El-Haraty", "url": "http://mlsys.org/api/miniconf/users/27149?format=json", "institution": "Facebook"}, {"id": 27514, "fullname": "Sebastien Estienne", "url": "http://mlsys.org/api/miniconf/users/27514?format=json", "institution": null}, {"id": 27515, "fullname": "Lu Fang", "url": "http://mlsys.org/api/miniconf/users/27515?format=json", "institution": "Facebook"}, {"id": 21303, "fullname": "Lu Fang", "url": "http://mlsys.org/api/miniconf/users/21303?format=json", "institution": "Meta"}, {"id": 27516, "fullname": "Joshua Fromm", "url": "http://mlsys.org/api/miniconf/users/27516?format=json", "institution": "Facebook"}, {"id": 27517, "fullname": "Raj Ganapathy", "url": "http://mlsys.org/api/miniconf/users/27517?format=json", "institution": null}, {"id": 27518, "fullname": "Vedanuj Goswami", "url": "http://mlsys.org/api/miniconf/users/27518?format=json", "institution": null}, {"id": 27519, "fullname": "Liangpeng Guo", "url": "http://mlsys.org/api/miniconf/users/27519?format=json", "institution": "Meta Platforms"}, {"id": 27520, "fullname": "Ye Hu", "url": "http://mlsys.org/api/miniconf/users/27520?format=json", "institution": null}, {"id": 27521, "fullname": "Chenheli Hua", "url": "http://mlsys.org/api/miniconf/users/27521?format=json", "institution": null}, {"id": 20937, "fullname": "Jianyu Huang", "url": "http://mlsys.org/api/miniconf/users/20937?format=json", "institution": "Research, Meta"}, {"id": 20923, "fullname": "Aya Ibrahim", "url": "http://mlsys.org/api/miniconf/users/20923?format=json", "institution": "Meta"}, {"id": 27522, "fullname": "Niranjan Jagannath", "url": "http://mlsys.org/api/miniconf/users/27522?format=json", "institution": null}, {"id": 16156, "fullname": "Hongyi Jia", "url": "http://mlsys.org/api/miniconf/users/16156?format=json", "institution": "Meta"}, {"id": 27523, "fullname": "Changkyu Kim", "url": "http://mlsys.org/api/miniconf/users/27523?format=json", "institution": "Facebook"}, {"id": 27524, "fullname": "Shikai Li", "url": "http://mlsys.org/api/miniconf/users/27524?format=json", "institution": null}, {"id": 27525, "fullname": "Brandon Liu", "url": "http://mlsys.org/api/miniconf/users/27525?format=json", "institution": null}, {"id": 27526, "fullname": "Jiawen Liu", "url": "http://mlsys.org/api/miniconf/users/27526?format=json", "institution": null}, {"id": 27527, "fullname": "Ajit Mathews", "url": "http://mlsys.org/api/miniconf/users/27527?format=json", "institution": null}, {"id": 27150, "fullname": "Xiaozhu Meng", "url": "http://mlsys.org/api/miniconf/users/27150?format=json", "institution": "Facebook"}, {"id": 27528, "fullname": "Vlad Tiberiu Mihailescu", "url": "http://mlsys.org/api/miniconf/users/27528?format=json", "institution": "Meta"}, {"id": 27529, "fullname": "Amit Nagpal", "url": "http://mlsys.org/api/miniconf/users/27529?format=json", "institution": null}, {"id": 15117, "fullname": "Maxim Naumov", "url": "http://mlsys.org/api/miniconf/users/15117?format=json", "institution": "Meta"}, {"id": 27530, "fullname": "Michal Ostrowski", "url": "http://mlsys.org/api/miniconf/users/27530?format=json", "institution": ""}, {"id": 27531, "fullname": "Jialin Ouyang", "url": "http://mlsys.org/api/miniconf/users/27531?format=json", "institution": null}, {"id": 27532, "fullname": "Jason Park", "url": "http://mlsys.org/api/miniconf/users/27532?format=json", "institution": null}, {"id": 16190, "fullname": "Sarunya Pumma", "url": "http://mlsys.org/api/miniconf/users/16190?format=json", "institution": "Meta"}, {"id": 27533, "fullname": "Ye Qi", "url": "http://mlsys.org/api/miniconf/users/27533?format=json", "institution": null}, {"id": 27534, "fullname": "Zixi Qi", "url": "http://mlsys.org/api/miniconf/users/27534?format=json", "institution": null}, {"id": 27535, "fullname": "Jeremy Francis Reizenstein", "url": "http://mlsys.org/api/miniconf/users/27535?format=json", "institution": "Meta AI"}, {"id": 27536, "fullname": "Rajasi Saha", "url": "http://mlsys.org/api/miniconf/users/27536?format=json", "institution": "Facebook"}, {"id": 27537, "fullname": "Nandhini Santhanam", "url": "http://mlsys.org/api/miniconf/users/27537?format=json", "institution": null}, {"id": 27538, "fullname": "Zhan Shu", "url": "http://mlsys.org/api/miniconf/users/27538?format=json", "institution": null}, {"id": 27539, "fullname": "Ruan Silva", "url": "http://mlsys.org/api/miniconf/users/27539?format=json", "institution": "Meta"}, {"id": 27540, "fullname": "Grigory Sizov", "url": "http://mlsys.org/api/miniconf/users/27540?format=json", "institution": null}, {"id": 27151, "fullname": "Jon Swenson", "url": "http://mlsys.org/api/miniconf/users/27151?format=json", "institution": "Facebook"}, {"id": 27541, "fullname": "Brandon Taylor", "url": "http://mlsys.org/api/miniconf/users/27541?format=json", "institution": null}, {"id": 27542, "fullname": "Chris Thi", "url": "http://mlsys.org/api/miniconf/users/27542?format=json", "institution": ""}, {"id": 27543, "fullname": "Adolfo Victoria", "url": "http://mlsys.org/api/miniconf/users/27543?format=json", "institution": null}, {"id": 27152, "fullname": "Yunfan Wang", "url": "http://mlsys.org/api/miniconf/users/27152?format=json", "institution": "Facebook"}, {"id": 27544, "fullname": "Pengchao Wang", "url": "http://mlsys.org/api/miniconf/users/27544?format=json", "institution": "Meta Inc."}, {"id": 23937, "fullname": "Wenchen Wang", "url": "http://mlsys.org/api/miniconf/users/23937?format=json", "institution": null}, {"id": 27545, "fullname": "Xiaodong Wang", "url": "http://mlsys.org/api/miniconf/users/27545?format=json", "institution": null}, {"id": 10964, "fullname": "Bram Wasti", "url": "http://mlsys.org/api/miniconf/users/10964?format=json", "institution": "Facebook"}, {"id": 27546, "fullname": "Wei Xu", "url": "http://mlsys.org/api/miniconf/users/27546?format=json", "institution": null}, {"id": 27547, "fullname": "Qirui Yang", "url": "http://mlsys.org/api/miniconf/users/27547?format=json", "institution": null}, {"id": 20938, "fullname": "Jingyi Yang", "url": "http://mlsys.org/api/miniconf/users/20938?format=json", "institution": "Facebook"}, {"id": 27548, "fullname": "Hector Yuen", "url": "http://mlsys.org/api/miniconf/users/27548?format=json", "institution": null}, {"id": 27549, "fullname": "Zhengyuan Zhang", "url": "http://mlsys.org/api/miniconf/users/27549?format=json", "institution": null}, {"id": 27550, "fullname": "Jing Zhang", "url": "http://mlsys.org/api/miniconf/users/27550?format=json", "institution": "Facebook"}, {"id": 27153, "fullname": "Yi Zhen", "url": "http://mlsys.org/api/miniconf/users/27153?format=json", "institution": "Meta"}, {"id": 27551, "fullname": "Yanjun Zhou", "url": "http://mlsys.org/api/miniconf/users/27551?format=json", "institution": null}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: LLM Serving 6", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3780", "url": null, "sourceid": -87, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T13:30:00-07:00", "endtime": "2026-05-21T13:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3709?format=json", "parent_id": 3709, "eventmedia": [{"id": 1087, "modified": "2026-05-15T10:35:02.398375-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3780.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3557?format=json"], "related_events_ids": [3557]}, {"id": 3557, "uid": "c7e1249ffc03eb9ded908c236bd1996d", "name": "Optimizing Deployment Configurations for LLM Inference", "authors": [{"id": 27501, "fullname": "Sungmin Cho", "url": "http://mlsys.org/api/miniconf/users/27501?format=json", "institution": "Meta"}, {"id": 27148, "fullname": "Jaewon Lee", "url": "http://mlsys.org/api/miniconf/users/27148?format=json", "institution": "Meta"}, {"id": 28959, "fullname": "Chunqiang Tang", "url": "http://mlsys.org/api/miniconf/users/28959?format=json", "institution": "Facebook"}, {"id": 27503, "fullname": "Yejin Lee", "url": "http://mlsys.org/api/miniconf/users/27503?format=json", "institution": "META"}, {"id": 13318, "fullname": "Geonhwa Jeong", "url": "http://mlsys.org/api/miniconf/users/13318?format=json", "institution": "Meta"}, {"id": 27504, "fullname": "Anca Agape", "url": "http://mlsys.org/api/miniconf/users/27504?format=json", "institution": null}, {"id": 27505, "fullname": "Scott Batura", "url": "http://mlsys.org/api/miniconf/users/27505?format=json", "institution": null}, {"id": 27506, "fullname": "Vincent Boivin", "url": "http://mlsys.org/api/miniconf/users/27506?format=json", "institution": null}, {"id": 27507, "fullname": "Stephen Chen", "url": "http://mlsys.org/api/miniconf/users/27507?format=json", "institution": null}, {"id": 27508, "fullname": "Renfei Chen", "url": "http://mlsys.org/api/miniconf/users/27508?format=json", "institution": null}, {"id": 27509, "fullname": "Sijia Chen", "url": "http://mlsys.org/api/miniconf/users/27509?format=json", "institution": "Facebook"}, {"id": 27510, "fullname": "Yan Cui", "url": "http://mlsys.org/api/miniconf/users/27510?format=json", "institution": null}, {"id": 27511, "fullname": "Bradley Davis", "url": "http://mlsys.org/api/miniconf/users/27511?format=json", "institution": null}, {"id": 27512, "fullname": "Summer Deng", "url": "http://mlsys.org/api/miniconf/users/27512?format=json", "institution": "Facebook"}, {"id": 27513, "fullname": "Nick Egebo", "url": "http://mlsys.org/api/miniconf/users/27513?format=json", "institution": null}, {"id": 27149, "fullname": "Emad El-Haraty", "url": "http://mlsys.org/api/miniconf/users/27149?format=json", "institution": "Facebook"}, {"id": 27514, "fullname": "Sebastien Estienne", "url": "http://mlsys.org/api/miniconf/users/27514?format=json", "institution": null}, {"id": 27515, "fullname": "Lu Fang", "url": "http://mlsys.org/api/miniconf/users/27515?format=json", "institution": "Facebook"}, {"id": 21303, "fullname": "Lu Fang", "url": "http://mlsys.org/api/miniconf/users/21303?format=json", "institution": "Meta"}, {"id": 27516, "fullname": "Joshua Fromm", "url": "http://mlsys.org/api/miniconf/users/27516?format=json", "institution": "Facebook"}, {"id": 27517, "fullname": "Raj Ganapathy", "url": "http://mlsys.org/api/miniconf/users/27517?format=json", "institution": null}, {"id": 27518, "fullname": "Vedanuj Goswami", "url": "http://mlsys.org/api/miniconf/users/27518?format=json", "institution": null}, {"id": 27519, "fullname": "Liangpeng Guo", "url": "http://mlsys.org/api/miniconf/users/27519?format=json", "institution": "Meta Platforms"}, {"id": 27520, "fullname": "Ye Hu", "url": "http://mlsys.org/api/miniconf/users/27520?format=json", "institution": null}, {"id": 27521, "fullname": "Chenheli Hua", "url": "http://mlsys.org/api/miniconf/users/27521?format=json", "institution": null}, {"id": 20937, "fullname": "Jianyu Huang", "url": "http://mlsys.org/api/miniconf/users/20937?format=json", "institution": "Research, Meta"}, {"id": 20923, "fullname": "Aya Ibrahim", "url": "http://mlsys.org/api/miniconf/users/20923?format=json", "institution": "Meta"}, {"id": 27522, "fullname": "Niranjan Jagannath", "url": "http://mlsys.org/api/miniconf/users/27522?format=json", "institution": null}, {"id": 16156, "fullname": "Hongyi Jia", "url": "http://mlsys.org/api/miniconf/users/16156?format=json", "institution": "Meta"}, {"id": 27523, "fullname": "Changkyu Kim", "url": "http://mlsys.org/api/miniconf/users/27523?format=json", "institution": "Facebook"}, {"id": 27524, "fullname": "Shikai Li", "url": "http://mlsys.org/api/miniconf/users/27524?format=json", "institution": null}, {"id": 27525, "fullname": "Brandon Liu", "url": "http://mlsys.org/api/miniconf/users/27525?format=json", "institution": null}, {"id": 27526, "fullname": "Jiawen Liu", "url": "http://mlsys.org/api/miniconf/users/27526?format=json", "institution": null}, {"id": 27527, "fullname": "Ajit Mathews", "url": "http://mlsys.org/api/miniconf/users/27527?format=json", "institution": null}, {"id": 27150, "fullname": "Xiaozhu Meng", "url": "http://mlsys.org/api/miniconf/users/27150?format=json", "institution": "Facebook"}, {"id": 27528, "fullname": "Vlad Tiberiu Mihailescu", "url": "http://mlsys.org/api/miniconf/users/27528?format=json", "institution": "Meta"}, {"id": 27529, "fullname": "Amit Nagpal", "url": "http://mlsys.org/api/miniconf/users/27529?format=json", "institution": null}, {"id": 15117, "fullname": "Maxim Naumov", "url": "http://mlsys.org/api/miniconf/users/15117?format=json", "institution": "Meta"}, {"id": 27530, "fullname": "Michal Ostrowski", "url": "http://mlsys.org/api/miniconf/users/27530?format=json", "institution": ""}, {"id": 27531, "fullname": "Jialin Ouyang", "url": "http://mlsys.org/api/miniconf/users/27531?format=json", "institution": null}, {"id": 27532, "fullname": "Jason Park", "url": "http://mlsys.org/api/miniconf/users/27532?format=json", "institution": null}, {"id": 16190, "fullname": "Sarunya Pumma", "url": "http://mlsys.org/api/miniconf/users/16190?format=json", "institution": "Meta"}, {"id": 27533, "fullname": "Ye Qi", "url": "http://mlsys.org/api/miniconf/users/27533?format=json", "institution": null}, {"id": 27534, "fullname": "Zixi Qi", "url": "http://mlsys.org/api/miniconf/users/27534?format=json", "institution": null}, {"id": 27535, "fullname": "Jeremy Francis Reizenstein", "url": "http://mlsys.org/api/miniconf/users/27535?format=json", "institution": "Meta AI"}, {"id": 27536, "fullname": "Rajasi Saha", "url": "http://mlsys.org/api/miniconf/users/27536?format=json", "institution": "Facebook"}, {"id": 27537, "fullname": "Nandhini Santhanam", "url": "http://mlsys.org/api/miniconf/users/27537?format=json", "institution": null}, {"id": 27538, "fullname": "Zhan Shu", "url": "http://mlsys.org/api/miniconf/users/27538?format=json", "institution": null}, {"id": 27539, "fullname": "Ruan Silva", "url": "http://mlsys.org/api/miniconf/users/27539?format=json", "institution": "Meta"}, {"id": 27540, "fullname": "Grigory Sizov", "url": "http://mlsys.org/api/miniconf/users/27540?format=json", "institution": null}, {"id": 27151, "fullname": "Jon Swenson", "url": "http://mlsys.org/api/miniconf/users/27151?format=json", "institution": "Facebook"}, {"id": 27541, "fullname": "Brandon Taylor", "url": "http://mlsys.org/api/miniconf/users/27541?format=json", "institution": null}, {"id": 27542, "fullname": "Chris Thi", "url": "http://mlsys.org/api/miniconf/users/27542?format=json", "institution": ""}, {"id": 27543, "fullname": "Adolfo Victoria", "url": "http://mlsys.org/api/miniconf/users/27543?format=json", "institution": null}, {"id": 27152, "fullname": "Yunfan Wang", "url": "http://mlsys.org/api/miniconf/users/27152?format=json", "institution": "Facebook"}, {"id": 27544, "fullname": "Pengchao Wang", "url": "http://mlsys.org/api/miniconf/users/27544?format=json", "institution": "Meta Inc."}, {"id": 23937, "fullname": "Wenchen Wang", "url": "http://mlsys.org/api/miniconf/users/23937?format=json", "institution": null}, {"id": 27545, "fullname": "Xiaodong Wang", "url": "http://mlsys.org/api/miniconf/users/27545?format=json", "institution": null}, {"id": 10964, "fullname": "Bram Wasti", "url": "http://mlsys.org/api/miniconf/users/10964?format=json", "institution": "Facebook"}, {"id": 27546, "fullname": "Wei Xu", "url": "http://mlsys.org/api/miniconf/users/27546?format=json", "institution": null}, {"id": 27547, "fullname": "Qirui Yang", "url": "http://mlsys.org/api/miniconf/users/27547?format=json", "institution": null}, {"id": 20938, "fullname": "Jingyi Yang", "url": "http://mlsys.org/api/miniconf/users/20938?format=json", "institution": "Facebook"}, {"id": 27548, "fullname": "Hector Yuen", "url": "http://mlsys.org/api/miniconf/users/27548?format=json", "institution": null}, {"id": 27549, "fullname": "Zhengyuan Zhang", "url": "http://mlsys.org/api/miniconf/users/27549?format=json", "institution": null}, {"id": 27550, "fullname": "Jing Zhang", "url": "http://mlsys.org/api/miniconf/users/27550?format=json", "institution": "Facebook"}, {"id": 27153, "fullname": "Yi Zhen", "url": "http://mlsys.org/api/miniconf/users/27153?format=json", "institution": "Meta"}, {"id": 27551, "fullname": "Yanjun Zhou", "url": "http://mlsys.org/api/miniconf/users/27551?format=json", "institution": null}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3557", "url": null, "sourceid": 87, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=gEbKQeIdxB", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 851, "modified": "2026-03-23T21:52:45.120481-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=gEbKQeIdxB", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "18", "related_events": ["http://mlsys.org/api/miniconf/events/3780?format=json"], "related_events_ids": [3780]}, {"id": 3558, "uid": "7f6ffaa6bb0b408017b62254211691b5", "name": "AIRS: Scaling Live Inference in Resource Constrained Environments", "authors": [{"id": 27552, "fullname": "Nilesh Jagnik", "url": "http://mlsys.org/api/miniconf/users/27552?format=json", "institution": "Google"}, {"id": 27553, "fullname": "Xiaohao Yang", "url": "http://mlsys.org/api/miniconf/users/27553?format=json", "institution": null}, {"id": 27554, "fullname": "Tuan Do", "url": "http://mlsys.org/api/miniconf/users/27554?format=json", "institution": null}, {"id": 27555, "fullname": "Chelsea Chen", "url": "http://mlsys.org/api/miniconf/users/27555?format=json", "institution": null}, {"id": 27556, "fullname": "Harshvardhan GM", "url": "http://mlsys.org/api/miniconf/users/27556?format=json", "institution": "Google LLC"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3558", "url": null, "sourceid": 112, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=g1RWik4Gy1", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 852, "modified": "2026-03-23T21:52:45.165663-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=g1RWik4Gy1", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "36", "related_events": ["http://mlsys.org/api/miniconf/events/3781?format=json"], "related_events_ids": [3781]}, {"id": 3567, "uid": "9f61408e3afb633e50cdf1b20de6f466", "name": "DreamDDP: Accelerating Low-Bandwidth Geo-Distributed LLM Training with Layer-wise Partial Synchronization", "authors": [{"id": 27588, "fullname": "Zhenheng Tang", "url": "http://mlsys.org/api/miniconf/users/27588?format=json", "institution": "The Hong Kong University of Science and Technology"}, {"id": 27589, "fullname": "Zichen TANG", "url": "http://mlsys.org/api/miniconf/users/27589?format=json", "institution": "The Hong Kong University of Science and Technology"}, {"id": 27590, "fullname": "Junlin Huang", "url": "http://mlsys.org/api/miniconf/users/27590?format=json", "institution": "The Hong Kong University of Science and Technology"}, {"id": 27591, "fullname": "Xinglin Pan", "url": "http://mlsys.org/api/miniconf/users/27591?format=json", "institution": "The Hong Kong University of Science and Technology (Guangzhou)"}, {"id": 27592, "fullname": "Rudan Yan", "url": "http://mlsys.org/api/miniconf/users/27592?format=json", "institution": "The Hong Kong University of Science and Technology (Guangzhou)"}, {"id": 27593, "fullname": "Yuxin Wang", "url": "http://mlsys.org/api/miniconf/users/27593?format=json", "institution": "Huawei Technologies Ltd."}, {"id": 27594, "fullname": "Amelie Zhou", "url": "http://mlsys.org/api/miniconf/users/27594?format=json", "institution": null}, {"id": 27595, "fullname": "Shaohuai Shi", "url": "http://mlsys.org/api/miniconf/users/27595?format=json", "institution": "Harbin Institute of Technology, Shenzhen"}, {"id": 27596, "fullname": "Xiaowen Chu", "url": "http://mlsys.org/api/miniconf/users/27596?format=json", "institution": "Hong Kong University of Science and Technology (Guangzhou)"}, {"id": 27597, "fullname": "Bo Li", "url": "http://mlsys.org/api/miniconf/users/27597?format=json", "institution": null}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3567", "url": null, "sourceid": 56, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=cnvw0mbZQp", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 861, "modified": "2026-03-23T21:52:45.555547-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=cnvw0mbZQp", "resourcetype": "UriEventmedia"}, {"id": 954, "file": "/media/PosterPDFs/MLSys%202026/3567.png", "modified": "2026-04-26T10:01:55.367505-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 955, "file": "/media/PosterPDFs/MLSys%202026/3567-thumb.png", "modified": "2026-04-26T10:01:55.450488-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "45", "related_events": ["http://mlsys.org/api/miniconf/events/3790?format=json"], "related_events_ids": [3790]}, {"id": 3790, "uid": "9f61408e3afb633e50cdf1b20de6f466", "name": "DreamDDP: Accelerating Low-Bandwidth Geo-Distributed LLM Training with Layer-wise Partial Synchronization", "authors": [{"id": 27588, "fullname": "Zhenheng Tang", "url": "http://mlsys.org/api/miniconf/users/27588?format=json", "institution": "The Hong Kong University of Science and Technology"}, {"id": 27589, "fullname": "Zichen TANG", "url": "http://mlsys.org/api/miniconf/users/27589?format=json", "institution": "The Hong Kong University of Science and Technology"}, {"id": 27590, "fullname": "Junlin Huang", "url": "http://mlsys.org/api/miniconf/users/27590?format=json", "institution": "The Hong Kong University of Science and Technology"}, {"id": 27591, "fullname": "Xinglin Pan", "url": "http://mlsys.org/api/miniconf/users/27591?format=json", "institution": "The Hong Kong University of Science and Technology (Guangzhou)"}, {"id": 27592, "fullname": "Rudan Yan", "url": "http://mlsys.org/api/miniconf/users/27592?format=json", "institution": "The Hong Kong University of Science and Technology (Guangzhou)"}, {"id": 27593, "fullname": "Yuxin Wang", "url": "http://mlsys.org/api/miniconf/users/27593?format=json", "institution": "Huawei Technologies Ltd."}, {"id": 27594, "fullname": "Amelie Zhou", "url": "http://mlsys.org/api/miniconf/users/27594?format=json", "institution": null}, {"id": 27595, "fullname": "Shaohuai Shi", "url": "http://mlsys.org/api/miniconf/users/27595?format=json", "institution": "Harbin Institute of Technology, Shenzhen"}, {"id": 27596, "fullname": "Xiaowen Chu", "url": "http://mlsys.org/api/miniconf/users/27596?format=json", "institution": "Hong Kong University of Science and Technology (Guangzhou)"}, {"id": 27597, "fullname": "Bo Li", "url": "http://mlsys.org/api/miniconf/users/27597?format=json", "institution": null}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Training 3", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3790", "url": null, "sourceid": -56, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T18:00:00-07:00", "endtime": "2026-05-20T18:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3695?format=json", "parent_id": 3695, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3567?format=json"], "related_events_ids": [3567]}, {"id": 3570, "uid": "735b90b4568125ed6c3f678819b6e058", "name": "ZK-APEX: ZERO-KNOWLEDGE APPROXIMATE PERSONALIZED UNLEARNING WITH EXECUTABLE PROOFS", "authors": [{"id": 25660, "fullname": "Mohammadmahdi Maheri", "url": "http://mlsys.org/api/miniconf/users/25660?format=json", "institution": "Imperial College London"}, {"id": 27602, "fullname": "Sunil Cotterill", "url": "http://mlsys.org/api/miniconf/users/27602?format=json", "institution": null}, {"id": 27603, "fullname": "Alex Davidson", "url": "http://mlsys.org/api/miniconf/users/27603?format=json", "institution": null}, {"id": 11279, "fullname": "Hamed Haddadi", "url": "http://mlsys.org/api/miniconf/users/11279?format=json", "institution": "Imperial College London"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3570", "url": null, "sourceid": 67, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=bLx6orLvQM", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 864, "modified": "2026-03-23T21:52:45.678302-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=bLx6orLvQM", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "32", "related_events": ["http://mlsys.org/api/miniconf/events/3793?format=json"], "related_events_ids": [3793]}, {"id": 3793, "uid": "735b90b4568125ed6c3f678819b6e058", "name": "ZK-APEX: ZERO-KNOWLEDGE APPROXIMATE PERSONALIZED UNLEARNING WITH EXECUTABLE PROOFS", "authors": [{"id": 25660, "fullname": "Mohammadmahdi Maheri", "url": "http://mlsys.org/api/miniconf/users/25660?format=json", "institution": "Imperial College London"}, {"id": 27602, "fullname": "Sunil Cotterill", "url": "http://mlsys.org/api/miniconf/users/27602?format=json", "institution": null}, {"id": 27603, "fullname": "Alex Davidson", "url": "http://mlsys.org/api/miniconf/users/27603?format=json", "institution": null}, {"id": 11279, "fullname": "Hamed Haddadi", "url": "http://mlsys.org/api/miniconf/users/11279?format=json", "institution": "Imperial College London"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Security and Privacy", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3793", "url": null, "sourceid": -67, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T17:15:00-07:00", "endtime": "2026-05-19T17:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3673?format=json", "parent_id": 3673, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3570?format=json"], "related_events_ids": [3570]}, {"id": 3578, "uid": "4e732ced3463d06de0ca9a15b6153677", "name": "Privatar: Scalable Privacy-preserving Multi-user VR via Secure Offloading", "authors": [{"id": 13393, "fullname": "Jianming Tong", "url": "http://mlsys.org/api/miniconf/users/13393?format=json", "institution": "Georgia Tech/Google"}, {"id": 27626, "fullname": "Hanshen Xiao", "url": "http://mlsys.org/api/miniconf/users/27626?format=json", "institution": "Purdue University"}, {"id": 27627, "fullname": "Krishna Nair", "url": "http://mlsys.org/api/miniconf/users/27627?format=json", "institution": null}, {"id": 19218, "fullname": "Hao Kang", "url": "http://mlsys.org/api/miniconf/users/19218?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27628, "fullname": "Ashish Sirasao", "url": "http://mlsys.org/api/miniconf/users/27628?format=json", "institution": "Amd inc"}, {"id": 27629, "fullname": "Ziqi Zhang", "url": "http://mlsys.org/api/miniconf/users/27629?format=json", "institution": "University of Illinois at Urbana-Champaign"}, {"id": 27630, "fullname": "G. Edward Suh", "url": "http://mlsys.org/api/miniconf/users/27630?format=json", "institution": "NVIDIA"}, {"id": 11662, "fullname": "Tushar Krishna", "url": "http://mlsys.org/api/miniconf/users/11662?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3578", "url": null, "sourceid": 26, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=WjJfnNhY65", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 872, "modified": "2026-03-23T21:52:46.003516-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=WjJfnNhY65", "resourcetype": "UriEventmedia"}, {"id": 937, "file": "/media/PosterPDFs/MLSys%202026/3578-thumb.png", "modified": "2026-04-18T00:29:59.324513-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 938, "file": "/media/PosterPDFs/MLSys%202026/3578.png", "modified": "2026-04-18T00:29:59.271739-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "30", "related_events": ["http://mlsys.org/api/miniconf/events/3801?format=json"], "related_events_ids": [3801]}, {"id": 3581, "uid": "42a0e188f5033bc65bf8d78622277c4e", "name": "A Lightweight High-Throughput Collective-Capable NoC for Large-Scale ML Accelerators", "authors": [{"id": 25644, "fullname": "Luca Colagrande", "url": "http://mlsys.org/api/miniconf/users/25644?format=json", "institution": "ETH Zurich"}, {"id": 25669, "fullname": "Lorenzo Leone", "url": "http://mlsys.org/api/miniconf/users/25669?format=json", "institution": "ETH Zurich"}, {"id": 27638, "fullname": "Chen Wu", "url": "http://mlsys.org/api/miniconf/users/27638?format=json", "institution": "ETH Zurich"}, {"id": 27639, "fullname": "Tim Fischer", "url": "http://mlsys.org/api/miniconf/users/27639?format=json", "institution": null}, {"id": 27640, "fullname": "Raphael Roth", "url": "http://mlsys.org/api/miniconf/users/27640?format=json", "institution": null}, {"id": 21010, "fullname": "Luca Benini", "url": "http://mlsys.org/api/miniconf/users/21010?format=json", "institution": "ETHZ - ETH Zurich"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3581", "url": null, "sourceid": 136, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=VDuS8N9RCx", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 875, "modified": "2026-03-23T21:52:46.121249-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=VDuS8N9RCx", "resourcetype": "UriEventmedia"}, {"id": 1071, "file": "/media/PosterPDFs/MLSys%202026/3581.png", "modified": "2026-05-15T04:18:51.847313-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1072, "file": "/media/PosterPDFs/MLSys%202026/3581-thumb.png", "modified": "2026-05-15T04:18:51.941480-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "44", "related_events": ["http://mlsys.org/api/miniconf/events/3804?format=json"], "related_events_ids": [3804]}, {"id": 3585, "uid": "19ca14e7ea6328a42e0eb13d585e4c22", "name": "AccelOpt: A Self-Improving LLM Agentic System for AI Accelerator Kernel Optimization", "authors": [{"id": 18114, "fullname": "Genghan Zhang", "url": "http://mlsys.org/api/miniconf/users/18114?format=json", "institution": "Stanford University"}, {"id": 27646, "fullname": "Shaowei Zhu", "url": "http://mlsys.org/api/miniconf/users/27646?format=json", "institution": "Amazon"}, {"id": 27647, "fullname": "Anjiang Wei", "url": "http://mlsys.org/api/miniconf/users/27647?format=json", "institution": null}, {"id": 27171, "fullname": "Zhenyu Song", "url": "http://mlsys.org/api/miniconf/users/27171?format=json", "institution": null}, {"id": 27648, "fullname": "Allen Nie", "url": "http://mlsys.org/api/miniconf/users/27648?format=json", "institution": "Google DeepMind"}, {"id": 15476, "fullname": "Zhen Jia", "url": "http://mlsys.org/api/miniconf/users/15476?format=json", "institution": "Amazon"}, {"id": 17626, "fullname": "Nandita Vijaykumar", "url": "http://mlsys.org/api/miniconf/users/17626?format=json", "institution": "Department of Computer Science, University of Toronto"}, {"id": 11990, "fullname": "Yida Wang", "url": "http://mlsys.org/api/miniconf/users/11990?format=json", "institution": "Amazon"}, {"id": 15013, "fullname": "Kunle Olukotun", "url": "http://mlsys.org/api/miniconf/users/15013?format=json", "institution": "Stanford"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3585", "url": null, "sourceid": 36, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=SBS4NJHYjZ", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 879, "modified": "2026-03-23T21:52:46.269486-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=SBS4NJHYjZ", "resourcetype": "UriEventmedia"}, {"id": 941, "file": "/media/PosterPDFs/MLSys%202026/3585.png", "modified": "2026-04-20T22:34:48.669322-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 942, "file": "/media/PosterPDFs/MLSys%202026/3585-thumb.png", "modified": "2026-04-20T22:38:27.823013-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "37", "related_events": ["http://mlsys.org/api/miniconf/events/3808?format=json"], "related_events_ids": [3808]}, {"id": 3586, "uid": "8f14e45fceea167a5a36dedd4bea2543", "name": "SuperInfer: SLO-Aware Rotary Scheduling and Memory Management for LLM Inference on Superchips", "authors": [{"id": 25942, "fullname": "Jiahuan Yu", "url": "http://mlsys.org/api/miniconf/users/25942?format=json", "institution": "University of Illinois Urbana-Champaign"}, {"id": 27649, "fullname": "Mingtao Hu", "url": "http://mlsys.org/api/miniconf/users/27649?format=json", "institution": "University of Illinois at Urbana-Champaign"}, {"id": 27650, "fullname": "Zichao Lin", "url": "http://mlsys.org/api/miniconf/users/27650?format=json", "institution": null}, {"id": 19015, "fullname": "Minjia Zhang", "url": "http://mlsys.org/api/miniconf/users/19015?format=json", "institution": "UIUC"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3586", "url": null, "sourceid": 7, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=RuslSHdIHa", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 880, "modified": "2026-03-23T21:52:46.304024-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=RuslSHdIHa", "resourcetype": "UriEventmedia"}, {"id": 1050, "file": "/media/PosterPDFs/MLSys%202026/3586.png", "modified": "2026-05-14T18:14:54.088640-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1051, "file": "/media/PosterPDFs/MLSys%202026/3586-thumb.png", "modified": "2026-05-14T18:14:54.208542-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "17", "related_events": ["http://mlsys.org/api/miniconf/events/3809?format=json"], "related_events_ids": [3809]}, {"id": 3591, "uid": "aab3238922bcc25a6f606eb525ffdc56", "name": "Rethinking DVFS for Mobile LLMs: Unified Energy-Aware Scheduling with CORE", "authors": [{"id": 27664, "fullname": "Zongpu Zhang", "url": "http://mlsys.org/api/miniconf/users/27664?format=json", "institution": "Purdue University"}, {"id": 27665, "fullname": "Pranab Dash", "url": "http://mlsys.org/api/miniconf/users/27665?format=json", "institution": null}, {"id": 27667, "fullname": "Qiang Xu", "url": "http://mlsys.org/api/miniconf/users/27667?format=json", "institution": "Purdue University"}, {"id": 27666, "fullname": "Y. Charlie Hu", "url": "http://mlsys.org/api/miniconf/users/27666?format=json", "institution": "Purdue University"}, {"id": 27668, "fullname": "Jian Li", "url": "http://mlsys.org/api/miniconf/users/27668?format=json", "institution": "Shanghai Jiao Tong University"}, {"id": 27669, "fullname": "Haibing Guan", "url": "http://mlsys.org/api/miniconf/users/27669?format=json", "institution": "Shanghai Jiao Tong University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3591", "url": null, "sourceid": 14, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=PSyHQ8kVUT", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 885, "modified": "2026-03-23T21:52:46.497723-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=PSyHQ8kVUT", "resourcetype": "UriEventmedia"}, {"id": 1017, "file": "/media/PosterPDFs/MLSys%202026/3591.png", "modified": "2026-05-13T20:20:03.014824-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1018, "file": "/media/PosterPDFs/MLSys%202026/3591-thumb.png", "modified": "2026-05-13T20:20:03.095857-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "17", "related_events": ["http://mlsys.org/api/miniconf/events/3814?format=json"], "related_events_ids": [3814]}, {"id": 3593, "uid": "fc490ca45c00b1249bbe3554a4fdf6fb", "name": "MorphServe: Efficient and Workload-Aware LLM Serving via Runtime Quantized Layer Swapping and KV Cache Resizing", "authors": [{"id": 27401, "fullname": "Zhaoyuan Su", "url": "http://mlsys.org/api/miniconf/users/27401?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27679, "fullname": "Zeyu Zhang", "url": "http://mlsys.org/api/miniconf/users/27679?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27403, "fullname": "Tingfeng Lan", "url": "http://mlsys.org/api/miniconf/users/27403?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27405, "fullname": "Zirui Wang", "url": "http://mlsys.org/api/miniconf/users/27405?format=json", "institution": "University of Virginia, Charlottesville"}, {"id": 27680, "fullname": "Haiying Shen", "url": "http://mlsys.org/api/miniconf/users/27680?format=json", "institution": null}, {"id": 27681, "fullname": "Juncheng Yang", "url": "http://mlsys.org/api/miniconf/users/27681?format=json", "institution": "Harvard University"}, {"id": 27406, "fullname": "Yue Cheng", "url": "http://mlsys.org/api/miniconf/users/27406?format=json", "institution": "University of Virginia, Charlottesville"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3593", "url": null, "sourceid": 65, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=PDu13oOl4G", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 887, "modified": "2026-03-23T21:52:46.576422-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=PDu13oOl4G", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "4", "related_events": ["http://mlsys.org/api/miniconf/events/3816?format=json"], "related_events_ids": [3816]}, {"id": 3799, "uid": "4c56ff4ce4aaf9573aa5dff913df997a", "name": "DriftBench: Measuring and Predicting Infrastructure Drift in LLM Serving Systems", "authors": [{"id": 25492, "fullname": "Gianluigi Vitale", "url": "http://mlsys.org/api/miniconf/users/25492?format=json", "institution": "Universitas Mercatorum"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Benchmarks and Evaluation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3799", "url": null, "sourceid": -121, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T15:30:00-07:00", "endtime": "2026-05-21T15:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3714?format=json", "parent_id": 3714, "eventmedia": [{"id": 1003, "modified": "2026-05-13T07:31:50.649250-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3799_Hct4euu.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3576?format=json"], "related_events_ids": [3576]}, {"id": 3596, "uid": "202cb962ac59075b964b07152d234b70", "name": "Beyond the Buzz: A Pragmatic Take on Inference Disaggregation", "authors": [{"id": 27700, "fullname": "Tiyasa Mitra", "url": "http://mlsys.org/api/miniconf/users/27700?format=json", "institution": "NVIDIA"}, {"id": 27701, "fullname": "Ritika Borkar", "url": "http://mlsys.org/api/miniconf/users/27701?format=json", "institution": "NVIDIA"}, {"id": 27702, "fullname": "Nidhi Bhatia", "url": "http://mlsys.org/api/miniconf/users/27702?format=json", "institution": "NVIDIA Corporation"}, {"id": 27703, "fullname": "Shivam Raj", "url": "http://mlsys.org/api/miniconf/users/27703?format=json", "institution": "NVIDIA"}, {"id": 25864, "fullname": "hongkuan zhou", "url": "http://mlsys.org/api/miniconf/users/25864?format=json", "institution": "Nvidia"}, {"id": 27704, "fullname": "Yan Ru Pei", "url": "http://mlsys.org/api/miniconf/users/27704?format=json", "institution": "NVIDIA"}, {"id": 27705, "fullname": "Vishwanath Venkatesan", "url": "http://mlsys.org/api/miniconf/users/27705?format=json", "institution": null}, {"id": 27706, "fullname": "Kyle Kranen", "url": "http://mlsys.org/api/miniconf/users/27706?format=json", "institution": "NVIDIA"}, {"id": 27707, "fullname": "Ramon Matas", "url": "http://mlsys.org/api/miniconf/users/27707?format=json", "institution": "NVIDIA"}, {"id": 18519, "fullname": "Dheevatsa Mudigere", "url": "http://mlsys.org/api/miniconf/users/18519?format=json", "institution": "NVIDIA"}, {"id": 27708, "fullname": "Ritchie Zhao", "url": "http://mlsys.org/api/miniconf/users/27708?format=json", "institution": "NVIDIA"}, {"id": 27709, "fullname": "Maximilian Golub", "url": "http://mlsys.org/api/miniconf/users/27709?format=json", "institution": "NVIDIA"}, {"id": 27710, "fullname": "Arpan Dutta", "url": "http://mlsys.org/api/miniconf/users/27710?format=json", "institution": "NVIDIA"}, {"id": 27711, "fullname": "Suresh Nambi", "url": "http://mlsys.org/api/miniconf/users/27711?format=json", "institution": null}, {"id": 27712, "fullname": "Sailaja Madduri", "url": "http://mlsys.org/api/miniconf/users/27712?format=json", "institution": "NVIDIA"}, {"id": 27713, "fullname": "Dharmesh Jani", "url": "http://mlsys.org/api/miniconf/users/27713?format=json", "institution": "NVIDIA"}, {"id": 27714, "fullname": "Brian Pharris", "url": "http://mlsys.org/api/miniconf/users/27714?format=json", "institution": "NVIDIA"}, {"id": 27715, "fullname": "Itay Neeman", "url": "http://mlsys.org/api/miniconf/users/27715?format=json", "institution": "NVIDIA"}, {"id": 27716, "fullname": "Bita Darvish Rouhani", "url": "http://mlsys.org/api/miniconf/users/27716?format=json", "institution": "NVIDIA"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3596", "url": null, "sourceid": 123, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=NqC5tcBsa0", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 890, "modified": "2026-03-23T21:52:46.684672-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=NqC5tcBsa0", "resourcetype": "UriEventmedia"}, {"id": 1053, "file": "/media/PosterPDFs/MLSys%202026/3596.png", "modified": "2026-05-14T22:20:18.934969-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1054, "file": "/media/PosterPDFs/MLSys%202026/3596-thumb.png", "modified": "2026-05-14T22:20:19.043886-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "16", "related_events": ["http://mlsys.org/api/miniconf/events/3819?format=json"], "related_events_ids": [3819]}, {"id": 3606, "uid": "73278a4a86960eeb576a8fd4c9ec6997", "name": "Hawkeye: Reproducing GPU-Level Non-Determinism", "authors": [{"id": 27770, "fullname": "Erez Badash", "url": "http://mlsys.org/api/miniconf/users/27770?format=json", "institution": null}, {"id": 27771, "fullname": "Dan Boneh", "url": "http://mlsys.org/api/miniconf/users/27771?format=json", "institution": "Stanford University"}, {"id": 27772, "fullname": "Ilan Komargodski", "url": "http://mlsys.org/api/miniconf/users/27772?format=json", "institution": null}, {"id": 27773, "fullname": "Megha Srivastava", "url": "http://mlsys.org/api/miniconf/users/27773?format=json", "institution": "Stanford University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3606", "url": null, "sourceid": 113, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=JnmgsTFQQv", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 900, "modified": "2026-03-23T21:52:47.044074-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=JnmgsTFQQv", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "27", "related_events": ["http://mlsys.org/api/miniconf/events/3829?format=json"], "related_events_ids": [3829]}, {"id": 3829, "uid": "73278a4a86960eeb576a8fd4c9ec6997", "name": "Hawkeye: Reproducing GPU-Level Non-Determinism", "authors": [{"id": 27770, "fullname": "Erez Badash", "url": "http://mlsys.org/api/miniconf/users/27770?format=json", "institution": null}, {"id": 27771, "fullname": "Dan Boneh", "url": "http://mlsys.org/api/miniconf/users/27771?format=json", "institution": "Stanford University"}, {"id": 27772, "fullname": "Ilan Komargodski", "url": "http://mlsys.org/api/miniconf/users/27772?format=json", "institution": null}, {"id": 27773, "fullname": "Megha Srivastava", "url": "http://mlsys.org/api/miniconf/users/27773?format=json", "institution": "Stanford University"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Benchmarks and Evaluation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3829", "url": null, "sourceid": -113, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T15:15:00-07:00", "endtime": "2026-05-21T15:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3714?format=json", "parent_id": 3714, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3606?format=json"], "related_events_ids": [3606]}, {"id": 3609, "uid": "c8ffe9a587b126f152ed3d89a146b445", "name": "FlashInfer-Bench: Building the Virtuous Cycle for AI-driven LLM Systems", "authors": [{"id": 17934, "fullname": "Shanli Xing", "url": "http://mlsys.org/api/miniconf/users/17934?format=json", "institution": "University of Washington"}, {"id": 27789, "fullname": "Vivian Zhai", "url": "http://mlsys.org/api/miniconf/users/27789?format=json", "institution": "Carnegie Mellon University"}, {"id": 25656, "fullname": "Alexander Jiang", "url": "http://mlsys.org/api/miniconf/users/25656?format=json", "institution": "Carnegie Mellon University"}, {"id": 23351, "fullname": "Yixin Dong", "url": "http://mlsys.org/api/miniconf/users/23351?format=json", "institution": "Carnegie Mellon University"}, {"id": 27790, "fullname": "Yong Wu", "url": "http://mlsys.org/api/miniconf/users/27790?format=json", "institution": "Nvidia"}, {"id": 12026, "fullname": "Zihao Ye", "url": "http://mlsys.org/api/miniconf/users/12026?format=json", "institution": "NVIDIA"}, {"id": 25650, "fullname": "Charlie Ruan", "url": "http://mlsys.org/api/miniconf/users/25650?format=json", "institution": null}, {"id": 28960, "fullname": "Yingyi Huang", "url": "http://mlsys.org/api/miniconf/users/28960?format=json", "institution": "NVIDIA"}, {"id": 28498, "fullname": "Yineng Zhang", "url": "http://mlsys.org/api/miniconf/users/28498?format=json", "institution": "LightSeek Foundation"}, {"id": 27791, "fullname": "Liangsheng Yin", "url": "http://mlsys.org/api/miniconf/users/27791?format=json", "institution": null}, {"id": 27792, "fullname": "Aksara Bayyapu", "url": "http://mlsys.org/api/miniconf/users/27792?format=json", "institution": null}, {"id": 11020, "fullname": "Luis Ceze", "url": "http://mlsys.org/api/miniconf/users/11020?format=json", "institution": "University of Washington and NVIDIA"}, {"id": 11984, "fullname": "Tianqi Chen", "url": "http://mlsys.org/api/miniconf/users/11984?format=json", "institution": "CMU"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3609", "url": null, "sourceid": 124, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=IyryZno8Hh", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 903, "modified": "2026-03-23T21:52:47.151524-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=IyryZno8Hh", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "14", "related_events": ["http://mlsys.org/api/miniconf/events/3832?format=json"], "related_events_ids": [3832]}, {"id": 3832, "uid": "c8ffe9a587b126f152ed3d89a146b445", "name": "FlashInfer-Bench: Building the Virtuous Cycle for AI-driven LLM Systems", "authors": [{"id": 17934, "fullname": "Shanli Xing", "url": "http://mlsys.org/api/miniconf/users/17934?format=json", "institution": "University of Washington"}, {"id": 27789, "fullname": "Vivian Zhai", "url": "http://mlsys.org/api/miniconf/users/27789?format=json", "institution": "Carnegie Mellon University"}, {"id": 25656, "fullname": "Alexander Jiang", "url": "http://mlsys.org/api/miniconf/users/25656?format=json", "institution": "Carnegie Mellon University"}, {"id": 23351, "fullname": "Yixin Dong", "url": "http://mlsys.org/api/miniconf/users/23351?format=json", "institution": "Carnegie Mellon University"}, {"id": 27790, "fullname": "Yong Wu", "url": "http://mlsys.org/api/miniconf/users/27790?format=json", "institution": "Nvidia"}, {"id": 12026, "fullname": "Zihao Ye", "url": "http://mlsys.org/api/miniconf/users/12026?format=json", "institution": "NVIDIA"}, {"id": 25650, "fullname": "Charlie Ruan", "url": "http://mlsys.org/api/miniconf/users/25650?format=json", "institution": null}, {"id": 28960, "fullname": "Yingyi Huang", "url": "http://mlsys.org/api/miniconf/users/28960?format=json", "institution": "NVIDIA"}, {"id": 28498, "fullname": "Yineng Zhang", "url": "http://mlsys.org/api/miniconf/users/28498?format=json", "institution": "LightSeek Foundation"}, {"id": 27791, "fullname": "Liangsheng Yin", "url": "http://mlsys.org/api/miniconf/users/27791?format=json", "institution": null}, {"id": 27792, "fullname": "Aksara Bayyapu", "url": "http://mlsys.org/api/miniconf/users/27792?format=json", "institution": null}, {"id": 11020, "fullname": "Luis Ceze", "url": "http://mlsys.org/api/miniconf/users/11020?format=json", "institution": "University of Washington and NVIDIA"}, {"id": 11984, "fullname": "Tianqi Chen", "url": "http://mlsys.org/api/miniconf/users/11984?format=json", "institution": "CMU"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: ML for Systems", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3832", "url": null, "sourceid": -124, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T13:30:00-07:00", "endtime": "2026-05-20T13:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3688?format=json", "parent_id": 3688, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3609?format=json"], "related_events_ids": [3609]}, {"id": 3614, "uid": "a0a080f42e6f13b3a2df133f073095dd", "name": "DisAgg: Distributed Aggregators for Efficient Secure Aggregation", "authors": [{"id": 27813, "fullname": "Haaris Mehmood", "url": "http://mlsys.org/api/miniconf/users/27813?format=json", "institution": "Samsung"}, {"id": 28523, "fullname": "Giorgos Tatsis", "url": "http://mlsys.org/api/miniconf/users/28523?format=json", "institution": "CERTH/ITI"}, {"id": 27815, "fullname": "Dimitrios Alexopoulos", "url": "http://mlsys.org/api/miniconf/users/27815?format=json", "institution": "Pragma IoT Solutions"}, {"id": 27816, "fullname": "Karthikeyan Saravanan", "url": "http://mlsys.org/api/miniconf/users/27816?format=json", "institution": "Samsung"}, {"id": 25860, "fullname": "Jie Xi", "url": "http://mlsys.org/api/miniconf/users/25860?format=json", "institution": "Samsung R&amp;D Institute UK (SRUK)"}, {"id": 27817, "fullname": "Anastasios Drosou", "url": "http://mlsys.org/api/miniconf/users/27817?format=json", "institution": null}, {"id": 27818, "fullname": "Mete Ozay", "url": "http://mlsys.org/api/miniconf/users/27818?format=json", "institution": "Samsung Research"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3614", "url": null, "sourceid": 122, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=H0BLKrOgik", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 908, "modified": "2026-03-23T21:52:47.381737-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=H0BLKrOgik", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "31", "related_events": ["http://mlsys.org/api/miniconf/events/3837?format=json"], "related_events_ids": [3837]}, {"id": 3618, "uid": "d67d8ab4f4c10bf22aa353e27879133c", "name": "CAGE: Curvature-Aware Gradient Estimation For Accurate Quantization-Aware Training", "authors": [{"id": 27826, "fullname": "Soroush Tabesh", "url": "http://mlsys.org/api/miniconf/users/27826?format=json", "institution": "Institute of Science and Technology Austria"}, {"id": 28563, "fullname": "Mher Safaryan", "url": "http://mlsys.org/api/miniconf/users/28563?format=json", "institution": "ISTA, Austria | Lancaster University, UK"}, {"id": 27828, "fullname": "Andrei Panferov", "url": "http://mlsys.org/api/miniconf/users/27828?format=json", "institution": "Institute of Science and Technology Austria"}, {"id": 27829, "fullname": "Alexandra Volkova", "url": "http://mlsys.org/api/miniconf/users/27829?format=json", "institution": null}, {"id": 27830, "fullname": "Dan Alistarh", "url": "http://mlsys.org/api/miniconf/users/27830?format=json", "institution": null}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3618", "url": null, "sourceid": 39, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=Fubm1TtWeo", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 912, "modified": "2026-03-23T21:52:47.532702-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=Fubm1TtWeo", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "38", "related_events": ["http://mlsys.org/api/miniconf/events/3841?format=json"], "related_events_ids": [3841]}, {"id": 3619, "uid": "02522a2b2726fb0a03bb19f2d8d9524d", "name": "Stream2LLM: Overlap Context Streaming and Prefill for Reduced Time-to-First-Token", "authors": [{"id": 27831, "fullname": "Rajveer Bachkaniwala", "url": "http://mlsys.org/api/miniconf/users/27831?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27832, "fullname": "Chengqi Luo", "url": "http://mlsys.org/api/miniconf/users/27832?format=json", "institution": null}, {"id": 27833, "fullname": "Richard So", "url": "http://mlsys.org/api/miniconf/users/27833?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27358, "fullname": "Divya Mahajan", "url": "http://mlsys.org/api/miniconf/users/27358?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27834, "fullname": "Kexin Rong", "url": "http://mlsys.org/api/miniconf/users/27834?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3619", "url": null, "sourceid": 134, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=FuRo7Ur5Ib", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 913, "modified": "2026-03-23T21:52:47.584624-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=FuRo7Ur5Ib", "resourcetype": "UriEventmedia"}, {"id": 1005, "file": "/media/PosterPDFs/MLSys%202026/3619.png", "modified": "2026-05-13T12:56:32.117668-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1006, "file": "/media/PosterPDFs/MLSys%202026/3619-thumb.png", "modified": "2026-05-17T18:12:44.475012-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "16", "related_events": ["http://mlsys.org/api/miniconf/events/3842?format=json"], "related_events_ids": [3842]}, {"id": 3621, "uid": "1afa34a7f984eeabdbb0a7d494132ee5", "name": "OPKV: A High-Throughput Plugin-Driven Framework for Recallable Sparsity in Paged KV Cache Systems", "authors": [{"id": 27839, "fullname": "Huazheng Lao", "url": "http://mlsys.org/api/miniconf/users/27839?format=json", "institution": "Southeast University"}, {"id": 25856, "fullname": "Xiaofeng Li", "url": "http://mlsys.org/api/miniconf/users/25856?format=json", "institution": "Southeast University"}, {"id": 25589, "fullname": "Rui Xu", "url": "http://mlsys.org/api/miniconf/users/25589?format=json", "institution": ""}, {"id": 25641, "fullname": "Long Chen", "url": "http://mlsys.org/api/miniconf/users/25641?format=json", "institution": "Southeast University"}, {"id": 27840, "fullname": "Xia Zhu", "url": "http://mlsys.org/api/miniconf/users/27840?format=json", "institution": "Southeast University"}, {"id": 27841, "fullname": "Jinquan Zhang", "url": "http://mlsys.org/api/miniconf/users/27841?format=json", "institution": null}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3621", "url": null, "sourceid": 131, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=EB5bgzv4qA", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 915, "modified": "2026-03-23T21:52:47.660267-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=EB5bgzv4qA", "resourcetype": "UriEventmedia"}, {"id": 1082, "file": "/media/PosterPDFs/MLSys%202026/3621.png", "modified": "2026-05-15T09:28:27.078496-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1083, "file": "/media/PosterPDFs/MLSys%202026/3621-thumb.png", "modified": "2026-05-15T09:28:27.183398-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "15", "related_events": ["http://mlsys.org/api/miniconf/events/3844?format=json"], "related_events_ids": [3844]}, {"id": 3629, "uid": "33e75ff09dd601bbe69f351039152189", "name": "Dataflow Is All You Need", "authors": [{"id": 27864, "fullname": "Darshan Gandhi", "url": "http://mlsys.org/api/miniconf/users/27864?format=json", "institution": "Sambanova Systems"}, {"id": 27865, "fullname": "Pushkar Nandkar", "url": "http://mlsys.org/api/miniconf/users/27865?format=json", "institution": "Sambanova Systems"}, {"id": 27866, "fullname": "David Koeplinger", "url": "http://mlsys.org/api/miniconf/users/27866?format=json", "institution": "SambaNova"}, {"id": 25920, "fullname": "Nasim Farahini", "url": "http://mlsys.org/api/miniconf/users/25920?format=json", "institution": null}, {"id": 27166, "fullname": "Romy Tsoupidi", "url": "http://mlsys.org/api/miniconf/users/27166?format=json", "institution": "Sambanova Systems"}, {"id": 27867, "fullname": "Samuel Rydh", "url": "http://mlsys.org/api/miniconf/users/27867?format=json", "institution": null}, {"id": 27868, "fullname": "Matheen Musaddiq", "url": "http://mlsys.org/api/miniconf/users/27868?format=json", "institution": null}, {"id": 18777, "fullname": "Tuowen Zhao", "url": "http://mlsys.org/api/miniconf/users/18777?format=json", "institution": "SambaNova Systems, Inc."}, {"id": 27869, "fullname": "Reid Goodbar", "url": "http://mlsys.org/api/miniconf/users/27869?format=json", "institution": "SambaNova Systems"}, {"id": 27870, "fullname": "Nathan Sheeley", "url": "http://mlsys.org/api/miniconf/users/27870?format=json", "institution": null}, {"id": 27871, "fullname": "Leon Zhang", "url": "http://mlsys.org/api/miniconf/users/27871?format=json", "institution": "Sambanova Systems"}, {"id": 27872, "fullname": "Matthew Shaffer", "url": "http://mlsys.org/api/miniconf/users/27872?format=json", "institution": null}, {"id": 27873, "fullname": "John Long", "url": "http://mlsys.org/api/miniconf/users/27873?format=json", "institution": "Sambanova Systems"}, {"id": 27167, "fullname": "Han Wang", "url": "http://mlsys.org/api/miniconf/users/27167?format=json", "institution": "SambaNova"}, {"id": 27874, "fullname": "Angela Wang", "url": "http://mlsys.org/api/miniconf/users/27874?format=json", "institution": null}, {"id": 27875, "fullname": "Arjun Sabnis", "url": "http://mlsys.org/api/miniconf/users/27875?format=json", "institution": null}, {"id": 27876, "fullname": "Joshua Brot", "url": "http://mlsys.org/api/miniconf/users/27876?format=json", "institution": null}, {"id": 18774, "fullname": "Yun Du", "url": "http://mlsys.org/api/miniconf/users/18774?format=json", "institution": null}, {"id": 27877, "fullname": "H\u00e5kan Zeffer", "url": "http://mlsys.org/api/miniconf/users/27877?format=json", "institution": "SambaNova Systems, Inc"}, {"id": 27878, "fullname": "Mingran Wang", "url": "http://mlsys.org/api/miniconf/users/27878?format=json", "institution": null}, {"id": 27879, "fullname": "Raghu Prabhakar", "url": "http://mlsys.org/api/miniconf/users/27879?format=json", "institution": "Sambanova Systems Inc"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3629", "url": null, "sourceid": 28, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=7wOOhxkuN8", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 923, "modified": "2026-03-23T21:52:47.993911-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=7wOOhxkuN8", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "45", "related_events": ["http://mlsys.org/api/miniconf/events/3852?format=json"], "related_events_ids": [3852]}, {"id": 3852, "uid": "33e75ff09dd601bbe69f351039152189", "name": "Dataflow Is All You Need", "authors": [{"id": 27864, "fullname": "Darshan Gandhi", "url": "http://mlsys.org/api/miniconf/users/27864?format=json", "institution": "Sambanova Systems"}, {"id": 27865, "fullname": "Pushkar Nandkar", "url": "http://mlsys.org/api/miniconf/users/27865?format=json", "institution": "Sambanova Systems"}, {"id": 27866, "fullname": "David Koeplinger", "url": "http://mlsys.org/api/miniconf/users/27866?format=json", "institution": "SambaNova"}, {"id": 25920, "fullname": "Nasim Farahini", "url": "http://mlsys.org/api/miniconf/users/25920?format=json", "institution": null}, {"id": 27166, "fullname": "Romy Tsoupidi", "url": "http://mlsys.org/api/miniconf/users/27166?format=json", "institution": "Sambanova Systems"}, {"id": 27867, "fullname": "Samuel Rydh", "url": "http://mlsys.org/api/miniconf/users/27867?format=json", "institution": null}, {"id": 27868, "fullname": "Matheen Musaddiq", "url": "http://mlsys.org/api/miniconf/users/27868?format=json", "institution": null}, {"id": 18777, "fullname": "Tuowen Zhao", "url": "http://mlsys.org/api/miniconf/users/18777?format=json", "institution": "SambaNova Systems, Inc."}, {"id": 27869, "fullname": "Reid Goodbar", "url": "http://mlsys.org/api/miniconf/users/27869?format=json", "institution": "SambaNova Systems"}, {"id": 27870, "fullname": "Nathan Sheeley", "url": "http://mlsys.org/api/miniconf/users/27870?format=json", "institution": null}, {"id": 27871, "fullname": "Leon Zhang", "url": "http://mlsys.org/api/miniconf/users/27871?format=json", "institution": "Sambanova Systems"}, {"id": 27872, "fullname": "Matthew Shaffer", "url": "http://mlsys.org/api/miniconf/users/27872?format=json", "institution": null}, {"id": 27873, "fullname": "John Long", "url": "http://mlsys.org/api/miniconf/users/27873?format=json", "institution": "Sambanova Systems"}, {"id": 27167, "fullname": "Han Wang", "url": "http://mlsys.org/api/miniconf/users/27167?format=json", "institution": "SambaNova"}, {"id": 27874, "fullname": "Angela Wang", "url": "http://mlsys.org/api/miniconf/users/27874?format=json", "institution": null}, {"id": 27875, "fullname": "Arjun Sabnis", "url": "http://mlsys.org/api/miniconf/users/27875?format=json", "institution": null}, {"id": 27876, "fullname": "Joshua Brot", "url": "http://mlsys.org/api/miniconf/users/27876?format=json", "institution": null}, {"id": 18774, "fullname": "Yun Du", "url": "http://mlsys.org/api/miniconf/users/18774?format=json", "institution": null}, {"id": 27877, "fullname": "H\u00e5kan Zeffer", "url": "http://mlsys.org/api/miniconf/users/27877?format=json", "institution": "SambaNova Systems, Inc"}, {"id": 27878, "fullname": "Mingran Wang", "url": "http://mlsys.org/api/miniconf/users/27878?format=json", "institution": null}, {"id": 27879, "fullname": "Raghu Prabhakar", "url": "http://mlsys.org/api/miniconf/users/27879?format=json", "institution": "Sambanova Systems Inc"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Compilers/HW", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3852", "url": null, "sourceid": -28, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-22T08:15:00-07:00", "endtime": "2026-05-22T08:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3721?format=json", "parent_id": 3721, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3629?format=json"], "related_events_ids": [3629]}, {"id": 3631, "uid": "d82c8d1619ad8176d665453cfb2e55f0", "name": "BLASST: Dynamic BLocked Attention Sparsity via Softmax Thresholding", "authors": [{"id": 27887, "fullname": "Jiayi Yuan", "url": "http://mlsys.org/api/miniconf/users/27887?format=json", "institution": "Rice University"}, {"id": 15623, "fullname": "Cameron Shinn", "url": "http://mlsys.org/api/miniconf/users/15623?format=json", "institution": "University of California, Davis"}, {"id": 27888, "fullname": "Kai Xu", "url": "http://mlsys.org/api/miniconf/users/27888?format=json", "institution": "NVIDIA"}, {"id": 27889, "fullname": "Jingze Cui", "url": "http://mlsys.org/api/miniconf/users/27889?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 27890, "fullname": "George Klimiashvili", "url": "http://mlsys.org/api/miniconf/users/27890?format=json", "institution": "NVIDIA"}, {"id": 27891, "fullname": "Guangxuan Xiao", "url": "http://mlsys.org/api/miniconf/users/27891?format=json", "institution": null}, {"id": 27892, "fullname": "Perkz Zheng", "url": "http://mlsys.org/api/miniconf/users/27892?format=json", "institution": "NVIDIA"}, {"id": 27893, "fullname": "Bo Li", "url": "http://mlsys.org/api/miniconf/users/27893?format=json", "institution": "NVIDIA"}, {"id": 27894, "fullname": "Zhou Yuxin", "url": "http://mlsys.org/api/miniconf/users/27894?format=json", "institution": "NVIDIA"}, {"id": 27895, "fullname": "Zhouhai Ye", "url": "http://mlsys.org/api/miniconf/users/27895?format=json", "institution": "NVIDIA"}, {"id": 27896, "fullname": "Weijie You", "url": "http://mlsys.org/api/miniconf/users/27896?format=json", "institution": "NVIDIA"}, {"id": 28473, "fullname": "Tian Zheng", "url": "http://mlsys.org/api/miniconf/users/28473?format=json", "institution": "NVIDIA"}, {"id": 28474, "fullname": "Dominic Brown", "url": "http://mlsys.org/api/miniconf/users/28474?format=json", "institution": "NVIDIA"}, {"id": 28475, "fullname": "Pengbo Wang", "url": "http://mlsys.org/api/miniconf/users/28475?format=json", "institution": "NVIDIA"}, {"id": 27339, "fullname": "Markus Hoehnerbach", "url": "http://mlsys.org/api/miniconf/users/27339?format=json", "institution": "Meta"}, {"id": 27897, "fullname": "Richard Cai", "url": "http://mlsys.org/api/miniconf/users/27897?format=json", "institution": "NVIDIA"}, {"id": 27898, "fullname": "Julien Demouth", "url": "http://mlsys.org/api/miniconf/users/27898?format=json", "institution": "University of Lorraine"}, {"id": 27899, "fullname": "John D. Owens", "url": "http://mlsys.org/api/miniconf/users/27899?format=json", "institution": "UC Davis"}, {"id": 27900, "fullname": "Xia Hu", "url": "http://mlsys.org/api/miniconf/users/27900?format=json", "institution": "Shanghai Artificial Intelligence Laboratory"}, {"id": 27901, "fullname": "Song Han", "url": "http://mlsys.org/api/miniconf/users/27901?format=json", "institution": null}, {"id": 25625, "fullname": "Timmy Liu", "url": "http://mlsys.org/api/miniconf/users/25625?format=json", "institution": "Nvidia"}, {"id": 12477, "fullname": "Huizi Mao", "url": "http://mlsys.org/api/miniconf/users/12477?format=json", "institution": "Stanford University"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3631", "url": null, "sourceid": 53, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=6INSBXTQ4x", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 925, "modified": "2026-03-23T21:52:48.064377-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=6INSBXTQ4x", "resourcetype": "UriEventmedia"}, {"id": 1122, "file": "/media/PosterPDFs/MLSys%202026/3631.png", "modified": "2026-05-18T19:31:06.682929-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1123, "file": "/media/PosterPDFs/MLSys%202026/3631-thumb.png", "modified": "2026-05-15T18:29:16.974829-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "3", "related_events": ["http://mlsys.org/api/miniconf/events/3854?format=json"], "related_events_ids": [3854]}, {"id": 3634, "uid": "9fc3d7152ba9336a670e36d0ed79bc43", "name": "SONAR: Benchmarking Topology and Collaboration in Decentralized Learning", "authors": [{"id": 27911, "fullname": "Joyce Yuan", "url": "http://mlsys.org/api/miniconf/users/27911?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 28279, "fullname": "Yichuan Shi", "url": "http://mlsys.org/api/miniconf/users/28279?format=json", "institution": "MIT"}, {"id": 27913, "fullname": "Abhishek Singh", "url": "http://mlsys.org/api/miniconf/users/27913?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 28968, "fullname": "Rishi Sharma", "url": "http://mlsys.org/api/miniconf/users/28968?format=json", "institution": "Microsoft"}, {"id": 27915, "fullname": "Ramesh Raskar", "url": "http://mlsys.org/api/miniconf/users/27915?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 27916, "fullname": "Jonas Blanc", "url": "http://mlsys.org/api/miniconf/users/27916?format=json", "institution": null}, {"id": 27917, "fullname": "Martin Jaggi", "url": "http://mlsys.org/api/miniconf/users/27917?format=json", "institution": "EPFL"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 1 & Opening Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3634", "url": "https://github.com/aidecentralized/sonar", "sourceid": 133, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=4Bqg7Xyk5t", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3676?format=json", "parent_id": 3676, "eventmedia": [{"id": 928, "modified": "2026-03-23T21:52:48.197417-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=4Bqg7Xyk5t", "resourcetype": "UriEventmedia"}, {"id": 1023, "file": "/media/PosterPDFs/MLSys%202026/3634.png", "modified": "2026-05-13T23:29:45.662025-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1024, "file": "/media/PosterPDFs/MLSys%202026/3634-thumb.png", "modified": "2026-05-13T23:29:45.769632-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "25", "related_events": ["http://mlsys.org/api/miniconf/events/3857?format=json"], "related_events_ids": [3857]}, {"id": 3857, "uid": "9fc3d7152ba9336a670e36d0ed79bc43", "name": "SONAR: Benchmarking Topology and Collaboration in Decentralized Learning", "authors": [{"id": 27911, "fullname": "Joyce Yuan", "url": "http://mlsys.org/api/miniconf/users/27911?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 28279, "fullname": "Yichuan Shi", "url": "http://mlsys.org/api/miniconf/users/28279?format=json", "institution": "MIT"}, {"id": 27913, "fullname": "Abhishek Singh", "url": "http://mlsys.org/api/miniconf/users/27913?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 28968, "fullname": "Rishi Sharma", "url": "http://mlsys.org/api/miniconf/users/28968?format=json", "institution": "Microsoft"}, {"id": 27915, "fullname": "Ramesh Raskar", "url": "http://mlsys.org/api/miniconf/users/27915?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 27916, "fullname": "Jonas Blanc", "url": "http://mlsys.org/api/miniconf/users/27916?format=json", "institution": null}, {"id": 27917, "fullname": "Martin Jaggi", "url": "http://mlsys.org/api/miniconf/users/27917?format=json", "institution": "EPFL"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Federated Learning", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3857", "url": null, "sourceid": -133, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T16:30:00-07:00", "endtime": "2026-05-19T16:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3672?format=json", "parent_id": 3672, "eventmedia": [{"id": 1025, "modified": "2026-05-14T00:47:16.131130-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3857.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3634?format=json"], "related_events_ids": [3634]}, {"id": 3858, "uid": "28dd2c7955ce926456240b2ff0100bde", "name": "AXLearn: Modular, Hardware-Agnostic Large Model Training", "authors": [{"id": 27168, "fullname": "Mark Lee", "url": "http://mlsys.org/api/miniconf/users/27168?format=json", "institution": "Meta"}, {"id": 25935, "fullname": "Chang Lan", "url": "http://mlsys.org/api/miniconf/users/25935?format=json", "institution": ""}, {"id": 27918, "fullname": "Tom Gunter", "url": "http://mlsys.org/api/miniconf/users/27918?format=json", "institution": "Apple"}, {"id": 28476, "fullname": "John Peebles", "url": "http://mlsys.org/api/miniconf/users/28476?format=json", "institution": "Apple"}, {"id": 28477, "fullname": "Hanzhi Zhou", "url": "http://mlsys.org/api/miniconf/users/28477?format=json", "institution": "OpenAI"}, {"id": 27921, "fullname": "Xuan Zou", "url": "http://mlsys.org/api/miniconf/users/27921?format=json", "institution": null}, {"id": 27922, "fullname": "Sneha Bangalore", "url": "http://mlsys.org/api/miniconf/users/27922?format=json", "institution": ""}, {"id": 27923, "fullname": "Chung-Cheng Chiu", "url": "http://mlsys.org/api/miniconf/users/27923?format=json", "institution": null}, {"id": 27924, "fullname": "Nan Du", "url": "http://mlsys.org/api/miniconf/users/27924?format=json", "institution": null}, {"id": 27925, "fullname": "Xianzhi Du", "url": "http://mlsys.org/api/miniconf/users/27925?format=json", "institution": "Apple"}, {"id": 27926, "fullname": "Philipp Dufter", "url": "http://mlsys.org/api/miniconf/users/27926?format=json", "institution": "Apple"}, {"id": 27927, "fullname": "Liang He", "url": "http://mlsys.org/api/miniconf/users/27927?format=json", "institution": null}, {"id": 27928, "fullname": "Ruixuan Hou", "url": "http://mlsys.org/api/miniconf/users/27928?format=json", "institution": "Apple Inc"}, {"id": 27929, "fullname": "Haoshuo Huang", "url": "http://mlsys.org/api/miniconf/users/27929?format=json", "institution": "Apple"}, {"id": 27930, "fullname": "Dongseong Hwang", "url": "http://mlsys.org/api/miniconf/users/27930?format=json", "institution": null}, {"id": 27931, "fullname": "Xiang Kong", "url": "http://mlsys.org/api/miniconf/users/27931?format=json", "institution": "Apple"}, {"id": 27932, "fullname": "Jinhao Lei", "url": "http://mlsys.org/api/miniconf/users/27932?format=json", "institution": ", Columbia University"}, {"id": 27933, "fullname": "Tao Lei", "url": "http://mlsys.org/api/miniconf/users/27933?format=json", "institution": "Apple"}, {"id": 27934, "fullname": "Meng Li", "url": "http://mlsys.org/api/miniconf/users/27934?format=json", "institution": "Apple"}, {"id": 15067, "fullname": "Li Li", "url": "http://mlsys.org/api/miniconf/users/15067?format=json", "institution": "Apple"}, {"id": 27935, "fullname": "Jiarui Lu", "url": "http://mlsys.org/api/miniconf/users/27935?format=json", "institution": "Apple"}, {"id": 27936, "fullname": "Zhiyun Lu", "url": "http://mlsys.org/api/miniconf/users/27936?format=json", "institution": "Apple"}, {"id": 27937, "fullname": "Yiping Ma", "url": "http://mlsys.org/api/miniconf/users/27937?format=json", "institution": null}, {"id": 27938, "fullname": "David Qiu", "url": "http://mlsys.org/api/miniconf/users/27938?format=json", "institution": null}, {"id": 27939, "fullname": "Vivek Rathod", "url": "http://mlsys.org/api/miniconf/users/27939?format=json", "institution": null}, {"id": 27940, "fullname": "Senyu Tong", "url": "http://mlsys.org/api/miniconf/users/27940?format=json", "institution": null}, {"id": 27941, "fullname": "Zhucheng Tu", "url": "http://mlsys.org/api/miniconf/users/27941?format=json", "institution": "Apple"}, {"id": 27942, "fullname": "Chong Wang", "url": "http://mlsys.org/api/miniconf/users/27942?format=json", "institution": "Meta"}, {"id": 27943, "fullname": "Jianyu Wang", "url": "http://mlsys.org/api/miniconf/users/27943?format=json", "institution": "Apple"}, {"id": 27944, "fullname": "Yongqiang Wang", "url": "http://mlsys.org/api/miniconf/users/27944?format=json", "institution": null}, {"id": 27945, "fullname": "Zirui Wang", "url": "http://mlsys.org/api/miniconf/users/27945?format=json", "institution": "Google Deepmind"}, {"id": 27946, "fullname": "Floris Weers", "url": "http://mlsys.org/api/miniconf/users/27946?format=json", "institution": null}, {"id": 27947, "fullname": "Sam Wiseman", "url": "http://mlsys.org/api/miniconf/users/27947?format=json", "institution": "Apple"}, {"id": 27948, "fullname": "Guoli Yin", "url": "http://mlsys.org/api/miniconf/users/27948?format=json", "institution": "Apple"}, {"id": 27949, "fullname": "Bowen Zhang", "url": "http://mlsys.org/api/miniconf/users/27949?format=json", "institution": null}, {"id": 12530, "fullname": "Xiyou Zhou", "url": "http://mlsys.org/api/miniconf/users/12530?format=json", "institution": "Apple"}, {"id": 17608, "fullname": "Danyang Zhuo", "url": "http://mlsys.org/api/miniconf/users/17608?format=json", "institution": "Duke University"}, {"id": 27950, "fullname": "Cheng Leong", "url": "http://mlsys.org/api/miniconf/users/27950?format=json", "institution": null}, {"id": 27951, "fullname": "Ruoming Pang", "url": "http://mlsys.org/api/miniconf/users/27951?format=json", "institution": "OpenAI"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: LLM Training 4", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3858", "url": null, "sourceid": -77, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T15:15:00-07:00", "endtime": "2026-05-21T15:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3713?format=json", "parent_id": 3713, "eventmedia": [{"id": 1220, "modified": "2026-05-21T11:05:40.608338-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3858_Pfx0B13.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3635?format=json"], "related_events_ids": [3635]}, {"id": 3592, "uid": "07e1cd7dca89a1678042477183b7ac3f", "name": "Event Tensor: A Unified Abstraction for Compiling Dynamic Megakernel", "authors": [{"id": 16930, "fullname": "Hongyi Jin", "url": "http://mlsys.org/api/miniconf/users/16930?format=json", "institution": "Carnegie Mellon University"}, {"id": 15229, "fullname": "Bohan Hou", "url": "http://mlsys.org/api/miniconf/users/15229?format=json", "institution": "Carnegie Mellon University"}, {"id": 27670, "fullname": "Guanjie Wang", "url": "http://mlsys.org/api/miniconf/users/27670?format=json", "institution": "Shanghai Jiaotong University"}, {"id": 16412, "fullname": "Ruihang Lai", "url": "http://mlsys.org/api/miniconf/users/16412?format=json", "institution": "Carnegie Mellon University"}, {"id": 27671, "fullname": "Jinqi Chen", "url": "http://mlsys.org/api/miniconf/users/27671?format=json", "institution": "School of Computer Science, Carnegie Mellon University"}, {"id": 12026, "fullname": "Zihao Ye", "url": "http://mlsys.org/api/miniconf/users/12026?format=json", "institution": "NVIDIA"}, {"id": 20904, "fullname": "Yaxing Cai", "url": "http://mlsys.org/api/miniconf/users/20904?format=json", "institution": "NVIDIA"}, {"id": 23351, "fullname": "Yixin Dong", "url": "http://mlsys.org/api/miniconf/users/23351?format=json", "institution": "Carnegie Mellon University"}, {"id": 27672, "fullname": "Xinhao Cheng", "url": "http://mlsys.org/api/miniconf/users/27672?format=json", "institution": "Carnegie Mellon University"}, {"id": 25596, "fullname": "Zhihao Zhang", "url": "http://mlsys.org/api/miniconf/users/25596?format=json", "institution": "Carnegie Mellon University"}, {"id": 20906, "fullname": "Yilong Zhao", "url": "http://mlsys.org/api/miniconf/users/20906?format=json", "institution": "University of California, Berkeley"}, {"id": 28960, "fullname": "Yingyi Huang", "url": "http://mlsys.org/api/miniconf/users/28960?format=json", "institution": "NVIDIA"}, {"id": 27674, "fullname": "Lijie Yang", "url": "http://mlsys.org/api/miniconf/users/27674?format=json", "institution": "Princeton University"}, {"id": 27675, "fullname": "Jinchen Jiang", "url": "http://mlsys.org/api/miniconf/users/27675?format=json", "institution": "Tsinghua University"}, {"id": 27676, "fullname": "Gabriele Oliaro", "url": "http://mlsys.org/api/miniconf/users/27676?format=json", "institution": "Carnegie Mellon University"}, {"id": 27677, "fullname": "Jianan Ji", "url": "http://mlsys.org/api/miniconf/users/27677?format=json", "institution": null}, {"id": 27678, "fullname": "Xupeng Miao", "url": "http://mlsys.org/api/miniconf/users/27678?format=json", "institution": "Purdue University"}, {"id": 12410, "fullname": "Vinod Grover", "url": "http://mlsys.org/api/miniconf/users/12410?format=json", "institution": "NVIDIA"}, {"id": 12052, "fullname": "Todd Mowry", "url": "http://mlsys.org/api/miniconf/users/12052?format=json", "institution": "Carnegie Mellon University"}, {"id": 16147, "fullname": "Zhihao Jia", "url": "http://mlsys.org/api/miniconf/users/16147?format=json", "institution": "Carnegie Mellon University and LithosAI"}, {"id": 11984, "fullname": "Tianqi Chen", "url": "http://mlsys.org/api/miniconf/users/11984?format=json", "institution": "CMU"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3592", "url": null, "sourceid": 119, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=PJqFhAbUHa", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 886, "modified": "2026-03-23T21:52:46.536288-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=PJqFhAbUHa", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "35", "related_events": ["http://mlsys.org/api/miniconf/events/3815?format=json"], "related_events_ids": [3815]}, {"id": 3541, "uid": "fbd7939d674997cdb4692d34de8633c4", "name": "Demystifying the Mixture of Experts Serving Tax", "authors": [{"id": 14926, "fullname": "Pratyush Patel", "url": "http://mlsys.org/api/miniconf/users/14926?format=json", "institution": "University of Washington"}, {"id": 28479, "fullname": "Dayeol Lee", "url": "http://mlsys.org/api/miniconf/users/28479?format=json", "institution": "Meta"}, {"id": 28480, "fullname": "Shintaro Iwasaki", "url": "http://mlsys.org/api/miniconf/users/28480?format=json", "institution": null}, {"id": 11122, "fullname": "Arvind Krishnamurthy", "url": "http://mlsys.org/api/miniconf/users/11122?format=json", "institution": "University of Washington"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 2", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3541", "url": null, "sourceid": 76, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=lELxqcgrsN", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3697?format=json", "parent_id": 3697, "eventmedia": [{"id": 835, "modified": "2026-03-23T21:52:44.457499-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=lELxqcgrsN", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "30", "related_events": ["http://mlsys.org/api/miniconf/events/3764?format=json"], "related_events_ids": [3764]}, {"id": 3764, "uid": "fbd7939d674997cdb4692d34de8633c4", "name": "Demystifying the Mixture of Experts Serving Tax", "authors": [{"id": 14926, "fullname": "Pratyush Patel", "url": "http://mlsys.org/api/miniconf/users/14926?format=json", "institution": "University of Washington"}, {"id": 28479, "fullname": "Dayeol Lee", "url": "http://mlsys.org/api/miniconf/users/28479?format=json", "institution": "Meta"}, {"id": 28480, "fullname": "Shintaro Iwasaki", "url": "http://mlsys.org/api/miniconf/users/28480?format=json", "institution": null}, {"id": 11122, "fullname": "Arvind Krishnamurthy", "url": "http://mlsys.org/api/miniconf/users/11122?format=json", "institution": "University of Washington"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 4", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3764", "url": null, "sourceid": -76, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-20T15:45:00-07:00", "endtime": "2026-05-20T16:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3691?format=json", "parent_id": 3691, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3541?format=json"], "related_events_ids": [3541]}, {"id": 3542, "uid": "3c59dc048e8850243be8079a5c74d079", "name": "Cost-aware Duration Prediction for Software Upgrades in Datacenters", "authors": [{"id": 27360, "fullname": "Yi Ding", "url": "http://mlsys.org/api/miniconf/users/27360?format=json", "institution": "Purdue University"}, {"id": 28481, "fullname": "Aijia Gao", "url": "http://mlsys.org/api/miniconf/users/28481?format=json", "institution": "Meta Platforms Inc"}, {"id": 28482, "fullname": "Thibaud Ryden", "url": "http://mlsys.org/api/miniconf/users/28482?format=json", "institution": null}, {"id": 28483, "fullname": "Michal Sedlak", "url": "http://mlsys.org/api/miniconf/users/28483?format=json", "institution": ""}, {"id": 28484, "fullname": "Essam Ewaisha", "url": "http://mlsys.org/api/miniconf/users/28484?format=json", "institution": null}, {"id": 28485, "fullname": "Igor Marnat", "url": "http://mlsys.org/api/miniconf/users/28485?format=json", "institution": ""}, {"id": 14772, "fullname": "Henry (Hank) Hoffmann", "url": "http://mlsys.org/api/miniconf/users/14772?format=json", "institution": "The University of Chicago"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3542", "url": null, "sourceid": 21, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=l72e5oROLT", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 836, "modified": "2026-03-23T21:52:44.495969-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=l72e5oROLT", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "7", "related_events": ["http://mlsys.org/api/miniconf/events/3765?format=json"], "related_events_ids": [3765]}, {"id": 3765, "uid": "3c59dc048e8850243be8079a5c74d079", "name": "Cost-aware Duration Prediction for Software Upgrades in Datacenters", "authors": [{"id": 27360, "fullname": "Yi Ding", "url": "http://mlsys.org/api/miniconf/users/27360?format=json", "institution": "Purdue University"}, {"id": 28481, "fullname": "Aijia Gao", "url": "http://mlsys.org/api/miniconf/users/28481?format=json", "institution": "Meta Platforms Inc"}, {"id": 28482, "fullname": "Thibaud Ryden", "url": "http://mlsys.org/api/miniconf/users/28482?format=json", "institution": null}, {"id": 28483, "fullname": "Michal Sedlak", "url": "http://mlsys.org/api/miniconf/users/28483?format=json", "institution": ""}, {"id": 28484, "fullname": "Essam Ewaisha", "url": "http://mlsys.org/api/miniconf/users/28484?format=json", "institution": null}, {"id": 28485, "fullname": "Igor Marnat", "url": "http://mlsys.org/api/miniconf/users/28485?format=json", "institution": ""}, {"id": 14772, "fullname": "Henry (Hank) Hoffmann", "url": "http://mlsys.org/api/miniconf/users/14772?format=json", "institution": "The University of Chicago"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Agentic AI/MLSys", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3765", "url": null, "sourceid": -21, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T09:15:00-07:00", "endtime": "2026-05-21T09:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3700?format=json", "parent_id": 3700, "eventmedia": [{"id": 1158, "modified": "2026-05-16T05:37:35.010361-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3765.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3542?format=json"], "related_events_ids": [3542]}, {"id": 3594, "uid": "e2ef524fbf3d9fe611d5a8e90fefdc9c", "name": "Agentic Operator Generation for ML ASICs", "authors": [{"id": 27682, "fullname": "Alec Hammond", "url": "http://mlsys.org/api/miniconf/users/27682?format=json", "institution": "Meta"}, {"id": 27683, "fullname": "Aram Markosyan", "url": "http://mlsys.org/api/miniconf/users/27683?format=json", "institution": "Facebook"}, {"id": 27684, "fullname": "Aman Dontula", "url": "http://mlsys.org/api/miniconf/users/27684?format=json", "institution": "Meta"}, {"id": 27685, "fullname": "Simon Mahns", "url": "http://mlsys.org/api/miniconf/users/27685?format=json", "institution": null}, {"id": 27686, "fullname": "Zacharias Fisches", "url": "http://mlsys.org/api/miniconf/users/27686?format=json", "institution": "Facebook"}, {"id": 27687, "fullname": "Dmitrii Pedchenko", "url": "http://mlsys.org/api/miniconf/users/27687?format=json", "institution": "Meta FAIR"}, {"id": 27688, "fullname": "Keyur Muzumdar", "url": "http://mlsys.org/api/miniconf/users/27688?format=json", "institution": "Meta (FAIR)"}, {"id": 27689, "fullname": "Natacha Supper", "url": "http://mlsys.org/api/miniconf/users/27689?format=json", "institution": null}, {"id": 28493, "fullname": "Site Cao", "url": "http://mlsys.org/api/miniconf/users/28493?format=json", "institution": "Meta"}, {"id": 28494, "fullname": "Haishan Zhu", "url": "http://mlsys.org/api/miniconf/users/28494?format=json", "institution": null}, {"id": 27690, "fullname": "Mark Saroufim", "url": "http://mlsys.org/api/miniconf/users/27690?format=json", "institution": "Core Automation"}, {"id": 28495, "fullname": "Joe Isaacson", "url": "http://mlsys.org/api/miniconf/users/28495?format=json", "institution": "Meta"}, {"id": 27692, "fullname": "Laura Wang", "url": "http://mlsys.org/api/miniconf/users/27692?format=json", "institution": ""}, {"id": 27693, "fullname": "Warren Hunt", "url": "http://mlsys.org/api/miniconf/users/27693?format=json", "institution": "Facebook"}, {"id": 27694, "fullname": "Kaustubh Gondkar", "url": "http://mlsys.org/api/miniconf/users/27694?format=json", "institution": null}, {"id": 27695, "fullname": "Roman Levenstein", "url": "http://mlsys.org/api/miniconf/users/27695?format=json", "institution": null}, {"id": 27696, "fullname": "Gabriel Synnaeve", "url": "http://mlsys.org/api/miniconf/users/27696?format=json", "institution": "Meta"}, {"id": 27697, "fullname": "Richard Li", "url": "http://mlsys.org/api/miniconf/users/27697?format=json", "institution": null}, {"id": 27698, "fullname": "Jacob Kahn", "url": "http://mlsys.org/api/miniconf/users/27698?format=json", "institution": "FAIR, Meta AI"}, {"id": 27527, "fullname": "Ajit Mathews", "url": "http://mlsys.org/api/miniconf/users/27527?format=json", "institution": null}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3594", "url": null, "sourceid": 97, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=O3Bx0nNGnW", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 888, "modified": "2026-03-23T21:52:46.615166-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=O3Bx0nNGnW", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "5", "related_events": ["http://mlsys.org/api/miniconf/events/3817?format=json"], "related_events_ids": [3817]}, {"id": 3817, "uid": "e2ef524fbf3d9fe611d5a8e90fefdc9c", "name": "Agentic Operator Generation for ML ASICs", "authors": [{"id": 27682, "fullname": "Alec Hammond", "url": "http://mlsys.org/api/miniconf/users/27682?format=json", "institution": "Meta"}, {"id": 27683, "fullname": "Aram Markosyan", "url": "http://mlsys.org/api/miniconf/users/27683?format=json", "institution": "Facebook"}, {"id": 27684, "fullname": "Aman Dontula", "url": "http://mlsys.org/api/miniconf/users/27684?format=json", "institution": "Meta"}, {"id": 27685, "fullname": "Simon Mahns", "url": "http://mlsys.org/api/miniconf/users/27685?format=json", "institution": null}, {"id": 27686, "fullname": "Zacharias Fisches", "url": "http://mlsys.org/api/miniconf/users/27686?format=json", "institution": "Facebook"}, {"id": 27687, "fullname": "Dmitrii Pedchenko", "url": "http://mlsys.org/api/miniconf/users/27687?format=json", "institution": "Meta FAIR"}, {"id": 27688, "fullname": "Keyur Muzumdar", "url": "http://mlsys.org/api/miniconf/users/27688?format=json", "institution": "Meta (FAIR)"}, {"id": 27689, "fullname": "Natacha Supper", "url": "http://mlsys.org/api/miniconf/users/27689?format=json", "institution": null}, {"id": 28493, "fullname": "Site Cao", "url": "http://mlsys.org/api/miniconf/users/28493?format=json", "institution": "Meta"}, {"id": 28494, "fullname": "Haishan Zhu", "url": "http://mlsys.org/api/miniconf/users/28494?format=json", "institution": null}, {"id": 27690, "fullname": "Mark Saroufim", "url": "http://mlsys.org/api/miniconf/users/27690?format=json", "institution": "Core Automation"}, {"id": 28495, "fullname": "Joe Isaacson", "url": "http://mlsys.org/api/miniconf/users/28495?format=json", "institution": "Meta"}, {"id": 27692, "fullname": "Laura Wang", "url": "http://mlsys.org/api/miniconf/users/27692?format=json", "institution": ""}, {"id": 27693, "fullname": "Warren Hunt", "url": "http://mlsys.org/api/miniconf/users/27693?format=json", "institution": "Facebook"}, {"id": 27694, "fullname": "Kaustubh Gondkar", "url": "http://mlsys.org/api/miniconf/users/27694?format=json", "institution": null}, {"id": 27695, "fullname": "Roman Levenstein", "url": "http://mlsys.org/api/miniconf/users/27695?format=json", "institution": null}, {"id": 27696, "fullname": "Gabriel Synnaeve", "url": "http://mlsys.org/api/miniconf/users/27696?format=json", "institution": "Meta"}, {"id": 27697, "fullname": "Richard Li", "url": "http://mlsys.org/api/miniconf/users/27697?format=json", "institution": null}, {"id": 27698, "fullname": "Jacob Kahn", "url": "http://mlsys.org/api/miniconf/users/27698?format=json", "institution": "FAIR, Meta AI"}, {"id": 27527, "fullname": "Ajit Mathews", "url": "http://mlsys.org/api/miniconf/users/27527?format=json", "institution": null}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Agentic AI/MLSys", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3817", "url": null, "sourceid": -97, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T09:00:00-07:00", "endtime": "2026-05-21T09:15:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3700?format=json", "parent_id": 3700, "eventmedia": [{"id": 1046, "modified": "2026-05-14T12:27:17.078892-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3817.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3594?format=json"], "related_events_ids": [3594]}, {"id": 3611, "uid": "7647966b7343c29048673252e490f736", "name": "SHIP: SRAM-Based Huge Inference Pipelines for Fast LLM Serving", "authors": [{"id": 28469, "fullname": "Andrew Bitar", "url": "http://mlsys.org/api/miniconf/users/28469?format=json", "institution": "NVIDIA"}, {"id": 28499, "fullname": "Aravind Vayalapra", "url": "http://mlsys.org/api/miniconf/users/28499?format=json", "institution": null}, {"id": 28500, "fullname": "Baorui Zhou", "url": "http://mlsys.org/api/miniconf/users/28500?format=json", "institution": "Nvidia"}, {"id": 28501, "fullname": "Matthew Boyd", "url": "http://mlsys.org/api/miniconf/users/28501?format=json", "institution": "NVIDIA"}, {"id": 28502, "fullname": "Charlie Wang", "url": "http://mlsys.org/api/miniconf/users/28502?format=json", "institution": "Nvidia"}, {"id": 28503, "fullname": "Sahil Parmar", "url": "http://mlsys.org/api/miniconf/users/28503?format=json", "institution": null}, {"id": 28470, "fullname": "Eugene Sha", "url": "http://mlsys.org/api/miniconf/users/28470?format=json", "institution": "NVIDIA"}, {"id": 28504, "fullname": "Gautam Rayaprolu", "url": "http://mlsys.org/api/miniconf/users/28504?format=json", "institution": null}, {"id": 28505, "fullname": "Peter Hicks", "url": "http://mlsys.org/api/miniconf/users/28505?format=json", "institution": null}, {"id": 28506, "fullname": "Alex Bowe", "url": "http://mlsys.org/api/miniconf/users/28506?format=json", "institution": "NVIDIA"}, {"id": 28507, "fullname": "Roberto DiCecco", "url": "http://mlsys.org/api/miniconf/users/28507?format=json", "institution": null}, {"id": 28508, "fullname": "Santosh Raghavan", "url": "http://mlsys.org/api/miniconf/users/28508?format=json", "institution": "NVIDIA"}, {"id": 28509, "fullname": "Evan Patrick", "url": "http://mlsys.org/api/miniconf/users/28509?format=json", "institution": null}, {"id": 28510, "fullname": "Josip Smolcic", "url": "http://mlsys.org/api/miniconf/users/28510?format=json", "institution": null}, {"id": 28511, "fullname": "David Han", "url": "http://mlsys.org/api/miniconf/users/28511?format=json", "institution": null}, {"id": 28512, "fullname": "Kris Kang", "url": "http://mlsys.org/api/miniconf/users/28512?format=json", "institution": "Nvidia"}, {"id": 28513, "fullname": "Andy Rock", "url": "http://mlsys.org/api/miniconf/users/28513?format=json", "institution": null}, {"id": 28514, "fullname": "Josh Hay", "url": "http://mlsys.org/api/miniconf/users/28514?format=json", "institution": null}, {"id": 28515, "fullname": "Mohamed Eldafrawy", "url": "http://mlsys.org/api/miniconf/users/28515?format=json", "institution": "Nvidia"}, {"id": 28516, "fullname": "Mikhail Kandel", "url": "http://mlsys.org/api/miniconf/users/28516?format=json", "institution": null}, {"id": 28517, "fullname": "Daulet Zhanguzin", "url": "http://mlsys.org/api/miniconf/users/28517?format=json", "institution": null}, {"id": 28518, "fullname": "Omar Kilani", "url": "http://mlsys.org/api/miniconf/users/28518?format=json", "institution": null}, {"id": 28519, "fullname": "Liming Gong", "url": "http://mlsys.org/api/miniconf/users/28519?format=json", "institution": null}, {"id": 28520, "fullname": "Andrew Paprotskyi", "url": "http://mlsys.org/api/miniconf/users/28520?format=json", "institution": ""}, {"id": 28521, "fullname": "Arash Taheri-Dezfouli", "url": "http://mlsys.org/api/miniconf/users/28521?format=json", "institution": "Nvidia"}, {"id": 28522, "fullname": "Josh Fender", "url": "http://mlsys.org/api/miniconf/users/28522?format=json", "institution": null}, {"id": 28471, "fullname": "Andrew Ling", "url": "http://mlsys.org/api/miniconf/users/28471?format=json", "institution": "University of Toronto"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3611", "url": null, "sourceid": 89, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=IZaXDwDtL1", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 905, "modified": "2026-03-23T21:52:47.224690-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=IZaXDwDtL1", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "12", "related_events": ["http://mlsys.org/api/miniconf/events/3834?format=json"], "related_events_ids": [3834]}, {"id": 3639, "uid": "a684eceee76fc522773286a895bc8436", "name": "Sparing Strategies to Minimize Reliability Impact On Large Training Jobs", "authors": [{"id": 27967, "fullname": "Kevin Quirk", "url": "http://mlsys.org/api/miniconf/users/27967?format=json", "institution": null}, {"id": 27968, "fullname": "Matthew Lennie", "url": "http://mlsys.org/api/miniconf/users/27968?format=json", "institution": null}, {"id": 27969, "fullname": "Ehsan K. Ardestani", "url": "http://mlsys.org/api/miniconf/users/27969?format=json", "institution": "Meta"}, {"id": 27970, "fullname": "Satyajeet Ahuja", "url": "http://mlsys.org/api/miniconf/users/27970?format=json", "institution": null}, {"id": 27971, "fullname": "Matthew Bergeron", "url": "http://mlsys.org/api/miniconf/users/27971?format=json", "institution": null}, {"id": 27972, "fullname": "Andrew Grier", "url": "http://mlsys.org/api/miniconf/users/27972?format=json", "institution": null}, {"id": 27973, "fullname": "Zhaodong Wang", "url": "http://mlsys.org/api/miniconf/users/27973?format=json", "institution": "Facebook"}, {"id": 27974, "fullname": "Mustafa Ozdal", "url": "http://mlsys.org/api/miniconf/users/27974?format=json", "institution": null}, {"id": 27975, "fullname": "Xu Zhang", "url": "http://mlsys.org/api/miniconf/users/27975?format=json", "institution": "Meta Platforms"}, {"id": 27976, "fullname": "Abhinav Triguna", "url": "http://mlsys.org/api/miniconf/users/27976?format=json", "institution": null}, {"id": 27977, "fullname": "Ying Zhang", "url": "http://mlsys.org/api/miniconf/users/27977?format=json", "institution": "University of Michigan - Ann Arbor"}, {"id": 28524, "fullname": "Mathew Oldham", "url": "http://mlsys.org/api/miniconf/users/28524?format=json", "institution": null}, {"id": 28959, "fullname": "Chunqiang Tang", "url": "http://mlsys.org/api/miniconf/users/28959?format=json", "institution": "Facebook"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3639", "url": null, "sourceid": 54, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=18jPgte2tM", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 933, "modified": "2026-03-23T21:52:48.414812-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=18jPgte2tM", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "22", "related_events": ["http://mlsys.org/api/miniconf/events/3862?format=json"], "related_events_ids": [3862]}, {"id": 3534, "uid": "a5771bce93e200c36f7cd9dfd0e5deaa", "name": "ApproxMLIR : Accuracy-Aware Compiler for Compound ML System", "authors": [{"id": 27335, "fullname": "Hao Ren", "url": "http://mlsys.org/api/miniconf/users/27335?format=json", "institution": "University of Illinois Urbana-Champaign"}, {"id": 27336, "fullname": "Yi Mu", "url": "http://mlsys.org/api/miniconf/users/27336?format=json", "institution": "University of Illinois at Urbana-Champaign"}, {"id": 16274, "fullname": "Sasa Misailovic", "url": "http://mlsys.org/api/miniconf/users/16274?format=json", "institution": "UIUC"}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3534", "url": null, "sourceid": 38, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=nKm25GWbuB", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 828, "modified": "2026-03-23T21:52:44.161765-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=nKm25GWbuB", "resourcetype": "UriEventmedia"}, {"id": 1120, "file": "/media/PosterPDFs/MLSys%202026/3534.png", "modified": "2026-05-15T17:34:01.477533-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "41", "related_events": ["http://mlsys.org/api/miniconf/events/3757?format=json"], "related_events_ids": [3757]}, {"id": 3535, "uid": "ad61ab143223efbc24c7d2583be69251", "name": "SAKURAONE: An Open Ethernet\u2013Based AI HPC System and Its Observed Workload Dynamics in a Single-Tenant LLM Development Environment", "authors": [{"id": 27145, "fullname": "Fumikazu KONISHI", "url": "http://mlsys.org/api/miniconf/users/27145?format=json", "institution": "SAKURA internet inc."}, {"id": 26137, "fullname": "Yuuki Tsubouchi", "url": "http://mlsys.org/api/miniconf/users/26137?format=json", "institution": "SAKURA internet Inc."}, {"id": 25979, "fullname": "Hirofumi Tsuruta", "url": "http://mlsys.org/api/miniconf/users/25979?format=json", "institution": "SAKURA internet Inc."}], "topic": null, "keywords": [], "decision": "Conditional Accept", "session": "Poster Session 3", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/3535", "url": null, "sourceid": 74, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "https://openreview.net/forum?id=n7o6C3p3wk", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3719?format=json", "parent_id": 3719, "eventmedia": [{"id": 829, "modified": "2026-03-23T21:52:44.206854-07:00", "display_section": 1, "type": "URL", "name": "OpenReview", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "https://openreview.net/forum?id=n7o6C3p3wk", "resourcetype": "UriEventmedia"}, {"id": 987, "file": "/media/PosterPDFs/MLSys%202026/3535.png", "modified": "2026-05-10T22:48:39.826672-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 988, "file": "/media/PosterPDFs/MLSys%202026/3535-thumb.png", "modified": "2026-05-10T22:55:37.380512-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "38", "related_events": ["http://mlsys.org/api/miniconf/events/3758?format=json"], "related_events_ids": [3758]}, {"id": 3842, "uid": "02522a2b2726fb0a03bb19f2d8d9524d", "name": "Stream2LLM: Overlap Context Streaming and Prefill for Reduced Time-to-First-Token", "authors": [{"id": 27831, "fullname": "Rajveer Bachkaniwala", "url": "http://mlsys.org/api/miniconf/users/27831?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27832, "fullname": "Chengqi Luo", "url": "http://mlsys.org/api/miniconf/users/27832?format=json", "institution": null}, {"id": 27833, "fullname": "Richard So", "url": "http://mlsys.org/api/miniconf/users/27833?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27358, "fullname": "Divya Mahajan", "url": "http://mlsys.org/api/miniconf/users/27358?format=json", "institution": "Georgia Institute of Technology"}, {"id": 27834, "fullname": "Kexin Rong", "url": "http://mlsys.org/api/miniconf/users/27834?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: LLM Serving 1", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3842", "url": null, "sourceid": -134, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T14:45:00-07:00", "endtime": "2026-05-19T15:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3675?format=json", "parent_id": 3675, "eventmedia": [{"id": 1047, "modified": "2026-05-14T12:32:22.996857-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3842.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3619?format=json"], "related_events_ids": [3619]}, {"id": 3802, "uid": "eb160de1de89d9058fcb0b968dbbbd68", "name": "Efficient, VRAM-Constrained xLM Inference on Clients", "authors": [{"id": 27156, "fullname": "Aditya Ukarande", "url": "http://mlsys.org/api/miniconf/users/27156?format=json", "institution": "Nvidia"}, {"id": 27631, "fullname": "Deep Shekhar", "url": "http://mlsys.org/api/miniconf/users/27631?format=json", "institution": "Nvidia"}, {"id": 27632, "fullname": "Marc Blackstein", "url": "http://mlsys.org/api/miniconf/users/27632?format=json", "institution": null}, {"id": 27157, "fullname": "Ram Rangan", "url": "http://mlsys.org/api/miniconf/users/27157?format=json", "institution": "NVIDIA"}], "topic": null, "keywords": [], "decision": null, "session": "Industry Track Oral Presentation: Compilers/HW", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3802", "url": "https://github.com/deepshnv/pipeshard-mlsys26-ae", "sourceid": -117, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-22T08:30:00-07:00", "endtime": "2026-05-22T08:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3721?format=json", "parent_id": 3721, "eventmedia": [{"id": 1164, "modified": "2026-05-16T15:25:21.013776-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3802.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3579?format=json"], "related_events_ids": [3579]}, {"id": 3839, "uid": "65b9eea6e1cc6bb9f0cd2a47751a186f", "name": "REPARO: LOSS-RESILIENT GENERATIVE CODEC FOR VIDEO CONFERENCING", "authors": [{"id": 27821, "fullname": "Tianhong Li", "url": "http://mlsys.org/api/miniconf/users/27821?format=json", "institution": "Meta"}, {"id": 27822, "fullname": "Vibhaalakshmi Sivaraman", "url": "http://mlsys.org/api/miniconf/users/27822?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 27823, "fullname": "Pantea Karimi", "url": "http://mlsys.org/api/miniconf/users/27823?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 27824, "fullname": "Lijie Fan", "url": "http://mlsys.org/api/miniconf/users/27824?format=json", "institution": "Google DeepMind"}, {"id": 12450, "fullname": "Mohammad Alizadeh", "url": "http://mlsys.org/api/miniconf/users/12450?format=json", "institution": "MIT CSAIL"}, {"id": 13201, "fullname": "Dina Katabi", "url": "http://mlsys.org/api/miniconf/users/13201?format=json", "institution": "MIT"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Efficient ML", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3839", "url": null, "sourceid": -105, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-21T13:30:00-07:00", "endtime": "2026-05-21T13:45:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3710?format=json", "parent_id": 3710, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3616?format=json"], "related_events_ids": [3616]}, {"id": 3797, "uid": "a87ff679a2f3e71d9181a67b7542122c", "name": "Spira: Exploiting Voxel Data Structural Properties for Efficient Sparse Convolution in Point Cloud Networks", "authors": [{"id": 28464, "fullname": "Dionysios Adamopoulos", "url": "http://mlsys.org/api/miniconf/users/28464?format=json", "institution": "National Technical University of Athens"}, {"id": 27614, "fullname": "Anastasia Poulopoulou", "url": "http://mlsys.org/api/miniconf/users/27614?format=json", "institution": ""}, {"id": 27615, "fullname": "Georgios Goumas", "url": "http://mlsys.org/api/miniconf/users/27615?format=json", "institution": "National Technical University of Athens"}, {"id": 16879, "fullname": "Christina Giannoula", "url": "http://mlsys.org/api/miniconf/users/16879?format=json", "institution": "Max Planck Institute for Software Systems (MPI-SWS)"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Efficient Computation", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3797", "url": "https://github.com/SPIN-Research-Group/Spira", "sourceid": -4, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-22T08:15:00-07:00", "endtime": "2026-05-22T08:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3722?format=json", "parent_id": 3722, "eventmedia": [{"id": 1036, "modified": "2026-05-14T08:05:03.604631-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3797.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3574?format=json"], "related_events_ids": [3574]}, {"id": 3837, "uid": "a0a080f42e6f13b3a2df133f073095dd", "name": "DisAgg: Distributed Aggregators for Efficient Secure Aggregation", "authors": [{"id": 27813, "fullname": "Haaris Mehmood", "url": "http://mlsys.org/api/miniconf/users/27813?format=json", "institution": "Samsung"}, {"id": 28523, "fullname": "Giorgos Tatsis", "url": "http://mlsys.org/api/miniconf/users/28523?format=json", "institution": "CERTH/ITI"}, {"id": 27815, "fullname": "Dimitrios Alexopoulos", "url": "http://mlsys.org/api/miniconf/users/27815?format=json", "institution": "Pragma IoT Solutions"}, {"id": 27816, "fullname": "Karthikeyan Saravanan", "url": "http://mlsys.org/api/miniconf/users/27816?format=json", "institution": "Samsung"}, {"id": 25860, "fullname": "Jie Xi", "url": "http://mlsys.org/api/miniconf/users/25860?format=json", "institution": "Samsung R&amp;D Institute UK (SRUK)"}, {"id": 27817, "fullname": "Anastasios Drosou", "url": "http://mlsys.org/api/miniconf/users/27817?format=json", "institution": null}, {"id": 27818, "fullname": "Mete Ozay", "url": "http://mlsys.org/api/miniconf/users/27818?format=json", "institution": "Samsung Research"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Federated Learning", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3837", "url": null, "sourceid": -122, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T17:15:00-07:00", "endtime": "2026-05-19T17:30:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3672?format=json", "parent_id": 3672, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3614?format=json"], "related_events_ids": [3614]}, {"id": 3812, "uid": "6c8349cc7260ae62e3b1396831a8398f", "name": "CSLE: A Reinforcement Learning Platform for Autonomous Security Management", "authors": [{"id": 27661, "fullname": "Kim Hammar", "url": "http://mlsys.org/api/miniconf/users/27661?format=json", "institution": "University of Melbourne"}], "topic": null, "keywords": [], "decision": null, "session": "Research Track Oral Presentation: Security and Privacy", "eventtype": "Oral", "event_type": "Oral", "room_name": null, "virtualsite_url": "/virtual/2026/oral/3812", "url": null, "sourceid": -45, "sourceurl": "https://openreview.net/group?id=MLSys.org/2026/Conference", "starttime": "2026-05-19T16:45:00-07:00", "endtime": "2026-05-19T17:00:00-07:00", "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3673?format=json", "parent_id": 3673, "eventmedia": [{"id": 971, "modified": "2026-05-18T11:54:46.381490-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/3812_EZJ5vJH.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": null, "related_events": ["http://mlsys.org/api/miniconf/events/3589?format=json"], "related_events_ids": [3589]}, {"id": 10200, "uid": "", "name": "ForeCache: Understanding Workloads and Optimizing KVCache Management for Efficiently Serving LLM Coding Agents", "authors": [{"id": 29299, "fullname": "Shubham Tiwari", "url": "http://mlsys.org/api/miniconf/users/29299?format=json", "institution": "University of Washington"}, {"id": 29309, "fullname": "Tapan Chugh", "url": "http://mlsys.org/api/miniconf/users/29309?format=json", "institution": "University of Washington"}, {"id": 29310, "fullname": "Nash Rickert", "url": "http://mlsys.org/api/miniconf/users/29310?format=json", "institution": "University of Washington"}, {"id": 29311, "fullname": "Simon Peter", "url": "http://mlsys.org/api/miniconf/users/29311?format=json", "institution": "University of Washington"}, {"id": 28327, "fullname": "Ratul Mahajan", "url": "http://mlsys.org/api/miniconf/users/28327?format=json", "institution": "University of Washington"}, {"id": 27680, "fullname": "Haiying Shen", "url": "http://mlsys.org/api/miniconf/users/27680?format=json", "institution": null}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10200", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "4", "related_events": [], "related_events_ids": []}, {"id": 10198, "uid": "", "name": "Flexo: A User-Controllable Distributed Training System", "authors": [{"id": 28558, "fullname": "Megan Frisella", "url": "http://mlsys.org/api/miniconf/users/28558?format=json", "institution": "University of Washington"}, {"id": 29299, "fullname": "Shubham Tiwari", "url": "http://mlsys.org/api/miniconf/users/29299?format=json", "institution": "University of Washington"}, {"id": 29300, "fullname": "Parker Gustafson", "url": "http://mlsys.org/api/miniconf/users/29300?format=json", "institution": "University of Washington"}, {"id": 29301, "fullname": "Andy Ruan", "url": "http://mlsys.org/api/miniconf/users/29301?format=json", "institution": "University of Washington"}, {"id": 29302, "fullname": "Yi Pan", "url": "http://mlsys.org/api/miniconf/users/29302?format=json", "institution": "University of Washington and Shanghai jiaotong University"}, {"id": 29303, "fullname": "Mathew Jacob", "url": "http://mlsys.org/api/miniconf/users/29303?format=json", "institution": "University of Washington"}, {"id": 29304, "fullname": "Gilbert Bernstein", "url": "http://mlsys.org/api/miniconf/users/29304?format=json", "institution": "University of Washington"}, {"id": 17972, "fullname": "Stephanie Wang", "url": "http://mlsys.org/api/miniconf/users/17972?format=json", "institution": "UW &amp; Anyscale"}, {"id": 29305, "fullname": "Parker Gustafson", "url": "http://mlsys.org/api/miniconf/users/29305?format=json", "institution": "University of Washington"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10198", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "6", "related_events": [], "related_events_ids": []}, {"id": 10196, "uid": "", "name": "A Framework for Evaluating Neural Network Deployability on Analog In-Memory Computing Hardware", "authors": [{"id": 28531, "fullname": "Apuroop Mutyala", "url": "http://mlsys.org/api/miniconf/users/28531?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10196", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "8", "related_events": [], "related_events_ids": []}, {"id": 10192, "uid": "", "name": "Neuro-Analog", "authors": [{"id": 28531, "fullname": "Apuroop Mutyala", "url": "http://mlsys.org/api/miniconf/users/28531?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10192", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "12", "related_events": [], "related_events_ids": []}, {"id": 10201, "uid": "", "name": "Speciesism in the Assistant Axis: Probing Compassion Vectors in Post-Trained LLMs", "authors": [{"id": 29312, "fullname": "Shubham Gupta", "url": "http://mlsys.org/api/miniconf/users/29312?format=json", "institution": ""}, {"id": 29313, "fullname": "Jasmine Brazilek", "url": "http://mlsys.org/api/miniconf/users/29313?format=json", "institution": "CaML"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10201", "url": "https://shubham.is/compassion-axis", "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [{"id": 1250, "file": "/media/PosterPDFs/MLSys%202026/10201.png", "modified": "2026-06-07T10:18:09.649520-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "3", "related_events": [], "related_events_ids": []}, {"id": 10180, "uid": "", "name": "Communication-Efficient Distributed Inference for Transformer Models via Vector Quantized Context", "authors": [{"id": 29277, "fullname": "Xiao Liu", "url": "http://mlsys.org/api/miniconf/users/29277?format=json", "institution": "UMass Amherst"}, {"id": 29278, "fullname": "Lijun Zhang", "url": "http://mlsys.org/api/miniconf/users/29278?format=json", "institution": "Amazon"}, {"id": 29279, "fullname": "Deepak Ganesan", "url": "http://mlsys.org/api/miniconf/users/29279?format=json", "institution": "UMass Amherst"}, {"id": 11878, "fullname": "Hui Guan", "url": "http://mlsys.org/api/miniconf/users/11878?format=json", "institution": "University of Massachusetts, Amherst; Amazon"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10180", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "24", "related_events": [], "related_events_ids": []}, {"id": 10167, "uid": "", "name": "Equinox: Decentralized Scheduling for Hardware-aware Satellite Intelligence", "authors": [{"id": 27599, "fullname": "Ansel Erol", "url": "http://mlsys.org/api/miniconf/users/27599?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10167", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [{"id": 1212, "file": "/media/PosterPDFs/MLSys%202026/10167-thumb.png", "modified": "2026-05-18T13:15:49.830767-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1213, "file": "/media/PosterPDFs/MLSys%202026/10167.png", "modified": "2026-05-18T13:24:45.757286-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1211, "modified": "2026-05-18T13:14:08.531404-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/10167.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "37", "related_events": [], "related_events_ids": []}, {"id": 10199, "uid": "", "name": "SD-HC: Heterogeneous Functional Pipelining for Speculative LLM Decoding on AI PCs", "authors": [{"id": 29306, "fullname": "Xikai(Noah) Meng", "url": "http://mlsys.org/api/miniconf/users/29306?format=json", "institution": "University of Washington"}, {"id": 29307, "fullname": "Chao Li", "url": "http://mlsys.org/api/miniconf/users/29307?format=json", "institution": null}, {"id": 29308, "fullname": "Spandan Tiwari", "url": "http://mlsys.org/api/miniconf/users/29308?format=json", "institution": "AMD"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10199", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "5", "related_events": [], "related_events_ids": []}, {"id": 10176, "uid": "", "name": "Leveraging ASIC AI Chips for Homomorphic Encryption", "authors": [{"id": 13393, "fullname": "Jianming Tong", "url": "http://mlsys.org/api/miniconf/users/13393?format=json", "institution": "Georgia Tech/Google"}, {"id": 29261, "fullname": "Tianhao Huang", "url": "http://mlsys.org/api/miniconf/users/29261?format=json", "institution": "Massachusetts Institute of Technology"}, {"id": 29262, "fullname": "Jingtian Dang", "url": "http://mlsys.org/api/miniconf/users/29262?format=json", "institution": "Georgia Tech"}, {"id": 29263, "fullname": "Leo de Castro", "url": "http://mlsys.org/api/miniconf/users/29263?format=json", "institution": "MIT"}, {"id": 29264, "fullname": "Anirudh Itagi", "url": "http://mlsys.org/api/miniconf/users/29264?format=json", "institution": "Georgia Institute of Technology"}, {"id": 29265, "fullname": "Anupam Golder", "url": "http://mlsys.org/api/miniconf/users/29265?format=json", "institution": "Georgia Institute of Technology"}, {"id": 29266, "fullname": "Asra Ali", "url": "http://mlsys.org/api/miniconf/users/29266?format=json", "institution": "Google"}, {"id": 29267, "fullname": "Jevin Jiang", "url": "http://mlsys.org/api/miniconf/users/29267?format=json", "institution": "Google"}, {"id": 29268, "fullname": "Jeremy Kun", "url": "http://mlsys.org/api/miniconf/users/29268?format=json", "institution": "Google"}, {"id": 29269, "fullname": "Arvind Arvind", "url": "http://mlsys.org/api/miniconf/users/29269?format=json", "institution": "MIT"}, {"id": 29270, "fullname": "G. Edward Suh", "url": "http://mlsys.org/api/miniconf/users/29270?format=json", "institution": "NVIDIA / Cornell University"}, {"id": 11662, "fullname": "Tushar Krishna", "url": "http://mlsys.org/api/miniconf/users/11662?format=json", "institution": "Georgia Institute of Technology"}, {"id": 29271, "fullname": "Tianhao Huang", "url": "http://mlsys.org/api/miniconf/users/29271?format=json", "institution": "Meta Platforms, Inc."}, {"id": 29272, "fullname": "Jeremy Kun", "url": "http://mlsys.org/api/miniconf/users/29272?format=json", "institution": "Google"}, {"id": 29273, "fullname": "Jingtian Dang", "url": "http://mlsys.org/api/miniconf/users/29273?format=json", "institution": "Georgia Institute of Technology"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10176", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "28", "related_events": [], "related_events_ids": []}, {"id": 10170, "uid": "", "name": "Kascade: A Practical Sparse Attention Method for Long-Context LLM Inference", "authors": [{"id": 26161, "fullname": "Dhruv Rajesh Deshmukh", "url": "http://mlsys.org/api/miniconf/users/26161?format=json", "institution": "Microsoft Research India"}, {"id": 29254, "fullname": "SAURABH GOYAL", "url": "http://mlsys.org/api/miniconf/users/29254?format=json", "institution": "Microsoft Research India"}, {"id": 29255, "fullname": "NIPUN KWATRA", "url": "http://mlsys.org/api/miniconf/users/29255?format=json", "institution": "Microsoft Research India"}, {"id": 16198, "fullname": "Ramachandran Ramjee", "url": "http://mlsys.org/api/miniconf/users/16198?format=json", "institution": "Microsoft Research"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10170", "url": "https://github.com/microsoft/kascade/tree/vllm_integration", "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [{"id": 1216, "file": "/media/PosterPDFs/MLSys%202026/10170.png", "modified": "2026-05-18T13:42:00.219466-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1217, "file": "/media/PosterPDFs/MLSys%202026/10170-thumb.png", "modified": "2026-05-18T13:42:00.296811-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "34", "related_events": [], "related_events_ids": []}, {"id": 10175, "uid": "", "name": "Shortcut-connected Expert Parallelism for Accelerating Mixture of Experts", "authors": [{"id": 25944, "fullname": "Weilin Cai", "url": "http://mlsys.org/api/miniconf/users/25944?format=json", "institution": "The Hong Kong University of Science and Technology (Guangzhou)"}, {"id": 29259, "fullname": "Le Qin", "url": "http://mlsys.org/api/miniconf/users/29259?format=json", "institution": "The Hong Kong University of Science and Technology (Guangzhou)"}, {"id": 29260, "fullname": "Junwei Cui", "url": "http://mlsys.org/api/miniconf/users/29260?format=json", "institution": "The Hong Kong University of Science and Technology (Guangzhou)"}, {"id": 19049, "fullname": "Jiayi Huang", "url": "http://mlsys.org/api/miniconf/users/19049?format=json", "institution": "HKUST(GZ)"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10175", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "29", "related_events": [], "related_events_ids": []}, {"id": 10188, "uid": "", "name": "LYNX: Workload-Agnostic Expert Remapping for Efficient MoE Inference", "authors": [{"id": 29294, "fullname": "Vima Gupta", "url": "http://mlsys.org/api/miniconf/users/29294?format=json", "institution": "Georgia Tech"}, {"id": 28020, "fullname": "Vima Gupta", "url": "http://mlsys.org/api/miniconf/users/28020?format=json", "institution": "Georgia Institute Of Technology"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10188", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "16", "related_events": [], "related_events_ids": []}, {"id": 10173, "uid": "", "name": "NeSyKV: Neuro-Symbolic Architecture-Specific KV-Cache Eviction for LLM Inference", "authors": [{"id": 16621, "fullname": "Pratik Poudel", "url": "http://mlsys.org/api/miniconf/users/16621?format=json", "institution": "Florida International University"}, {"id": 29257, "fullname": "Jason Liu", "url": "http://mlsys.org/api/miniconf/users/29257?format=json", "institution": "Florida International University"}, {"id": 23355, "fullname": "Yanzhao Wu", "url": "http://mlsys.org/api/miniconf/users/23355?format=json", "institution": "Florida International University"}, {"id": 29258, "fullname": "Sumit Jha", "url": "http://mlsys.org/api/miniconf/users/29258?format=json", "institution": "University of Florida"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10173", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "31", "related_events": [], "related_events_ids": []}, {"id": 10197, "uid": "", "name": "From 805 ms to 23 ms: Accelerating State-Space Models for Real-Time ICU Monitoring with Fused Triton Kernels", "authors": [{"id": 29291, "fullname": "Manpreet singh", "url": "http://mlsys.org/api/miniconf/users/29291?format=json", "institution": "Embedded LLM"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10197", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "7", "related_events": [], "related_events_ids": []}, {"id": 10183, "uid": "", "name": "BioTriton: Portable Cross-Vendor GPU Kernels for High-Throughput Bioinformatics via OpenAI Triton", "authors": [{"id": 29291, "fullname": "Manpreet singh", "url": "http://mlsys.org/api/miniconf/users/29291?format=json", "institution": "Embedded LLM"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10183", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "21", "related_events": [], "related_events_ids": []}, {"id": 10182, "uid": "", "name": "REMIX: Dynamic Partitioning for Fine-Grained Heterogeneous LLM Serving", "authors": [{"id": 28718, "fullname": "Victoria Clerico", "url": "http://mlsys.org/api/miniconf/users/28718?format=json", "institution": "IBM Research"}, {"id": 29283, "fullname": "Corey Lammie", "url": "http://mlsys.org/api/miniconf/users/29283?format=json", "institution": "IBM Research - 8803 Rueschlikon, Switzerland"}, {"id": 29284, "fullname": "Garima Singh", "url": "http://mlsys.org/api/miniconf/users/29284?format=json", "institution": "IBM Research - 8803 Rueschlikon, Switzerland"}, {"id": 29285, "fullname": "Orhun G\u221a\u2202rkem", "url": "http://mlsys.org/api/miniconf/users/29285?format=json", "institution": "IBM Research - 8803 Rueschlikon, Switzerland"}, {"id": 29286, "fullname": "William Simon", "url": "http://mlsys.org/api/miniconf/users/29286?format=json", "institution": "IBM Research - 8803 Rueschlikon, Switzerland"}, {"id": 29287, "fullname": "Hsinyu Tsai", "url": "http://mlsys.org/api/miniconf/users/29287?format=json", "institution": "IBM Research - Silicon Valley, 555 Bailey Avenue, San Jose, CA, USA"}, {"id": 29288, "fullname": "Jeronimo Castrillon", "url": "http://mlsys.org/api/miniconf/users/29288?format=json", "institution": "Technische Universit\u221a\u00a7t Dresden, Dresden, Germany"}, {"id": 29289, "fullname": "Abu Sebastian", "url": "http://mlsys.org/api/miniconf/users/29289?format=json", "institution": "IBM Research - 8803 Rueschlikon, Switzerland"}, {"id": 29290, "fullname": "Hadjer Benmeziane", "url": "http://mlsys.org/api/miniconf/users/29290?format=json", "institution": "IBM Research - 8803 Rueschlikon, Switzerland"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10182", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "22", "related_events": [], "related_events_ids": []}, {"id": 10193, "uid": "", "name": "On the Diminishing Returns of Expert Load Balancing in MoE LLM Serving", "authors": [{"id": 28343, "fullname": "Hanfei Yu", "url": "http://mlsys.org/api/miniconf/users/28343?format=json", "institution": "Stevens Institute of Technology"}, {"id": 29297, "fullname": "Jinru Duan", "url": "http://mlsys.org/api/miniconf/users/29297?format=json", "institution": "Northeastern University"}, {"id": 29298, "fullname": "Jiabin Luo", "url": "http://mlsys.org/api/miniconf/users/29298?format=json", "institution": "Peking University"}, {"id": 25598, "fullname": "Hao Wang", "url": "http://mlsys.org/api/miniconf/users/25598?format=json", "institution": "Stevens Institute of Technology "}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10193", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "11", "related_events": [], "related_events_ids": []}, {"id": 10202, "uid": "", "name": "HiSpec: Hierarchical Speculative Decoding for LLMs", "authors": [{"id": 25962, "fullname": "Avinash Kumar", "url": "http://mlsys.org/api/miniconf/users/25962?format=json", "institution": "The University of Texas at Austin"}, {"id": 29314, "fullname": "Sujay Sanghavi", "url": "http://mlsys.org/api/miniconf/users/29314?format=json", "institution": "University of Texas at Austin"}, {"id": 27845, "fullname": "Poulami Das", "url": "http://mlsys.org/api/miniconf/users/27845?format=json", "institution": "University of Texas at Austin"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10202", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "2", "related_events": [], "related_events_ids": []}, {"id": 10169, "uid": "", "name": "Designing Communication-Efficient AI Systems: An Interconnect-Aware HPC Perspective", "authors": [{"id": 26178, "fullname": "Jinghan Yao", "url": "http://mlsys.org/api/miniconf/users/26178?format=json", "institution": "The Ohio State University"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10169", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "35", "related_events": [], "related_events_ids": []}, {"id": 10172, "uid": "", "name": "DriftBench: Measuring and Predicting Infrastructure Drift in LLM Serving Systems", "authors": [{"id": 25492, "fullname": "Gianluigi Vitale", "url": "http://mlsys.org/api/miniconf/users/25492?format=json", "institution": "Universitas Mercatorum"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10172", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [{"id": 1194, "file": "/media/PosterPDFs/MLSys%202026/10172.png", "modified": "2026-05-17T18:52:06.567480-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "", "generated_from": null, "resourcetype": "EventmediaImageFile"}, {"id": 1195, "file": "/media/PosterPDFs/MLSys%202026/10172-thumb.png", "modified": "2026-05-17T18:52:06.679120-07:00", "display_section": 1, "type": "Poster", "name": "Poster", "visible": false, "sortkey": 0, "is_live_content": false, "detailed_kind": "thumb", "generated_from": null, "resourcetype": "EventmediaImageFile"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "32", "related_events": [], "related_events_ids": []}, {"id": 10203, "uid": "", "name": "Impact of Scheduling for Terminal Agent Workloads on Unified-Memory Workstations", "authors": [{"id": 17796, "fullname": "Yuanli Wang", "url": "http://mlsys.org/api/miniconf/users/17796?format=json", "institution": null}, {"id": 29315, "fullname": "Vasiliki Kalavri", "url": "http://mlsys.org/api/miniconf/users/29315?format=json", "institution": "Boston University"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10203", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "1", "related_events": [], "related_events_ids": []}, {"id": 10195, "uid": "", "name": "Towards Efficient Systems for Long-Context Automatic Speech Recognition", "authors": [{"id": 29036, "fullname": "Wei-Tzu Lee", "url": "http://mlsys.org/api/miniconf/users/29036?format=json", "institution": "University of Washington"}, {"id": 26295, "fullname": "Keisuke Kamahori", "url": "http://mlsys.org/api/miniconf/users/26295?format=json", "institution": "University of Washington"}, {"id": 17670, "fullname": "Baris Kasikci", "url": "http://mlsys.org/api/miniconf/users/17670?format=json", "institution": "University of Washington"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10195", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "9", "related_events": [], "related_events_ids": []}, {"id": 10194, "uid": "", "name": "Tiered Autonomy Framework for Human\u201a\u00c4\u00ecAgent Collaboration in Mission-Critical Cyber-Physical Systems", "authors": [{"id": 28722, "fullname": "David Akokodaripon", "url": "http://mlsys.org/api/miniconf/users/28722?format=json", "institution": "Komatsu MTS"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10194", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "10", "related_events": [], "related_events_ids": []}, {"id": 10191, "uid": "", "name": "SAT-Eval: A Framework for Preference Drift in Multi-Turn LLM Conversations", "authors": [{"id": 29295, "fullname": "Suryaprakash Vengadesan", "url": "http://mlsys.org/api/miniconf/users/29295?format=json", "institution": "University of Washington"}, {"id": 29296, "fullname": "Suryaprakash Vengadesan", "url": "http://mlsys.org/api/miniconf/users/29296?format=json", "institution": "UC Berkeley"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10191", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "13", "related_events": [], "related_events_ids": []}, {"id": 10190, "uid": "", "name": "Learning-Guided Design Optimization for Lifecycle Impact Analysis", "authors": [{"id": 28030, "fullname": "Grace Magny-Fokam", "url": "http://mlsys.org/api/miniconf/users/28030?format=json", "institution": "University of Maryland"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10190", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "14", "related_events": [], "related_events_ids": []}, {"id": 10189, "uid": "", "name": "Cascade: Utility-Driven Speculative Decoding for Mixture-of-Experts", "authors": [{"id": 28019, "fullname": "Anish Saxena", "url": "http://mlsys.org/api/miniconf/users/28019?format=json", "institution": "Georgia Tech"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10189", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "15", "related_events": [], "related_events_ids": []}, {"id": 10187, "uid": "", "name": "Automated Feature Engineering -- Faster Iteration to Solve Business Problems", "authors": [{"id": 28818, "fullname": "Peter Amenewolde", "url": "http://mlsys.org/api/miniconf/users/28818?format=json", "institution": "Google Cloud"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10187", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "17", "related_events": [], "related_events_ids": []}, {"id": 10186, "uid": "", "name": "ADAPTIVE ERASURE CODING FOR FAULT-TOLERANT LLM SERVING WITH CONTINUOUS BATCHING", "authors": [{"id": 27193, "fullname": "Chinmay Dhanraj Nehate", "url": "http://mlsys.org/api/miniconf/users/27193?format=json", "institution": "University of Central Florida"}, {"id": 26288, "fullname": "Jun Wang", "url": "http://mlsys.org/api/miniconf/users/26288?format=json", "institution": "University of Central Florida"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10186", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "18", "related_events": [], "related_events_ids": []}, {"id": 10185, "uid": "", "name": "Practical Unstructured Sparsity for Efficient LLM Inference", "authors": [{"id": 29292, "fullname": "Donghyeon Joo", "url": "http://mlsys.org/api/miniconf/users/29292?format=json", "institution": "University of Maryland, College Park"}, {"id": 29293, "fullname": "Bahar Asgari", "url": "http://mlsys.org/api/miniconf/users/29293?format=json", "institution": "University of Maryland, College Park"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10185", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "19", "related_events": [], "related_events_ids": []}, {"id": 10184, "uid": "", "name": "HiServe: A Prefix Cache Serving System for Hybrid LLMs", "authors": [{"id": 28779, "fullname": "Joshua Zhang", "url": "http://mlsys.org/api/miniconf/users/28779?format=json", "institution": "University of Washington"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10184", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "20", "related_events": [], "related_events_ids": []}, {"id": 10181, "uid": "", "name": "Toward a Small ML Runtime Stack for Raspberry Pi 5 QPUs", "authors": [{"id": 29280, "fullname": "Yiannis Hadjiyianni", "url": "http://mlsys.org/api/miniconf/users/29280?format=json", "institution": "National Technical University of Athens, Athens, Greece"}, {"id": 29281, "fullname": "Panos Michelakis", "url": "http://mlsys.org/api/miniconf/users/29281?format=json", "institution": "National Technical University of Athens, Athens, Greece"}, {"id": 29282, "fullname": "Dimitrios Stamoulis", "url": "http://mlsys.org/api/miniconf/users/29282?format=json", "institution": "Harbin Institute of Technology, Harbin, China"}, {"id": 28254, "fullname": "Yiannis Hadjiyianni", "url": "http://mlsys.org/api/miniconf/users/28254?format=json", "institution": "National Technical University of Athens"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10181", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "23", "related_events": [], "related_events_ids": []}, {"id": 10179, "uid": "", "name": "LearnedCache: An eBPF-Integrated Perceptron-Based Eviction Policy for the Linux Page Cache", "authors": [{"id": 28970, "fullname": "Zejia Qi", "url": "http://mlsys.org/api/miniconf/users/28970?format=json", "institution": ""}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10179", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "25", "related_events": [], "related_events_ids": []}, {"id": 10178, "uid": "", "name": "Accelerating LLM Inference: Self-Speculative Decoding via Learned Seed Injection", "authors": [{"id": 29276, "fullname": "Anuradha Pandey", "url": "http://mlsys.org/api/miniconf/users/29276?format=json", "institution": "Microsoft Research"}, {"id": 26202, "fullname": "Anuradha Pandey", "url": "http://mlsys.org/api/miniconf/users/26202?format=json", "institution": "Microsoft Research/ UIUC"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10178", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "26", "related_events": [], "related_events_ids": []}, {"id": 10177, "uid": "", "name": "HADIS: Hybrid Adaptive Diffusion Model Serving for Efficient Text-to-Image Generation", "authors": [{"id": 21127, "fullname": "Qizheng Yang", "url": "http://mlsys.org/api/miniconf/users/21127?format=json", "institution": "Department of Computer Science, University of Massachusetts at Amherst"}, {"id": 29274, "fullname": "Tung-I Chen", "url": "http://mlsys.org/api/miniconf/users/29274?format=json", "institution": "University of Massachusetts Amherst"}, {"id": 29275, "fullname": "Siyu Zhao", "url": "http://mlsys.org/api/miniconf/users/29275?format=json", "institution": "University of Massachusetts Amherst"}, {"id": 21133, "fullname": "Ramesh Sitaraman", "url": "http://mlsys.org/api/miniconf/users/21133?format=json", "institution": "Department of Computer Science, University of Massachusetts at Amherst"}, {"id": 11878, "fullname": "Hui Guan", "url": "http://mlsys.org/api/miniconf/users/11878?format=json", "institution": "University of Massachusetts, Amherst; Amazon"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10177", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "27", "related_events": [], "related_events_ids": []}, {"id": 10174, "uid": "", "name": "ov_training_kit : Model training and inference on local AI PC to strengthen the AI ecosystem", "authors": [{"id": 28702, "fullname": "Shivam Basia", "url": "http://mlsys.org/api/miniconf/users/28702?format=json", "institution": "Intel Corporation"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10174", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "30", "related_events": [], "related_events_ids": []}, {"id": 10171, "uid": "", "name": "ViRuleEval: A Neuro-Symbolic System for Interpretable Evaluation of Text-to-Video Generation", "authors": [{"id": 28897, "fullname": "Chufeng Jiang", "url": "http://mlsys.org/api/miniconf/users/28897?format=json", "institution": "City University of New York"}, {"id": 29256, "fullname": "Heng Li", "url": "http://mlsys.org/api/miniconf/users/29256?format=json", "institution": "The City University of New York"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10171", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [{"id": 1254, "modified": "2026-07-12T14:45:07.529462-07:00", "display_section": 1, "type": "PDF", "name": "Slides", "visible": true, "sortkey": 0, "is_live_content": false, "uri": "/media/mlsys-2026/Slides/10171.pdf", "resourcetype": "UriEventmedia"}], "show_in_schedule_overview": false, "visible": true, "poster_position": "33", "related_events": [], "related_events_ids": []}, {"id": 10168, "uid": "", "name": "AccelOpt: A Self-Improving LLM Agentic System for AI Accelerator Kernel Optimization", "authors": [{"id": 18114, "fullname": "Genghan Zhang", "url": "http://mlsys.org/api/miniconf/users/18114?format=json", "institution": "Stanford University"}, {"id": 27646, "fullname": "Shaowei Zhu", "url": "http://mlsys.org/api/miniconf/users/27646?format=json", "institution": "Amazon"}, {"id": 27647, "fullname": "Anjiang Wei", "url": "http://mlsys.org/api/miniconf/users/27647?format=json", "institution": null}, {"id": 27171, "fullname": "Zhenyu Song", "url": "http://mlsys.org/api/miniconf/users/27171?format=json", "institution": null}, {"id": 27648, "fullname": "Allen Nie", "url": "http://mlsys.org/api/miniconf/users/27648?format=json", "institution": "Google DeepMind"}, {"id": 15476, "fullname": "Zhen Jia", "url": "http://mlsys.org/api/miniconf/users/15476?format=json", "institution": "Amazon"}, {"id": 17626, "fullname": "Nandita Vijaykumar", "url": "http://mlsys.org/api/miniconf/users/17626?format=json", "institution": "Department of Computer Science, University of Toronto"}, {"id": 11990, "fullname": "Yida Wang", "url": "http://mlsys.org/api/miniconf/users/11990?format=json", "institution": "Amazon"}, {"id": 15013, "fullname": "Kunle Olukotun", "url": "http://mlsys.org/api/miniconf/users/15013?format=json", "institution": "Stanford"}, {"id": 29250, "fullname": "Shaowei Zhu", "url": "http://mlsys.org/api/miniconf/users/29250?format=json", "institution": "Princeton"}, {"id": 29251, "fullname": "Anjiang Wei", "url": "http://mlsys.org/api/miniconf/users/29251?format=json", "institution": "Stanford University"}, {"id": 29252, "fullname": "Zhenyu Song", "url": "http://mlsys.org/api/miniconf/users/29252?format=json", "institution": "Princeton University"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10168", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "36", "related_events": [], "related_events_ids": []}, {"id": 10166, "uid": "", "name": "BLAZE: Bias-Driven Load-Aware Zero-Overhead Expert Routing", "authors": [{"id": 28753, "fullname": "Yide Ran", "url": "http://mlsys.org/api/miniconf/users/28753?format=json", "institution": "Stevens Institute of Technology"}, {"id": 29246, "fullname": "DJ Matusz", "url": "http://mlsys.org/api/miniconf/users/29246?format=json", "institution": "Lambda"}, {"id": 29247, "fullname": "Jianwen Xie", "url": "http://mlsys.org/api/miniconf/users/29247?format=json", "institution": "Lambda"}, {"id": 29248, "fullname": "Chuan Li", "url": "http://mlsys.org/api/miniconf/users/29248?format=json", "institution": "Lambda"}, {"id": 29249, "fullname": "Zhaozhuo Xu", "url": "http://mlsys.org/api/miniconf/users/29249?format=json", "institution": "Stevens Institute of Technology"}], "topic": null, "keywords": [], "decision": null, "session": "YPS Poster Session & YPS Reception", "eventtype": "Poster", "event_type": "Poster", "room_name": null, "virtualsite_url": "/virtual/2026/poster/10166", "url": null, "sourceid": null, "sourceurl": null, "starttime": null, "endtime": null, "diversity_event": null, "paper_url": "", "paper_pdf_url": null, "children_url": null, "children": [], "children_ids": [], "parent": "http://mlsys.org/api/miniconf/events/3656?format=json", "parent_id": 3656, "eventmedia": [], "show_in_schedule_overview": false, "visible": true, "poster_position": "38", "related_events": [], "related_events_ids": []}]}