{"id":157,"date":"2024-04-20T10:08:31","date_gmt":"2024-04-20T10:08:31","guid":{"rendered":"https:\/\/ieee-ras.conferences.computer.org\/2024\/?page_id=157"},"modified":"2024-06-10T14:08:26","modified_gmt":"2024-06-10T14:08:26","slug":"program-structure","status":"publish","type":"page","link":"https:\/\/ieee-ras.conferences.computer.org\/2024\/program-structure\/","title":{"rendered":"Program Structure"},"content":{"rendered":"\t\t<div data-elementor-type=\"wp-page\" data-elementor-id=\"157\" class=\"elementor elementor-157\" data-elementor-post-type=\"page\">\n\t\t\t\t<div class=\"elementor-element elementor-element-fba9531 e-flex e-con-boxed e-con e-parent\" data-id=\"fba9531\" data-element_type=\"container\" data-e-type=\"container\">\n\t\t\t\t\t<div class=\"e-con-inner\">\n\t\t\t\t<div class=\"elementor-element elementor-element-683fa01 elementor-widget elementor-widget-spacer\" data-id=\"683fa01\" data-element_type=\"widget\" data-e-type=\"widget\" data-widget_type=\"spacer.default\">\n\t\t\t\t<div class=\"elementor-widget-container\">\n\t\t\t\t\t\t\t<div class=\"elementor-spacer\">\n\t\t\t<div class=\"elementor-spacer-inner\"><\/div>\n\t\t<\/div>\n\t\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t\t\t<div class=\"elementor-element elementor-element-d68068f elementor-widget elementor-widget-heading\" data-id=\"d68068f\" data-element_type=\"widget\" data-e-type=\"widget\" data-widget_type=\"heading.default\">\n\t\t\t\t<div class=\"elementor-widget-container\">\n\t\t\t\t\t<h4 class=\"elementor-heading-title elementor-size-default\"><h2 style=\"font-family: var( --e-global-typography-5d167aa-font-family ), Sans-serif;font-weight: var( --e-global-typography-5d167aa-font-weight );line-height: var( --e-global-typography-5d167aa-line-height );font-size: var( --e-global-typography-5d167aa-font-size );letter-spacing: var( --e-global-typography-5d167aa-letter-spacing )\">Tuesday, 11th June 2024 (Single Track)<\/h2><\/h4>\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t<div 
class=\"elementor-element elementor-element-80cf19a e-con-full e-flex e-con e-child\" data-id=\"80cf19a\" data-element_type=\"container\" data-e-type=\"container\">\n\t\t\t\t<div class=\"elementor-element elementor-element-e917b88 elementor-widget elementor-widget-text-editor\" data-id=\"e917b88\" data-element_type=\"widget\" data-e-type=\"widget\" data-widget_type=\"text-editor.default\">\n\t\t\t\t<div class=\"elementor-widget-container\">\n\t\t\t\t\t\t\t\t\t<table width=\"1501\"><tbody><tr><td colspan=\"2\" width=\"187\"><strong>Timeslot<\/strong><\/td><td width=\"191\"><strong>Topic<\/strong><\/td><td width=\"273\"><strong>Organizer<\/strong><\/td><td width=\"185\"><strong>Moderator<\/strong><\/td><td width=\"357\"><strong>Speaker<\/strong><\/td><td width=\"308\"><strong>Title<\/strong><\/td><\/tr><tr><td colspan=\"2\" width=\"187\">7:00 \u2013 8:30<\/td><td colspan=\"5\" width=\"1315\">Registration and Breakfast<\/td><\/tr><tr><td colspan=\"2\" width=\"187\">8:30 \u2013 9:00<\/td><td width=\"191\">Opening Address<\/td><td colspan=\"3\" width=\"816\">Jyotika Athavale\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/Chair_Jyotika_Athavale_Bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span>, Yervant Zorian <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/Invited_talk_Yervant_Zorian_Bio\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span>, Dimitris Gizopoulos\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_dimitris_gizopoulos_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span>, Amr Haggag (Chairs)<\/td><td width=\"308\">Welcome<\/td><\/tr><tr><td rowspan=\"2\" width=\"100\">9:00 \u2013 10:00<\/td><td 
width=\"87\">9:00-9:30<\/td><td width=\"191\">Keynote 1<\/td><td colspan=\"2\" rowspan=\"2\" width=\"459\">Jyotika Athavale (IEEE Computer Society)<\/td><td width=\"357\">Ankur Garg (Microsoft) <span style=\"text-decoration: underline;color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/elementor-202\/\"><strong>BIO<\/strong><\/a><\/span><\/td><td width=\"308\">Navigating the AI Era: The Essential Role of RAS <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/keynote_ankur_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/td><\/tr><tr><td width=\"87\">9:30-10:00<\/td><td width=\"191\">Keynote 2<\/td><td width=\"357\">Steve Hesley (AMD) <span style=\"text-decoration: underline;color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/keynote_steven_hesley_amd_bio\/\"><strong>BIO<\/strong><\/a><\/span><\/td><td width=\"308\">The Vital Role of RAS <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/keynote_steven_hesley_amd_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/td><\/tr><tr><td colspan=\"2\" width=\"187\">10:00 \u2013 10:30<\/td><td colspan=\"5\" width=\"1315\">Coffee Break<\/td><\/tr><tr><td colspan=\"2\" width=\"187\">10:30 \u2013 12:00<\/td><td width=\"191\">Invited Special Session 1<br \/>(SS1 Quality)<\/td><td width=\"273\">Rama Govindaraju (Google)<\/td><td width=\"185\">Rama Govindaraju (Google)<\/td><td width=\"357\">Subhasish Mitra (Stanford)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_subhasish_mitra_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><br \/>Vilas Sridharan 
(AMD)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_vilas_sridharan_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><br \/>Harish Dixit (Meta)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_harish_dixit_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><br \/>David Lerner (Intel)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_david_lerner_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><\/td><td width=\"308\"><p><span style=\"text-decoration: underline\"><strong>SDC (ELF and best practices for in-situ screening)<\/strong><\/span><\/p><p>A Cambrian Explosion in Robust Computing Systems is Dead Ahead <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_subhasish_mitra_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><p>Addressing emerging fault modes with testing and reliability <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_vilas_sridharan_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><p>Silent Data Corruptions at Scale <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_harish_dixit_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><p>Silent Data Errors: Causes, Implications to AI Workloads, and In-Field Mitigation <span style=\"color: #0000ff\"><a style=\"color: 
#0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_david_lerner_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><\/td><\/tr><tr><td colspan=\"2\" width=\"187\">12:00 \u2013 13:00<\/td><td colspan=\"5\" width=\"1315\">Lunch<\/td><\/tr><tr><td rowspan=\"2\" width=\"100\">13:00 \u2013 14:00<\/td><td width=\"87\">13:00-13:30<\/td><td width=\"191\">Keynote 3<\/td><td colspan=\"2\" rowspan=\"2\" width=\"459\">Yervant Zorian (Synopsys)<\/td><td width=\"357\">George Tchaparian (OCP) <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/keynote_george_tchaparian_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><\/td><td width=\"308\">Challenges and OCP Community Progress towards Reliability, Availability, and Serviceability (RAS) with a Special Focus on Artificial Intelligence <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/keynote_george_tchaparian_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/td><\/tr><tr><td width=\"87\">13:30-14:00<\/td><td width=\"191\">Keynote 4<\/td><td width=\"357\">Zane Ball (Intel) <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/keynote_zane_ball_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><\/td><td width=\"308\">Pioneering Reliability, Availability, and Serviceability in the AI era <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/keynote_zane_ball_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/td><\/tr><tr><td colspan=\"2\" width=\"187\">14:00 \u2013 15:30<\/td><td width=\"191\">Invited 
Special Session 2<br \/>(SS2 Reliability)<\/td><td width=\"273\">Rama Bhimanadhuni (Microsoft)<\/td><td width=\"185\">Shawn Blanton (CMU)<\/td><td width=\"357\">Yogesh Varma (Intel)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_yogesh_varma-_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><br \/>Rama Bhimanadhuni (MSFT)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_rama_bhimanadhuni-_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><br \/>Drew Walton\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_drew_walton_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><br \/>Dimitris Gizopoulos (U of Athens)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_dimitris_gizopoulos_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><\/td><td width=\"308\"><p><span style=\"text-decoration: underline\"><strong>Hardware Fault Management<\/strong><\/span><\/p><p>Towards Autonomous Hardware Fault Management <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_yogeshvarma-_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><p>Enabling Generative AI- Exploring RAS Requirements for Hyperscale AI Infrastructure <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_rama_bhimanadhuni_abstract\/\"><span style=\"text-decoration: 
underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><p>Efforts to Address Fault Management Challenges in OCP <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_drew_walton_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><p>The Role of Abstraction and Modeling in the Assessment of Hardware Faults Effects <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_dimitris_gizopoulos_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><\/td><\/tr><tr><td colspan=\"2\" width=\"187\">15:30 \u2013 16:00<\/td><td colspan=\"5\" width=\"1315\">Coffee Break<\/td><\/tr><tr><td colspan=\"2\" width=\"187\">16:00 &#8211; 17:30<\/td><td width=\"191\">Invited Special Session 3<br \/>(SS3 Availability)<\/td><td width=\"273\">Yogesh Varma (Intel)<\/td><td width=\"185\">Cecilia Metra (U of Bologna)<\/td><td width=\"357\">Swadesh Choudhary (Intel)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_swadesh_choudhary_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><br \/>Yervant Zorian (Synopsys)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/Invited_talk_Yervant_Zorian_Bio\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><br \/>Arijit Biswas (Intel)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_arijit_biswas_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><br \/>Sanjay Gongalore (Nvidia)\u00a0<span style=\"color: #0000ff\"><a style=\"color: 
#0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_sanjay_gongalore_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><\/td><td width=\"308\"><p><span style=\"text-decoration: underline\"><strong>Pathfinding Toward SoC Self-Healing Architectur<\/strong><strong>e<\/strong><\/span><\/p><p>UCIe RAS Overview <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_swadesh_choudhary_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><p>RAS Challenges &amp; Solution for Today\u2019s Chiplet-based Systems <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/Invited_talk_Yervant_Abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><p>Pathfinding Toward SoC Self-Healing Architecture <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_arijit_biswas_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><p>Maximizing Availability for a Zettascale Datacenter <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_sanjay_gongalore_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><\/td><\/tr><tr><td colspan=\"2\" width=\"187\">17:30 \u2013 19:00<\/td><td colspan=\"5\" width=\"1315\">Reception with IEEE CS BOG<\/td><\/tr><tr><td colspan=\"2\" width=\"187\">19:00 \u2013 20:30<\/td><td width=\"191\">Invited Special Session 4<br \/>(SS4 Serviceability)<\/td><td width=\"273\">Drew Walton<\/td><td width=\"185\">Drew Walton\u00a0<\/td><td width=\"357\">John Holm (Intel)\u00a0<span style=\"color: #0000ff\"><a 
style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_john_holm_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><br \/>Rob Chappell (Microsoft)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_rob_chappell-_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><br \/>Anil Agrawal (Meta)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_anil_agrawal_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><br \/>Amit Pandey (Amazon)\u00a0<span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_amit_pandey_bio\/\"><span style=\"text-decoration: underline\"><strong>BIO<\/strong><\/span><\/a><\/span><\/td><td width=\"308\"><p><strong><span style=\"text-decoration: underline\">In-fleet Serviceability<\/span><\/strong><\/p><p>Enhancing Computer Serviceability Through Error Telemetry <a href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_john_holm_abstract\/\"><span style=\"color: #0000ff\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/span><\/a><\/p><p><span class=\"fontstyle0\"><span style=\"font-family: inherit;font-size: inherit\">Challenges in Hyperscale Serviceability<\/span><span style=\"font-family: inherit;font-size: inherit\">\u00a0<\/span><span style=\"text-decoration: underline;color: #0000ff\"><span class=\"fontstyle0\" style=\"font-family: inherit;font-size: inherit\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_rob_chappell_abstract\/\"><strong>ABSTRACT<\/strong><\/a><\/span><\/span><\/span><\/p><p><span class=\"fontstyle0\">In-band Error Handling 
requirements for RAS in hyperscale data centers <a href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_anil_agrawal_abstract\/\"><span style=\"color: #0000ff\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/span><\/a><\/span><\/p><p>Addressing Serviceability throughout device lifecycle with High Speed Access for Test <span style=\"color: #0000ff\"><a style=\"color: #0000ff\" href=\"https:\/\/ieee-ras.conferences.computer.org\/2024\/invited_talk_amit_pandey_abstract\/\"><span style=\"text-decoration: underline\"><strong>ABSTRACT<\/strong><\/span><\/a><\/span><\/p><\/td><\/tr><\/tbody><\/table>\t\t\t\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t<div class=\"elementor-element elementor-element-623a16e elementor-hidden-desktop elementor-hidden-tablet elementor-hidden-mobile e-flex e-con-boxed e-con e-parent\" data-id=\"623a16e\" data-element_type=\"container\" data-e-type=\"container\" data-settings=\"{&quot;background_background&quot;:&quot;classic&quot;}\">\n\t\t\t\t\t<div class=\"e-con-inner\">\n\t\t\t\t<div class=\"elementor-element elementor-element-2fd2553 elementor-widget elementor-widget-heading\" data-id=\"2fd2553\" data-element_type=\"widget\" data-e-type=\"widget\" data-widget_type=\"heading.default\">\n\t\t\t\t<div class=\"elementor-widget-container\">\n\t\t\t\t\t<h2 class=\"elementor-heading-title elementor-size-default\">Wednesday, 12th June 2024 (Dual Track)<\/h2>\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t\t\t<div class=\"elementor-element elementor-element-64a4016 elementor-widget elementor-widget-text-editor\" data-id=\"64a4016\" data-element_type=\"widget\" data-e-type=\"widget\" data-widget_type=\"text-editor.default\">\n\t\t\t\t<div class=\"elementor-widget-container\">\n\t\t\t\t\t\t\t\t\t<table width=\"748\"><tbody><tr><td width=\"97\"><p>07:00 \u2013 08:00<\/p><\/td><td width=\"328\"><p><strong>Breakfast<\/strong><\/p><\/td><td 
width=\"322\"><p><strong>\u00a0<\/strong><\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>\u00a0<\/strong><\/p><\/td><td width=\"322\"><p><strong>\u00a0<\/strong><\/p><\/td><\/tr><tr><td width=\"97\"><p>08:00 \u2013 09:15<\/p><\/td><td width=\"328\"><p><strong>Session 1<br \/>Data Center RAS 1<\/strong><\/p><\/td><td width=\"322\"><p><strong>Session 2<\/strong><\/p><p><strong>Memory and Interconnects 1<\/strong><\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>1.1 \u2013 <\/strong><strong>Silent Data Corruption \u2013 Intel-Meta joint collaboration to detect and mitigate at-scale<\/strong><\/p><p>Shubhada Sahasrabudhe, Harish Dixit, David Lerner, Tejasvi Chakravarthy, Thiago Macieira, Matt Beadon, Sriram Sankar and Ethan Hansen (Intel and Meta)\u00a0\u00a0\u00a0\u00a0\u00a0<\/p><\/td><td width=\"322\"><p><strong>2.1 \u2013 <\/strong><strong>AI in BMC: Improving DDR5 Memory Reliability in Hyperscale Data Centers <\/strong><\/p><p>Shen Zhou, Dahai Zhou, Gaoyu Ruan, Zhibing Li, Yi Li and Keke Xie (Intel and Alibaba)\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>1.2 \u2013 <\/strong><strong>Silent Data Corruption &#8211; Meta-AMD silent error collaboration for screening efficiency at-scale<\/strong><\/p><p>Tejasvi Chakravarthy, Sankarnarayanan Gurumurthy, Harish Dattatraya Dixit and Abishek Hariharan (Meta and AMD)<\/p><\/td><td width=\"322\"><p><strong>2.2 \u2013 <\/strong><strong>The Future is Now: Empowering DRAM ECC through a Forgotten Coding Theory<\/strong><\/p><p>Kelly Fitzpatrick, Saeed Raja, Yang Liu and Tong Zhang (ScaleFlux)<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>1.3 \u2013 <\/strong><strong>RAS Significance and Challenges in Hyper-Scalar Data Centers with Need for Industry Standardization<\/strong><\/p><p>Tulika Jha, Bob Krick, John 
Lee and Saurabh Agrawal (Microsoft)<\/p><\/td><td width=\"322\"><p><strong>2.3 \u2013 <\/strong><strong>Standardized RAS API using CXL Component Command Interface<\/strong><\/p><p>Shubhada Pugaonkar and Antonio Hasbun Marin (Intel)<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>1.4 \u2013 <\/strong><strong>Innovative Approaches to Solving Flash-Induced Latencies in Hyperscale Environments<\/strong><\/p><p>Vineet Parekh, Suman Gumudaveli and Venkat Ramesh (Meta)<\/p><\/td><td width=\"322\"><p><strong>2.4 \u2013 <\/strong><strong>Reducing Memory Errors On-the-fly with Prediction-Guided Failure Prevention<\/strong><\/p><p>Shen Zhou, Yu Zhang, Chenchen Li, Linlin Han and Feng Xu (Intel and ByteDance)<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>1.5 \u2013 <\/strong><strong>Open Compute Project&#8217;s Server Resilience Specification 1.0<\/strong><\/p><p>Thiago Macieira (Intel)<\/p><\/td><td width=\"322\"><p><strong>2.5 \u2013 <\/strong><strong>PCIe Error Handling Challenges in building AI\/ML systems in hyperscale datacenters<\/strong><\/p><p>Anil Agrawal and Bill Holland (Meta)<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>\u00a0<\/strong><\/p><\/td><td width=\"322\"><p><strong>\u00a0<\/strong><\/p><\/td><\/tr><tr><td width=\"97\"><p>09:15 \u2013 10:30<\/p><\/td><td width=\"328\"><p><strong>Session 3<\/strong><\/p><p><strong>Data Center RAS 2<\/strong><\/p><\/td><td width=\"322\"><p><strong>Session 4<\/strong><\/p><p><strong>Memory and Interconnects 2<\/strong><\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>3.1 \u2013 <\/strong><strong>OpenDCDiag: A Scalable Open-Source Solution to Search for Silent Data Errors<\/strong><\/p><p>Thiago Macieira (Intel)<\/p><\/td><td width=\"322\"><p><strong>4.1 \u2013 <\/strong><strong>RAIDDR: Error Correction for Multi-device Busses<\/strong><\/p><p>Majid Nemati, Terry Grunzke, 
Brett Dodds and Adam Grenzebach (Microsoft)<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>3.2 \u2013 <\/strong><strong>Writing SDE-finding tests using OpenDCDiag<\/strong><\/p><p>Rohit Agashe and Thiago Macieira (Intel)<\/p><\/td><td width=\"322\"><p><strong>4.2 \u2013 <\/strong><strong>CXL RAS learnings<\/strong><\/p><p>Manjunaatha Harapanahalli, Erwin Tsaur and Mahesh Natu (Intel)<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>3.3 \u2013 <\/strong><strong>Maintaining data integrity during transformation<\/strong><\/p><p>Smita Kumar, Patrick Fleming, Gordon McFadden and Sailesh Bissessur (Intel)<\/p><\/td><td width=\"322\"><p><strong>4.3 \u2013 <\/strong><strong>Data Centers\u2019 Reliability Risks due to Faults\u00a0 Affecting their High Performance Microprocessors\u2019 Caches<\/strong><\/p><p>Martin Omana, Annalisa Manfredi, Cecilia Metra, Riccardo Locatelli, Monia Chiavacci and Stefano Petrucci (U Bologna, Intel)<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>3.4 \u2013 <\/strong><strong>Microarchitectural Modeling of Modern CPUs for SDCs Prediction in Data Centers<\/strong><\/p><p>Dimitris Gizopoulos, George Papadimitriou and Odysseas Chatzopoulos (U Athens)\u00a0<\/p><\/td><td width=\"322\"><p><strong>4.4 \u2013 <\/strong><strong>The Management Era: Predictive DRAM Fault Analysis with Architecture Awareness<\/strong><\/p><p>Hoiju Chung, Yongjun Lee, Woongju Jang, Euisang Oh, Sanghwan Lee, Paul Fahey, Kijoong Choi, Arhatha Bramhanand and Brett Dodds (SK Hynix and Microsoft)<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>3.5 \u2013 <\/strong><strong>The Challenges of Operating a Heterogeneous Edge Cluster<\/strong><\/p><p>Nicolas Oliver, Rajkumar Patel, Dean Throop and Mrinal Karvir (Intel)<\/p><\/td><td width=\"322\"><p><strong>4.5 \u2013 <\/strong><strong>Managing Memory Correctable Error 
Solutions<\/strong><\/p><p>Shawn Fan, Alex Zhou, Eric Li, Annie Yu, Taniya Siddiqua, Kaushik Balasubramanian, Fang Yuan and Xiaoguo Liang (Intel and Tencent)<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p>\u00a0<\/p><\/td><td width=\"322\"><p>\u00a0<\/p><\/td><\/tr><tr><td width=\"97\"><p>10:30 \u2013 11:00<\/p><\/td><td width=\"328\"><p><strong>Coffee Break<\/strong><\/p><\/td><td width=\"322\"><p>\u00a0<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p>\u00a0<\/p><\/td><td width=\"322\"><p>\u00a0<\/p><\/td><\/tr><tr><td width=\"97\"><p>11:00 \u2013 12:30<\/p><\/td><td width=\"328\"><p><strong>Session 5<\/strong><\/p><p><strong>AI and RAS<\/strong><\/p><\/td><td width=\"322\"><p><strong>Session 6<\/strong><\/p><p><strong>Testing and Resilience<\/strong><\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>5.1 \u2013 <\/strong><strong>Meta AI Server Reliability Dimensional Analysis<\/strong><\/p><p>Peng Xiao and Mihir Patel (Meta)<\/p><\/td><td width=\"322\"><p><strong>6.1 \u2013 <\/strong><strong>Delay Monitoring Under Different PVT Corners<\/strong><\/p><p>Hari Addepalli, Jiezhong Wu, Nilanjan Mukherjee, Irith Pomeranz and Janusz Rajski (Purdue U and Siemens)<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>5.2 \u2013 <\/strong><strong>Comprehensive Reliability Analysis in AI systems<\/strong><\/p><p>Anju John, Matt Bergeron and Mihir Patel (Meta)<\/p><\/td><td width=\"322\"><p><strong>6.2 \u2013 <\/strong><strong>Timing-Verification Test for Timing Related Defects<\/strong><\/p><p>Jiezhong Wu, Hari Addepalli, Nilanjan Mukherjee, Irith Pomeranz, Kun-Han Tsai and Janusz Rajski (Purdue U and Siemens)<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>5.3 \u2013 <\/strong><strong>Build High Reliability\/Availability\/Serviceability head node for AI server<\/strong><\/p><p>Alex Zhou, Yu Zhang, Chenchen Li, 
Fang Yuan, Shijian Ge, Albert Hu, Liang Peng, Antonio J Hasbun Marin and Shawn Fan (Intel and ByteDance)<\/p><\/td><td width=\"322\"><p><strong>6.3 \u2013 <\/strong><strong>A Functionally-Aware Scan-Based Test Solution for Silent Data Corruption<\/strong><\/p><p>Irith Pomeranz and Yervant Zorian (Purdue U and Synopsys)<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>5.4 \u2013 <\/strong><strong>PVF (Parameter Vulnerability Factor): A Scalable Metric to Quantify AI Vulnerability to Parameter Corruptions<\/strong><\/p><p>Xun Jiao, Fred Lin and Harish Dixit (Meta)<\/p><\/td><td width=\"322\"><p><strong>6.4 \u2013 <\/strong><strong>ResGNN: A Generic Framework for Measuring Graph Neural Network Resilience Against Faults and Attacks in Hardware Systems<\/strong><\/p><p>Hanqiu Chen, Zishen Wan and Cong Hao (Georgia Tech)\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>5.5 \u2013 <\/strong><strong>What does measuring resilience in AI systems entail?<\/strong><\/p><p>Chitkala Sethuraman (Microsoft)\u00a0\u00a0\u00a0<\/p><\/td><td width=\"322\"><p>\u00a0<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p><strong>5.6 \u2013 <\/strong><strong>Dual Transformer Encoding: Remaining Useful Life Estimation through Channel-Independent and Collective Approach<\/strong><\/p><p>Paul Nikolian and Fadi Kurdahi (UC Irvine)<\/p><\/td><td width=\"322\"><p>\u00a0<\/p><\/td><\/tr><tr><td width=\"97\"><p>\u00a0<\/p><\/td><td width=\"328\"><p>\u00a0<\/p><\/td><td width=\"322\"><p>\u00a0<\/p><\/td><\/tr><tr><td width=\"97\"><p>12:30 \u2013 14:00<\/p><\/td><td width=\"328\"><p><strong>Networking Lunch<\/strong><\/p><\/td><td width=\"322\"><p>\u00a0<\/p><\/td><\/tr><\/tbody><\/table>\t\t\t\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t<div class=\"elementor-element elementor-element-1543b50 
e-flex e-con-boxed e-con e-parent\" data-id=\"1543b50\" data-element_type=\"container\" data-e-type=\"container\" data-settings=\"{&quot;background_background&quot;:&quot;classic&quot;}\">\n\t\t\t\t\t<div class=\"e-con-inner\">\n\t\t\t\t<div class=\"elementor-element elementor-element-503385d elementor-widget elementor-widget-heading\" data-id=\"503385d\" data-element_type=\"widget\" data-e-type=\"widget\" data-widget_type=\"heading.default\">\n\t\t\t\t<div class=\"elementor-widget-container\">\n\t\t\t\t\t<h2 class=\"elementor-heading-title elementor-size-default\">Wednesday, 12th June 2024 (Dual Track)<\/h2>\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t<div class=\"elementor-element elementor-element-00746a3 e-flex e-con-boxed e-con e-parent\" data-id=\"00746a3\" data-element_type=\"container\" data-e-type=\"container\">\n\t\t\t\t\t<div class=\"e-con-inner\">\n\t\t\t\t<div class=\"elementor-element elementor-element-ebab228 elementor-widget elementor-widget-text-editor\" data-id=\"ebab228\" data-element_type=\"widget\" data-e-type=\"widget\" data-widget_type=\"text-editor.default\">\n\t\t\t\t<div class=\"elementor-widget-container\">\n\t\t\t\t\t\t\t\t\t<table width=\"748\"><tbody><tr><td width=\"97\"><p>07:00 \u2013 08:00<\/p><\/td><td width=\"328\"><p><strong>Breakfast<\/strong><\/p><\/td><td width=\"322\"><p><strong>\u00a0<\/strong><\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p>\u00a0(Speaker Name<strong><em> Highlighted<\/em><\/strong>)<\/p><\/td><td width=\"322\"><p><strong>\u00a0<\/strong><\/p><\/td><\/tr><tr><td width=\"97\"><p>08:00 \u2013 09:15<\/p><\/td><td width=\"328\"><p><strong>Session 1<\/strong><\/p><p><strong>Data Center RAS 1<\/strong><\/p><p><strong>Moderator: <\/strong>Bharath Parthasarathy<\/p><\/td><td width=\"322\"><p><strong>Session 2<\/strong><\/p><p><strong>Memory and Interconnects 1<\/strong><\/p><p><strong>Moderator: <\/strong>Kwabena Boateng<\/p><\/td><\/tr><tr><td 
width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>1.1 \u2013 <\/strong><strong>Silent Data Corruption \u2013 Intel-Meta joint collaboration to detect and mitigate at-scale<\/strong><\/p><p>Shubhada Sahasrabudhe, Harish Dixit, <strong><em>David Lerner<\/em><\/strong>, Tejasvi Chakravarthy, Thiago Macieira, Matt Beadon, Sriram Sankar and Ethan Hansen (Intel and Meta)\u00a0\u00a0\u00a0\u00a0\u00a0<\/p><\/td><td width=\"322\"><p><strong>2.1 \u2013 <\/strong><strong>AI in BMC: Improving DDR5 Memory Reliability in Hyperscale Data Centers <\/strong><\/p><p>Shen Zhou, Dahai Zhou, Haoyu Ruan, Zhibing Li, Yi Li, Keke Xie, and <strong><em>Yogesh Varma<\/em><\/strong> (Intel and Alibaba)\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>1.2 \u2013 <\/strong><strong>Silent Data Corruption &#8211; Meta-AMD silent error collaboration for screening efficiency at-scale<\/strong><\/p><p>Gautham Vunnam, <strong><em>Abishek Hariharan<\/em><\/strong>, Sankarnarayanan Gurumurthy, Tejasvi Chakravarthy, Harish Dattatraya Dixit (Meta and AMD)<\/p><\/td><td width=\"322\"><p><strong>2.2 \u2013 <\/strong><strong>The Future is Now: Empowering DRAM ECC through a Forgotten Coding Theory<\/strong><\/p><p>Kelly Fitzpatrick, Saeed Raja, Yang Liu and <em><strong>Tong Zhang<\/strong><\/em> (ScaleFlux)<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>1.3 \u2013 <\/strong><strong>RAS Significance and Challenges in Hyper-Scalar Data Centers with Need for Industry Standardization<\/strong><\/p><p><strong><em>Tulika Jha<\/em><\/strong>, Bob Krick, John Lee and Saurabh Agrawal (Microsoft)<\/p><\/td><td width=\"322\"><p><strong>2.3 \u2013 <\/strong><strong>Standardized RAS API using CXL Component Command Interface<\/strong><\/p><p><strong><em>Shubhada Pugaonkar<\/em><\/strong> and Antonio Hasbun Marin (Intel)<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td 
width=\"328\"><p><strong>1.4 \u2013 <\/strong><strong>Innovative Approaches to Solving Flash-Induced Latencies in Hyperscale Environments<\/strong><\/p><p><strong><em>Vineet Parekh<\/em><\/strong>, Suman Gumudaveli and Venkat Ramesh (Meta)<\/p><\/td><td width=\"322\"><p><strong>2.4 \u2013 <\/strong><strong>Reducing Memory Errors On-the-fly with Prediction-Guided Failure Prevention<\/strong><\/p><p>Shen Zhou, Yu Zhang, <strong><em>Chenchen Li<\/em><\/strong>, Linlin Han and Feng Xu (Intel and ByteDance)<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>1.5 \u2013 <\/strong><strong>Open Compute Project&#8217;s Server Resilience Specification 1.0<\/strong><\/p><p><strong><em>Thiago Macieira<\/em><\/strong> (Intel)<\/p><\/td><td width=\"322\"><p><strong>2.5 \u2013 <\/strong><strong>PCIe Error Handling Challenges in building AI\/ML systems in hyperscale datacenters<\/strong><\/p><p>Anil Agrawal and <strong><em>Bill Holland<\/em><\/strong> (Meta)<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>\u00a0<\/strong><\/p><\/td><td width=\"322\"><p><strong>\u00a0<\/strong><\/p><\/td><\/tr><tr><td width=\"97\"><p>09:15 \u2013 10:30<\/p><\/td><td width=\"328\"><p><strong>Session 3<\/strong><\/p><p><strong>Data Center RAS 2<\/strong><\/p><p><strong>Moderator: <\/strong>Harish Dixit<\/p><\/td><td width=\"322\"><p><strong>Session 4<\/strong><\/p><p><strong>Memory and Interconnects 2<\/strong><\/p><p><strong>Moderator: <\/strong>Sreejit Chakravarty<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>3.1 \u2013 <\/strong><strong>OpenDCDiag: A Scalable Open-Source Solution to Search for Silent Data Errors<\/strong><\/p><p><strong><em>Thiago Macieira<\/em><\/strong> (Intel)<\/p><\/td><td width=\"322\"><p><strong>4.1 \u2013 <\/strong><strong>RAIDDR: Error Correction for Multi-device Busses<\/strong><\/p><p><strong><em>Majid Nemati<\/em><\/strong>, Terry Grunzke, Brett Dodds and Adam Grenzebach 
(Microsoft)<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>3.2 \u2013 <\/strong><strong>Writing SDE-finding tests using OpenDCDiag<\/strong><\/p><p><strong><em>Rohit Agashe<\/em><\/strong> and Thiago Macieira (Intel)<\/p><\/td><td width=\"322\"><p><strong>4.2 \u2013 <\/strong><strong>CXL RAS learnings<\/strong><\/p><p><strong><em>Manjunaatha Harapanahalli<\/em><\/strong>, Erwin Tsaur and Mahesh Natu (Intel)<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>3.3 \u2013 <\/strong><strong>Maintaining data integrity during transformation<\/strong><\/p><p>Smita Kumar, Patrick Fleming, Gordon McFadden and <strong><em>Sailesh Bissessur<\/em><\/strong> (Intel)<\/p><\/td><td width=\"322\"><p><strong>4.3 \u2013 <\/strong><strong>Data Centers\u2019 Reliability Risks due to Faults Affecting their High Performance Microprocessors\u2019 Caches<\/strong><\/p><p>Martin Omana, Annalisa Manfredi, <strong><em>Cecilia Metra<\/em><\/strong>, Riccardo Locatelli, Monia Chiavacci and Stefano Petrucci (U Bologna, Intel)<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>3.4 \u2013 <\/strong><strong>Microarchitectural Modeling of Modern CPUs for SDCs Prediction in Data Centers<\/strong><\/p><p><strong><em>Dimitris Gizopoulos<\/em><\/strong>, George Papadimitriou and Odysseas Chatzopoulos (U Athens)\u00a0<\/p><\/td><td width=\"322\"><p><strong>4.4 \u2013 <\/strong><strong>The Management Era: Predictive DRAM Fault Analysis with Architecture Awareness<\/strong><\/p><p><strong><em>Hoiju Chung<\/em><\/strong>, Yongjun Lee, Woongju Jang, Euisang Oh, Sanghwan Lee, Paul Fahey, Kijoong Choi, Arhatha Bramhanand and Brett Dodds (SK Hynix and Microsoft)<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>3.5 \u2013 <\/strong><strong>The Challenges of Operating a Heterogeneous Edge Cluster<\/strong><\/p><p><strong><em>Nicolas Oliver<\/em><\/strong>, Rajkumar Patel, Dean Throop and Mrinal
Karvir (Intel)<\/p><\/td><td width=\"322\"><p><strong>4.5 \u2013 <\/strong><strong>Managing Memory Correctable Error Solutions<\/strong><\/p><p>Shawn Fan, Alex Zhou, Eric Li, Annie Yu, <strong><em>Zengping Xu<\/em><\/strong>, Taniya Siddiqua, Kaushik Balasubramanian, Fang Yuan and Xiaoguo Liang (Intel and Tencent)\u00a0<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\">\u00a0<\/td><td width=\"322\">\u00a0<\/td><\/tr><tr><td width=\"97\"><p>10:30 \u2013 11:00<\/p><\/td><td width=\"328\"><p><strong>Coffee Break<\/strong><\/p><\/td><td width=\"322\">\u00a0<\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\">\u00a0<\/td><td width=\"322\">\u00a0<\/td><\/tr><tr><td width=\"97\"><p>11:00 \u2013 12:30<\/p><\/td><td width=\"328\"><p><strong>Session 5<\/strong><\/p><p><strong>AI and RAS<\/strong><\/p><p><strong>Moderator: <\/strong>Preeti Chauhan<\/p><\/td><td width=\"322\"><p><strong>Session 6<\/strong><\/p><p><strong>Testing and Resilience<\/strong><\/p><p><strong>Moderator: <\/strong>Chris Connor<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>5.1 \u2013 <\/strong><strong>Meta AI Server Reliability Dimensional Analysis<\/strong><\/p><p><strong><em>Peng Xiao<\/em><\/strong> and Mihir Patel (Meta)<\/p><\/td><td width=\"322\"><p><strong>6.1 \u2013 <\/strong><strong>Delay Monitoring Under Different PVT Corners<\/strong><\/p><p>Hari Addepalli, Jiezhong Wu, <strong><em>Nilanjan Mukherjee<\/em><\/strong>, Irith Pomeranz and Janusz Rajski (Purdue U and Siemens)<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>5.2 \u2013 <\/strong><strong>Comprehensive Reliability Analysis in AI systems<\/strong><\/p><p><strong><em>Anju John<\/em><\/strong>, Matt Bergeron and Mihir Patel (Meta)<\/p><\/td><td width=\"322\"><p><strong>6.2 \u2013 <\/strong><strong>Timing-Verification Test for Timing Related Defects<\/strong><\/p><p>Jiezhong Wu, Hari Addepalli, Nilanjan Mukherjee, Irith Pomeranz, Kun-Han Tsai and 
<strong><em>Janusz Rajski<\/em> <\/strong>(Purdue U and Siemens)<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>5.3 \u2013 <\/strong><strong>Build High Reliability\/Availability\/Serviceability head node for AI server<\/strong><\/p><p>Alex Zhou, Yu Zhang, Chenchen Li, Fang Yuan, <strong><em>Shijian Ge<\/em><\/strong>, Albert Hu, Liang Peng, Antonio J Hasbun Marin and Shawn Fan (Intel and ByteDance)<\/p><\/td><td width=\"322\"><p><strong>6.3 \u2013 <\/strong><strong>A Functionally-Aware Scan-Based Test Solution for Silent Data Corruption<\/strong><\/p><p><strong><em>Irith Pomeranz<\/em><\/strong> (Purdue U)<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>5.4 \u2013 <\/strong><strong>PVF (Parameter Vulnerability Factor): A Scalable Metric to Quantify AI Vulnerability to Parameter Corruptions<\/strong><\/p><p><strong><em>Xun Jiao<\/em><\/strong>, Fred Lin and Harish Dixit (Meta)<\/p><\/td><td width=\"322\"><p><strong>6.4 \u2013 <\/strong><strong>ResGNN: A Generic Framework for Measuring Graph Neural Network Resilience Against Faults and Attacks in Hardware Systems<\/strong><\/p><p><strong><em>Hanqiu Chen<\/em><\/strong>, Zishen Wan and Cong Hao (Georgia Tech)\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0\u00a0<\/p><\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>5.5 \u2013 <\/strong><strong>What does measuring resilience in AI systems entail?<\/strong><\/p><p><strong><em>Chitkala Sethuraman<\/em><\/strong> (Microsoft)\u00a0\u00a0\u00a0<\/p><\/td><td width=\"322\">\u00a0<\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td width=\"328\"><p><strong>5.6 \u2013 Multi Channel Transformer<\/strong><strong>: Remaining Useful Life Estimation through Channel-Independent and Collective Approach<\/strong><\/p><p><strong><em>Paul Nikolian<\/em><\/strong> and Fadi Kurdahi (UC Irvine)<\/p><\/td><td width=\"322\">\u00a0<\/td><\/tr><tr><td width=\"97\">\u00a0<\/td><td
width=\"328\">\u00a0<\/td><td width=\"322\">\u00a0<\/td><\/tr><tr><td width=\"97\"><p>12:30 \u2013 14:00<\/p><\/td><td width=\"328\"><p><strong>Networking Lunch<\/strong><\/p><\/td><td width=\"322\">\u00a0<\/td><\/tr><\/tbody><\/table>\t\t\t\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t<div class=\"elementor-element elementor-element-e8c101e e-flex e-con-boxed e-con e-parent\" data-id=\"e8c101e\" data-element_type=\"container\" data-e-type=\"container\">\n\t\t\t\t\t<div class=\"e-con-inner\">\n\t\t\t\t<div class=\"elementor-element elementor-element-f894486 elementor-widget elementor-widget-text-editor\" data-id=\"f894486\" data-element_type=\"widget\" data-e-type=\"widget\" data-widget_type=\"text-editor.default\">\n\t\t\t\t<div class=\"elementor-widget-container\">\n\t\t\t\t\t\t\t\t\t<p><strong>Registration will be located outside of Sedona<\/strong><\/p><p>Registration Hours: 7:00 am &#8211; 8:30 am\u00a0<\/p><p><strong><u>Tuesday, June 11<\/u><\/strong><\/p><p>All sessions will be held in Sedona<\/p><p>Breakfast &amp; Lunch will be located in Salons 7-9<\/p><p>Reception will be held in the Orchard Lounge\u00a0<\/p><p><strong><u>Wednesday, June 12 (half day session)<\/u><\/strong><\/p><p>Breakout Session #1- Salon A<\/p><p>Breakout Session #2- Salon B\u00a0<\/p><p>Breakfast and Lunch will be located in Salons 7-9<\/p>\t\t\t\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t<div class=\"elementor-element elementor-element-2f5579c e-flex e-con-boxed e-con e-parent\" data-id=\"2f5579c\" data-element_type=\"container\" data-e-type=\"container\">\n\t\t\t\t\t<div class=\"e-con-inner\">\n\t\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t\t\t<\/div>\n\t\t","protected":false},"excerpt":{"rendered":"<p>\/*! 
elementor &#8211; v3.21.0 &#8211; 26-05-2024 *\/ .elementor-column .elementor-spacer-inner{height:var(&#8211;spacer-size)}.e-con{&#8211;container-widget-width:100%}.e-con-inner&gt;.elementor-widget-spacer,.e-con&gt;.elementor-widget-spacer{width:var(&#8211;container-widget-width,var(&#8211;spacer-size));&#8211;align-self:var(&#8211;container-widget-align-self,initial);&#8211;flex-shrink:0}.e-con-inner&gt;.elementor-widget-spacer&gt;.elementor-widget-container,.e-con&gt;.elementor-widget-spacer&gt;.elementor-widget-container{height:100%;width:100%}.e-con-inner&gt;.elementor-widget-spacer&gt;.elementor-widget-container&gt;.elementor-spacer,.e-con&gt;.elementor-widget-spacer&gt;.elementor-widget-container&gt;.elementor-spacer{height:100%}.e-con-inner&gt;.elementor-widget-spacer&gt;.elementor-widget-container&gt;.elementor-spacer&gt;.elementor-spacer-inner,.e-con&gt;.elementor-widget-spacer&gt;.elementor-widget-container&gt;.elementor-spacer&gt;.elementor-spacer-inner{height:var(&#8211;container-widget-height,var(&#8211;spacer-size))}.e-con-inner&gt;.elementor-widget-spacer.elementor-widget-empty,.e-con&gt;.elementor-widget-spacer.elementor-widget-empty{position:relative;min-height:22px;min-width:22px}.e-con-inner&gt;.elementor-widget-spacer.elementor-widget-empty .elementor-widget-empty-icon,.e-con&gt;.elementor-widget-spacer.elementor-widget-empty .elementor-widget-empty-icon{position:absolute;top:0;bottom:0;left:0;right:0;margin:auto;padding:0;width:22px;height:22px} \/*! 
elementor &#8211; v3.21.0 &#8211; 26-05-2024 *\/ .elementor-heading-title{padding:0;margin:0;line-height:1}.elementor-widget-heading .elementor-heading-title[class*=elementor-size-]&gt;a{color:inherit;font-size:inherit;line-height:inherit}.elementor-widget-heading .elementor-heading-title.elementor-size-small{font-size:15px}.elementor-widget-heading .elementor-heading-title.elementor-size-medium{font-size:19px}.elementor-widget-heading .elementor-heading-title.elementor-size-large{font-size:29px}.elementor-widget-heading .elementor-heading-title.elementor-size-xl{font-size:39px}.elementor-widget-heading .elementor-heading-title.elementor-size-xxl{font-size:59px} Tuesday, 11th June 2024 (SingleTrack) Timeslot Topic Organizer Moderator Speaker Title 7:00 \u2013 8:30 Registration and Breakfast 8:30 \u2013 9:00 Opening Address Jyotika Athavale\u00a0BIO, Yervant Zorian BIO, Dimitris Gizopoulos\u00a0BIO, Amr [&hellip;]<\/p>\n","protected":false},"author":8,"featured_media":0,"parent":0,"menu_order":0,"comment_status":"closed","ping_status":"closed","template":"elementor_header_footer","meta":{"footnotes":""},"class_list":["post-157","page","type-page","status-publish","hentry"],"_links":{"self":[{"href":"https:\/\/ieee-ras.conferences.computer.org\/2024\/wp-json\/wp\/v2\/pages\/157","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/ieee-ras.conferences.computer.org\/2024\/wp-json\/wp\/v2\/pages"}],"about":[{"href":"https:\/\/ieee-ras.conferences.computer.org\/2024\/wp-json\/wp\/v2\/types\/page"}],"author":[{"embeddable":true,"href":"https:\/\/ieee-ras.conferences.computer.org\/2024\/wp-json\/wp\/v2\/users\/8"}],"replies":[{"embeddable":true,"href":"https:\/\/ieee-ras.conferences.computer.org\/2024\/wp-json\/wp\/v2\/comments?post=157"}],"version-history":[{"count":0,"href":"https:\/\/ieee-ras.conferences.computer.org\/2024\/wp-json\/wp\/v2\/pages\/157\/revisions"}],"wp:attachment":[{"href":"https:\/\/ieee-ras.conferences.computer.org\/2024\/wp-json\/wp\/v2
\/media?parent=157"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}