<!DOCTYPE html><html lang="en" xmlns="http://www.w3.org/1999/xhtml" xmlns:v="urn:schemas-microsoft-com:vml" xmlns:o="urn:schemas-microsoft-com:office:office" style="font-size:16px;"><head><meta charset="utf-8"/><!--[if !mso]><!--><meta http-equiv="X-UA-Compatible" content="IE=edge"/><!--<![endif]--><meta name="viewport" content="width=device-width,initial-scale=1"/><meta name="x-apple-disable-message-reformatting"/><meta name="format-detection" content="telephone=no,address=no,email=no,date=no,url=no"/><meta name="color-scheme" content="light"/><meta name="supported-color-schemes" content="light"/><title>DeepSeek Just Added Parameters Where There Were None...</title><!--[if mso]><xml><o:OfficeDocumentSettings><o:AllowPNG/><o:PixelsPerInch>96</o:PixelsPerInch></o:OfficeDocumentSettings></xml><![endif]--><style>
:root { color-scheme: light; supported-color-schemes: light; }
body { margin: 0; padding: 0; min-width: 100%!important; -ms-text-size-adjust: 100% !important; -webkit-transform: scale(1) !important; -webkit-text-size-adjust: 100% !important; -webkit-font-smoothing: antialiased !important; }
.body { word-wrap: normal; word-spacing:normal; }
table.mso { width: 100%; border-collapse: collapse; padding: 0; table-layout: fixed; }
img { border: 0; outline: none; }
table { mso-table-lspace: 0px; mso-table-rspace: 0px; }
td, a, span { mso-line-height-rule: exactly; }
#root [x-apple-data-detectors=true],
a[x-apple-data-detectors=true],
#MessageViewBody a { color: inherit !important; text-decoration: inherit !important; font-size: inherit !important; font-family: inherit !important; font-weight: inherit !important; line-height: inherit !important; }
span.MsoHyperlink { color: inherit !important; mso-style-priority: 99 !important; }
span.MsoHyperlinkFollowed { color: inherit !important; mso-style-priority: 99 !important; }
.a { background-color:#dedede; }
.b { background-color:#2a2a2a; }
.c { background-color:#ffffff; }
.d { background-color:#fff0c8; }
.d2 { background-color:#FFFFFF; }
.d3 { background-color:#FFFFFF; }
/* Links inside any heading level share one look: no underline, forced #2C81E5, italic. */
h1 a,
h2 a,
h3 a,
h4 a,
h5 a,
h6 a { text-decoration:none;color:#2C81E5 !important;font-style:italic; }
h1, h1 a, h2, h2 a, h3, h3 a, h4, h4 a, h5, h5 a, h6, h6 a, ul, li, ol, p, p a { margin: 0;padding: 0; }
h1 { font-family:'Trebuchet MS','Lucida Grande',Tahoma,sans-serif;font-weight:700;font-size:28px;color:#2A2A2A;line-height:42px;padding-bottom:4px;padding-top:16px;mso-margin-top-alt:16px;mso-margin-bottom-alt:4px }
h2 { font-family:'Trebuchet MS','Lucida Grande',Tahoma,sans-serif;font-weight:700;font-size:24px;color:#2A2A2A;line-height:36px;padding-bottom:4px;padding-top:16px;mso-margin-top-alt:16px;mso-margin-bottom-alt:4px }
h3 { font-family:'Trebuchet MS','Lucida Grande',Tahoma,sans-serif;font-weight:400;font-size:20px;color:#2A2A2A;line-height:30px;padding-bottom:4px;padding-top:16px;mso-margin-top-alt:16px;mso-margin-bottom-alt:4px }
h4 { font-family:'Trebuchet MS','Lucida Grande',Tahoma,sans-serif;font-weight:400;font-size:18px;color:#2A2A2A;line-height:27px;padding-bottom:4px;padding-top:16px;mso-margin-top-alt:16px;mso-margin-bottom-alt:4px }
h5 { font-family:'Trebuchet MS','Lucida Grande',Tahoma,sans-serif;font-weight:400;font-size:16px;color:#2A2A2A;line-height:24px;padding-bottom:4px;padding-top:16px;mso-margin-top-alt:16px;mso-margin-bottom-alt:4px }
h6 { font-family:'Trebuchet MS','Lucida Grande',Tahoma,sans-serif;font-weight:400;font-size:14px;color:#2A2A2A;line-height:21px;padding-bottom:4px;padding-top:16px;mso-margin-top-alt:16px;mso-margin-bottom-alt:4px }
p { font-family:'Georgia','Times New Roman',serif;font-weight:400;color:#2D2D2D;font-size:16px;line-height:24px;padding-bottom:8px;padding-top:8px;mso-margin-top-alt:8px;mso-margin-bottom-alt:8px; }
p a, .e a, ul a, li a, .h a, .h2 a, .h3 a { word-break:break-word;color:#2C81E5 !important;text-decoration:none;font-style:italic; }
p a span, .e a span, ul a span, li a span { color: inherit }
p .bold { font-weight:bold;color:#2D2D2D; }
p span[style*="font-size"] { line-height: 1.6; }
.f p { font-size:12px;line-height:15px;color:#2D2D2D;padding:0; }
.f p a { color:#2D2D2D !important; }
.g p { font-family:'Helvetica',Arial,sans-serif;font-size:14px;line-height:20px;font-weight:normal;margin:0; }
.g p a { text-decoration: underline; }
.i p { font-family:'Helvetica',Arial,sans-serif;line-height:23px;font-size:15px;color:#2D2D2D; }
.i p a { color:#2D2D2D !important; }
.i2 p { font-family:'Helvetica',Arial,sans-serif;line-height:23px;font-size:15px;color:#2D2D2D; }
.i2 p a { color:#2D2D2D !important; }
.i3 p { font-family:'Helvetica',Arial,sans-serif;line-height:43px;font-size:24px;color:#2D2D2D; }
.i3 p a { color:#2D2D2D !important; }
.h p a { color:#595959 !important; }
.h2 p a { color:#595959 !important; }
.h3 p a { color:#595959 !important; }
.f p a, .i p a, .i2 p a, .i3 p a, .h p a, .h2 p a, .h3 p a { text-decoration:underline; }
.j { border-top:3px solid #ffeb2d; }
.k p { padding-left:15px;padding-bottom:0px;padding-top:6px;mso-margin-top-alt:6px;mso-margin-bottom-alt:0px;mso-margin-left-alt:15px; }
.o { background-color:#FFFFFF;border:1px solid #F1F1F1;border-radius:5px; }
.o p { font-family:'Helvetica',Arial,sans-serif;padding:0px;margin:0px; }
.l p,
.l p a, .l a { font-size:14px;line-height:20px;font-weight: bold;color:#2D2D2D;padding-bottom:6px;mso-margin-bottom-alt:6px;text-decoration:none; }
.m p,
.m p a { font-size:13px;line-height:18px;font-weight:400;color:#2D2D2D;padding-bottom:6px;mso-margin-bottom-alt:6px;text-decoration:none; }
.n p,
.n p a { font-size:12px;line-height:17px;font-weight:400;color:#2D2D2D;padding-bottom:6px;mso-margin-bottom-alt:6px;text-decoration:none; }
.p { background-color:#FFFFFF;max-width:520px;border:1px solid #E1E8ED;border:1px solid rgba(80, 80, 80, 0.3);border-radius:5px; }
.q { font-size:16px;font-family:Helvetica,Roboto,Calibri,sans-serif !important;border:1px solid #e1e8ed;border:1px solid rgba(80, 80, 80, 0.3);border-radius:10px;background-color:#FFFFFF; }
.q p { font-size:16px;font-family:system-ui,Helvetica,Roboto,Calibri,sans-serif !important;color:#222222;padding:4px 0; }
.r { border:1px solid #E1E8ED !important;border-radius:5px; }
.s p { font-size: 14px; line-height: 17px; font-weight: 400; color: #697882; text-decoration: none; }
.t p { font-family:'Helvetica',Arial,sans-serif;font-size:12px;line-height:18px;font-weight:400;color:#000000;font-style:italic;padding:4px 0px 0px; }
.v { border-radius:10px;border:solid 0px #DFD150;background-color:#2C81E5;font-family:'Open Sans','Segoe UI','Apple SD Gothic Neo','Lucida Grande','Lucida Sans Unicode',sans-serif;color:#FFFFFF; }
.v a { text-decoration:none;display:block;color:#FFFFFF; }
.w p { font-size:12px;line-height:15px;font-weight:400;color:#FFFFFF; }
.w p a { text-decoration: underline !important;color:#FFFFFF !important; }
ul { font-family:'Helvetica',Arial,sans-serif;margin:0px 0px 0px 25px !important;padding:0px !important;color:#2D2D2D;line-height:24px;list-style:disc;font-size:16px; }
ul > li { font-family:'Helvetica',Arial,sans-serif;margin:10px 0px 0px 0px !important;padding: 0px 0px 0px 0px !important; color: #2D2D2D; list-style:disc; }
ol { font-family:'Helvetica',Arial,sans-serif;margin: 0px 0px 0px 25px !important;padding:0px !important;color:#2D2D2D;line-height:24px;list-style:decimal;font-size:16px; }
ol > li { font-family:'Helvetica',Arial,sans-serif;margin:10px 0px 0px 0px !important;padding: 0px 0px 0px 0px !important; color: #2D2D2D; }
.e h3,
.e p,
.e span { padding-bottom:0px;padding-top:0px;mso-margin-top-alt:0px;mso-margin-bottom-alt:0px; }
.e span,
.e li { font-family:'Helvetica',Arial,sans-serif;font-size:16px;color:#2D2D2D;line-height:24px; }
.rec { font-family: ui-sans-serif, system-ui, -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, "Helvetica Neue", Arial, "Noto Sans", sans-serif, "Apple Color Emoji", "Segoe UI Emoji", "Segoe UI Symbol", "Noto Color Emoji" !important; }
.rec__button:hover { background-color: #f9fafb !important; }
.copyright a {color: inherit !important; text-decoration: none !important; font-size: inherit !important; font-family: inherit !important; font-weight: inherit !important; line-height: inherit !important;}
.txt_social p { padding: 0; word-break: break-all; }
.table, .table-c, .table-h { border: 1px solid #C0C0C0; }
.table-c { padding:5px; background-color:#FFFFFF; }
.table-c p { color: #2D2D2D; font-family:'Helvetica',Arial,sans-serif !important;overflow-wrap: break-word; }
.table-h { padding:5px; background-color:#F1F1F1; }
.table-h p { color: #2A2A2A; font-family:'Trebuchet MS','Lucida Grande',Tahoma,sans-serif !important;overflow-wrap: break-word; }
@media only screen and (max-width:667px) {
.aa, .w100pc { width: 100% !important; }
.bb img { width: 100% !important; height: auto !important; max-width: none !important; }
.cc { padding: 0px 8px !important; }
.ee { padding-top:10px !important;padding-bottom:10px !important; }
.ff ul, .ff ol { margin: 0px 0px 0px 10px !important;padding: 0px !important; }
.ff li { margin:10px 0px 0px 10px !important; }
.r {height:140px !important;}
.s p { font-size:13px !important;line-height:15px !important; }
.mob-hide {display:none !important;}
.mob-show {display: block !important; width: auto !important; overflow: visible !important; float: none !important; max-height: inherit !important; line-height: inherit !important;}
.mob-stack {width:100% !important;display:block !important;}
.mob-w-full {width:100% !important;}
.mob-block {display:block !important;}
.embed-img {padding:0px 0px 12px 0px !important;}
.socialShare {padding-top:15px !important;}
.rec { padding-left:15px!important;padding-right:15px!important; }
.bodyWrapper { padding:7px 4px 7px 4px !important; }
.social-mobile {float:left !important;margin-top:10px !important;}
}
/* Overrides for viewports 480px wide and below. */
@media screen and (max-width: 480px) {
/* Matches .gg (the outermost layout table) inside .a (the body class) only when that
   .a element directly follows a u element. No u element appears in the visible markup,
   so presumably a mail client injects one. NOTE(review): looks like a client-targeting
   hack; confirm which client. The second width wins where vw units are understood;
   100% stays as the fallback. */
u + .a .gg { width: 100% !important; width: 100vw !important; }
/* .tok-heart and .tok-play are not used in the part of the markup reviewed here. */
.tok-heart { padding-top:75% !important; }
.tok-play { padding-top: 250px !important; }
}
/* Further reduction of the .tok-heart top padding at 320px wide and below. */
@media screen and (max-width: 320px) {
.tok-heart { padding-top:65% !important; }
}
.u { border: 1px solid #CACACA !important; border-radius: 2px !important; background-color: #ffffff !important; padding: 0px 13px 0px 13px !important; font-family:ui-sans-serif,system-ui,-apple-system,BlinkMacSystemFont,"Segoe UI",Roboto,"Helvetica Neue",Arial,"Noto Sans",sans-serif !important;font-size: 12px !important; color: #767676 !important; }
.u a { text-decoration: none; display: block !important; color: #767676 !important; margin: 0px !important; }
.u span, .u img { color: #767676 !important;margin:0px !important; max-height:32px !important;background-color:#ffffff !important; }
</style><!--[if mso]><style type="text/css">
/* This sheet sits inside an if-mso conditional comment, so only clients that honor that condition read it. */
/* Force Arial on headings and on the common text containers. */
h1, h2, h3, h4, h5, h6 {font-family: Arial, sans-serif !important;}
body, table, td, p, a, span {font-family: Arial, sans-serif !important;}
/* Superscript: keep the full font size and raise it without adding line height. */
sup { font-size: 100% !important;vertical-align: .5em !important;mso-text-raise: -1.5% !important;line-height: 0 !important; }
/* List margins: no left margin, 10px right, 20px above and below. */
ul { margin-left:0px !important; margin-right:10px !important; margin-top:20px !important; margin-bottom:20px !important; }
/* NOTE(review): unordered items get the same mso-special-format value (decimal) as the
   ordered items below. Presumably bullet was intended here; confirm in Outlook before changing. */
ul li { margin-left: 0px !important; mso-special-format: decimal; }
ol { margin-left:0px !important; margin-right:10px !important; margin-top:20px !important; margin-bottom:20px !important; }
ol li { margin-left: 0px !important; mso-special-format: decimal; }
/* .listItem is the class carried by the li elements in the message body. */
li.listItem { margin-left:15px !important; margin-top:0px !important; }
.paddingDesktop { padding: 10px 0 !important; }
/* .edm_outlooklist is the div wrapped around the list in the body; it is pulled 20px to the left. */
.edm_outlooklist { margin-left: -20px !important; }
/* Anything tagged .embedImage is hidden for these clients. */
.embedImage { display:none !important; }
</style><![endif]--><!-- __merge_tags_in_links__ --><style>
/* Open Sans, weight 700, upright: loaded from a direct .woff2 file. */
@font-face {
font-family: 'Open Sans';
font-style: normal;
font-weight: 700;
font-display: swap;
src: url('https://fonts.gstatic.com/s/opensans/v40/memSYaGs126MiZpBA-UvWbX2vVnXBbObj2OVZyOOSr4dVJWUgsg-1x4gaVIUwaEQbjA.woff2') format('woff2');
}
/* Open Sans, weight 700, italic.
   NOTE(review): unlike the upright face, this src is a fonts.googleapis.com/css2 address
   with a display=swap query, not a .woff2 file. That endpoint presumably returns a
   stylesheet rather than font data, in which case this face never loads. Confirm, then
   replace it with the direct .woff2 file URL for the italic 700 face. */
@font-face {
font-family: 'Open Sans';
font-style: italic;
font-weight: 700;
font-display: swap;
src: url('https://fonts.googleapis.com/css2?family=Open+Sans:ital,wght@1,700&display=swap') format('woff2');
}
</style></head><body class="a" style="margin:0px auto;padding:0px;word-wrap:normal;word-spacing:normal;background-color:#dedede;"><div role="article" aria-roledescription="email" aria-label="email_name" lang="en" style="font-size:1rem"><div style="display:none;max-height:0px;overflow:hidden;"> And more about Recursive Language Models, LongCat ZigZag Attention, and LoRA RL  ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ ‌ </div><table role="none" width="100%" border="0" cellspacing="0" align="center" cellpadding="0" class="gg"><tr><td align="center" valign="top"><table role="none" width="670" border="0" cellspacing="0" cellpadding="0" class="aa" style="width:670px;table-layout:fixed;"><tr><td class="bodyWrapper" align="center" valign="top" style="padding:7px 7px 7px 7px;"><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" align="center"><tr><td align="center" valign="top" style="border-width:0px 0px 0px 0px;border-style: solid; border-color: #2a2a2a;border-radius:10px 10px 0px 0px;background-color:#ffffff;" class="c"><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" align="center"><tr id="header"><td style="padding:15px 15px 0px 15px;"><div style="padding-top:0px;padding-right:0px;padding-bottom:20px;padding-left:0px;"><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" align="center"><tr><td class="f" align="right" valign="top"><p> January 06, 2026 | <a 
href="https://elink4f7.mail.bycloud.ai/ss/c/u001.c6q0w4g5sodbtO4I1B_pxSdB5RCIH6yy1Fm1CYma3ExdbBinL5YXCU6xtTJpsbvd7IcUI2vTnWLQ-7azABhddwl-mBH61Q-2rpQhYHfoba5VSWse1qlmSu1pywFigAD8JdN_CUHi9soox6_X2EOrkqmZLc924-YMwzLMKjJfbTwhQNQeFBIWBgVhMr9B4i9uZs6Lh0i_ReeaQ20yZ7CDAgSHMMB-JGmS2quL4KE8XLTKq9DISA0hzmEJinZhH58LjtpMroHqUXwyL3pPr5XIbsnsQhFKL3hBtfN8N-yc7LwTGiKZXHEFbXFQTdVvDp2raVspI1ZhV9aXPKLSDQIj8HyZIYnSi9PE4Pc_N-Y12mdj5tcA5xiIKkz-iE9-qnV0wO0k2FwFQBtLfnaYaWzC072DvqrE4E_SXdowLHpgDj1Xooi0k1h0lBLUJSau24idNfjV4rBoP5XxaB8dOvaK6LeS1JM3sBjOKFcklwcKuH-WcSYJYK5k654gWGmR4RLl7wZYvHJDgFpRJzywbhYDIdMQV_4KcYzuy7fGS0FQZwaRJf4O8miY0ZJO-rf2PSVt0Qj19_mE0xbJo3Athf7chsJ2adI0YVWJUi-FoEKZZYMtJz76167racGO7zWv4EF9za3hWvZxpIvujVyBcjW-4aukkOKlIdO9GSjNGYmuW5BWI-6Rgh5w3JAQCAOJzQhDrp5Q8c1C-TEBSgr0SeIwoO8dXlgh7XSuEFziqp7Orlr78kKbqaUaf531syNTJyOav-BK8QyRkyMNnGwRwI_Eh0UnSd7qc2IOPrU6F7u-feUYlJpUx5q0t-VMgHj58URQsItpP1Wa9Tk2cyuvlVOVLCgGV_e6eWFAJjeoOJjrMemjFOsFs9T-hzzEOoYIX01DNCXOHy7fZRyaLYxlsEHaPQ/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h0/h001.ySBr8H9DG4zHTHq2zlJBYuMQ4rEcpI9evwLazrygTQA"><span class="translation_missing" title="translation missing: en.templates.posts.email.header.read_online">Read Online</span></a></p></td></tr><tr><td class="dd" align="center" valign="top" style="padding:15px 0;"><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" align="center"><tr><td align="center" valign="top"><h1 style="text-align:left;font-family:'Open Sans','Segoe UI','Apple SD Gothic Neo','Lucida Grande','Lucida Sans Unicode',sans-serif;font-weight:Bold;font-size:32px;color:#2A2A2A;padding:2px 0;line-height:38px;"> DeepSeek Just Added Parameters Where There Were None... 
</h1><p style="text-align:left;font-family:'Helvetica',Arial,sans-serif;font-weight:normal;font-size:20px;color:#3E3E3E;padding:5px 0;line-height:24px;"> And more about Recursive Language Models, LongCat ZigZag Attention, and LoRA RL </p></td></tr></table></td></tr><tr><td style="line-height:0;"><div data-open-tracking="true"> <img src="https://elink4f7.mail.bycloud.ai/ss/o/u001.3wmUuY8gEWd4_869a_eXcg/4n2/b1HjxW_sTXWv5GsEHVrZdQ/ho.gif" alt="" width="1" height="1" border="0" style="height:1px !important;width:1px !important;border-width:0 !important;margin-top:0 !important;margin-bottom:0 !important;margin-right:0 !important;margin-left:0 !important;padding-top:0 !important;padding-bottom:0 !important;padding-right:0 !important;padding-left:0 !important;"/> </div></td></tr></table></div></td></tr><tr id="content-blocks"><td class="email-card-body" align="center" valign="top" style="padding-bottom:15px;"><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" align="center"><tr><td id="nov-18-th-nov-24-th-33-latest-ai-re" class="dd" align="left" valign="top" style="color:#2A2A2A;font-weight:normal;padding:0px 28px;text-align:left;"><h6 style="color:#2A2A2A;font-weight:normal;mso-line-height-alt:87.5%;"><i>Dec 31st ~ Jan 6th</i><br><i>#89 Latest AI Research Explained Simply</i></h6></td></tr><tr><td><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" style=""><tr><td bgcolor="#222222" style="background-color:#222222;padding:0.0px 0.0px 0.0px 0.0px;"><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0"><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"></p></td></tr></table></td></tr></table></td></tr><tr><td id="industry-news-in-1-line" class="dd" align="left" valign="top" style="color:#2A2A2A;font-weight:Bold;padding:0px 28px;text-align:left;"><h2 style="color:#2A2A2A;font-weight:Bold;mso-line-height-alt:150.0%;">🗞️ 
Industry News in 1 Line</h2></td></tr><tr><td style="padding-bottom:12px;padding-left:50px;padding-right:40px;padding-top:12px;" class="ee"><div style="margin-left:0px;" class="edm_outlooklist"><ol start="1" style="list-style-type:decimal;margin:0px 0px;padding:0px 0px 0px 0px;"><li class="listItem ultext"><p style="mso-line-height-alt:150.0%;padding:0px;text-align:left;word-break:break-word;"><span style="background-color:#e0e0e0;"><span style="color:rgb(255, 58, 58);font-size:0.6rem;">♥ 7.2k</span></span> NVIDIA has announced <a class="link" href="https://elink4f7.mail.bycloud.ai/ss/c/u001.sa7HIrCkEzyny8lstY55mLTYRGG0aKtvMtefff0l07Me71fBV2-WuPt05UAeBe7S7tKag97boH6pq6XutQkAu0cfX8ldIjtOeB2KYgj_eBStIECAlmRe1MlwHy20NbZC8sSkY7D2mXFiJcEZRIRzDf6BX3toC4D5QaWCKsfjaZbGiSsuLM5soLRB90KveotkM1iyQTudZBDlxje5gCQ5-JsvdRyST0IIUEiEBdwnWYc8l_EEguHT5I1KA1zctgvFjbOU74Vgens1w3q40ulNsCMhRVjvq83mclvsNIKzR3W_UriInXg-aFIfri1WmiwFbBW_XAnP8blfNHT3stCTtLfHhxZ0WVxgsdOluxDNvq8/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h1/h001.mtXEYSBtw38Y4a8rEawaLoTMKGoApEHPVMFAS0BHK5M" target="_blank" rel="noopener noreferrer nofollow"><span>Alpamayo</span></a>, a new “thinking, reasoning” autonomous-vehicle AI. The first rollout is slated to <b>reach U.S. roads</b> in Q1 2026, starting with the all-new Mercedes-Benz CLA. NVIDIA’s first model, <b>Alpamayo 1 (10B parameters)</b>, uses video to generate driving trajectories and reasoning traces, now available <a class="link" href="https://elink4f7.mail.bycloud.ai/ss/c/u001.CxDkkVpJsBdVoe83c_tBWvVJJJpDteHEtluzCRcV1LYKukoKpMTA_6WEbz1J8BMir02lHqKuPkS3mRQNhp39yCcPYdh6HT7trVjXqvpsTLd7M7nW0anmDL0PrgdOZH9EryfYTecRMsnZaqUJLfxCnXbRqe2t78IERVI3NgsLNR4k-SR3XDyNW-6fCX_eD3YCSAU2NgmXovYeqc0MiZFmCLVaAp5h1FslvMBR3AO5d6s5l9l3sOVVjPXCoUvbHD9K9I98tqn2nyZnxEt_aGlsQvG4MIxDNRmCq38OmOOqbUI/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h2/h001.FqdL_o6EKxVqTCW2NW9xFjX7WolSdi_ZK_c3NAEF-vY" target="_blank" rel="noopener noreferrer nofollow"><span>on HuggingFace</span></a>. 
</p><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:500px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/f68d59e0-555a-4d9f-a81c-4f9f23d0a1a7/nvidia-alpamayo.jpg?t=1767717691" alt="" height="auto" width="500" style="display:block;width:100%;" border="0"/></td></tr></table></li><li class="listItem ultext"><p style="mso-line-height-alt:150.0%;padding:0px;text-align:left;word-break:break-word;"><span style="background-color:#e0e0e0;"><span style="color:rgb(255, 58, 58);font-size:0.6rem;">♥ 17k</span></span> Boston Dynamics has released a new video of its upgraded next-gen humanoid robot, <a class="link" href="https://elink4f7.mail.bycloud.ai/ss/c/u001.oB7zuO_W-X4Toa45C28ng-1l9mAqQ0cB2UErjCNG8Z2-NV12tCZeMPJFLFqeoWpVjWUnAjuME0nOXSR5sjt1f9dtTYJbRuonvGKsodvA_Yljum1Hi4rvSrlTi5O0--XkWQLac4XRxDRopPn9ZIO-91zf_ArPlUbOKEivPUiIhAot6l0dQVhMHvxDsyu9pGuibDIQrYfpKIiJuRzo9oXdgfZJLUwb0eLacn47qnhxEJ2legPoGggm22neHCLY98gksrKTszPNiWw8CN13_PODQ0w_k5oZmzZT_SyHqH_4Fv0/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h3/h001.s4eNZ6Tj1VTBkEmv-SqwCI-KJkWpIBJpUBM5Bn4IjQM" target="_blank" rel="noopener noreferrer nofollow"><span>Atlas</span></a>, now fully electric with a <b>4-hour swappable battery</b> for continuous operation. Atlas stands 6'2", weighs 198 lbs, has 56 degrees of freedom, can lift 110 lbs (66 lbs sustained), and reach 7.5 ft, using tactile, reconfigurable hands to adapt grip in real time. 
</p><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:532px;"><a href="https://elink4f7.mail.bycloud.ai/ss/c/u001.oB7zuO_W-X4Toa45C28ng-1l9mAqQ0cB2UErjCNG8Z2-NV12tCZeMPJFLFqeoWpVjWUnAjuME0nOXSR5sjt1f9dtTYJbRuonvGKsodvA_Yljum1Hi4rvSrlTi5O0--XkWQLac4XRxDRopPn9ZIO-91zf_ArPlUbOKEivPUiIhAot6l0dQVhMHvxDsyu9pGuibDIQrYfpKIiJuRzo9oXdgf4CnA9MUXj8Af0T0I06jax7SaM_AMPs-qMbi5HT2J5LoyFWzbLRvbsxMgIcqz_MzItf2DySQBa4V6YnweoUZ_s/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h4/h001.U4t8lylI36ITbKerov5uEj91Sokt-zzClOufN8GdxAk" target="_blank" rel="noopener noreferrer nofollow" style="text-decoration:none;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/6d548227-d06a-4a5d-882a-a39fe42a8dc2/image.png?t=1767717649" alt="" height="auto" width="532" style="display:block;width:100%;" border="0"/></a></td></tr></table></li><li class="listItem ultext"><p style="mso-line-height-alt:150.0%;padding:0px;text-align:left;word-break:break-word;"><span style="background-color:#e0e0e0;"><span style="color:rgb(255, 58, 58);font-size:0.6rem;">♥ 1k</span></span> Liquid AI has released <a class="link" href="https://elink4f7.mail.bycloud.ai/ss/c/u001.DUiN96-Eq7pUHzwEhy5j25vh6ZeGvucFird4NDCQc48SRigd0ZJan0RiLACXrthuOCStWngUGzDAXqSx-ZCswZBHf1fI5Xnwyy4nZJ8Nybr5e3Ng5rNwbepbgJ-olO8lCPfJsl-xPGiKW4kFJ-gWAng1xa22xXP16qd_qqVrNUIthqj_lAwrQGGjRnhUT_TZqe7taUnq4pssBuDw8VYnwfvtpC_fEDWlHs8eIMOM90oRIi_8bzot_I0taHWJDfoZ22LAv-QEjwORLG0ccOKXf0oT4hj_ldVnBpDR7JHMgZgvklvenJnquSV9ZRVNaEZ05QQ-NQ4u3gNkJMFh4F8oigRj1Lm8ueAfutpbSq59IE8/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h5/h001.8grt425g3200PCpvI9_gmZrgvDFVJBaIt7WnuTL8ik0" target="_blank" rel="noopener noreferrer nofollow"><span>LFM2.5</span></a>, its most capable family of <b>tiny on-device foundation models</b> (~1B class). 
Built on the LFM2 hybrid, device-optimized architecture, LFM2.5 scales pretraining from 10T → 28T tokens and expands RL post-training to improve instruction following. The initial open-weight lineup (including 1.2B Base/Instruct, plus vision-language and native audio-language variants) is available on <a class="link" href="https://elink4f7.mail.bycloud.ai/ss/c/u001.CxDkkVpJsBdVoe83c_tBWno2StfHgkdXyV9QnRyXhkufQ72eg52KTAi_AUEOuJJ1nyhY2QsSJNFMIk3USx_CGJmattP9pDORiPpywiUUTo0syonysuTZuJmsx2APnlpaKZLxEvtPDRjKjAveymC0sG1vcn0vrFL393Eg7JU57ASewCLlC-LcD8cys61n_9sM_4I1m3rh_6pUsawdluixVkfRv7LsXt0syh93STZVWq4wWZc0dnuKKPELZuwgY-1xK0hrTvEcOqCKOzcKJ5TNIeBhPjRmLIETKAW32YaVUcI/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h6/h001.bLiYwFfyrpqXzaSgUMhbIiCbEwQjOEoY37ntzzC6TiE" target="_blank" rel="noopener noreferrer nofollow"><span>HuggingFace</span></a>. </p><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:500px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/7fa4ed84-8984-4c6c-b34f-1d1eba1470b1/image.png?t=1767717792" alt="" height="auto" width="500" style="display:block;width:100%;" border="0"/></td></tr></table></li></ol></div></td></tr><tr><td><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" style=""><tr><td bgcolor="#222222" style="background-color:#222222;padding:0.0px 0.0px 0.0px 0.0px;"><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0"><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"></p></td></tr></table></td></tr></table></td></tr><tr><td><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" style=""><tr><td bgcolor="transparent" style="background-color:transparent;border-color:#2C81E5;border-style:solid;border-width:5px;padding:0.0px 0.0px 0.0px 0.0px;"><table 
role="none" width="100%" border="0" cellspacing="0" cellpadding="0"><tr><td class="dd" align="left" valign="top" style="color:#2A2A2A;font-weight:Bold;padding:0px 28px;text-align:left;"><h2 style="color:#2A2A2A;font-weight:Bold;mso-line-height-alt:150.0%;"><span style="">Support My Newsletter</span></h2></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"><span style="color:rgb(34, 34, 34);font-family:Georgia, 'Times New Roman', serif;font-size:16px;">As I aim to keep this newsletter free forever, your support means a lot. If you like reading The AI Timeline, consider forwarding it to another research enthusiast. It helps us keep this up for free!</span></p></td></tr><tr><td align="center" valign="top"><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" align="center"><tr><td align="center" valign="top" style="font-size:0px;line-height:0px;padding:30px 0px 30px;" class="dd"><table class="j" role="none" width="50%" border="0" cellspacing="0" cellpadding="0" align="center"><tr><td> </td></tr></table></td></tr><tr><td class="dd" align="left" valign="top" style="color:#2A2A2A;font-weight:Bold;padding:0px 28px;text-align:left;"><h2 style="color:#2A2A2A;font-weight:Bold;mso-line-height-alt:150.0%;">Share The AI Timeline</h2></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> You currently have <strong>0</strong> referrals. 
</p></td></tr><tr><td align="left" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; display:none;width:0px;max-height:0px;overflow:hidden;mso-hide:all;height:0;font-size:0;max-height:0;line-height:0;margin:0 auto;" class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 0;"><tr><td align="center" valign="top" style="width:313px;"><a href="https://elink4f7.mail.bycloud.ai/ss/c/u001.c6q0w4g5sodbtO4I1B_pxWc4htTObwdorovK0nFHVH-4pUdVE0ELYH5DsNemk732SjNwhPNJ25r0O8B5vYifsGNUqyW5TiZkyMsF1yreu0byy2KW36J1wDdpoLuXg2TU1F1OW8OHoHaU4-ZmrZpPU4RN-crQCEimD190CSn9fPuxpIRojBJyu1VfV5KtQD3QMVdSg2JrjEj5-xm4r4E12Whf08itqPCb9Q5W0X4rt3ubYkqCmWnLeZpmb3_RZcbIk0UE5wZnFLCQJHLFs0qZ0OGpXp89o1HU4mWIBur5Or4tQGm5M_Y8m5PvTEfYfxLRyrcRv7GyVs5oLtFfiySZ2SqtZypLA-h50h61p0uPiA7iA_PiMqlVLtM-87XL33VZi05_O3UTpWE_0nAzFRJ4TW1ayz3_vn4Zlp9IERdbnnD61McS5GXBelKUeBLoqNKgcYTm8jBGhEIGBJ873Uvp3cAjt7ndntRNWYvyp1zxe5a87sDDw-k3VXE1327VudgY00DQ3iwdssqDiTaJZnNUI5aqjOeHhuZO6Gu_0C8rNhKI18fsc9KMB8K3xkon8hwAVAKddNEGC59XqQUg2vpg0JM29VMz2BzXC8phjkdgISXcbZ78n13f_Bh6fN2HjWporYhB54KMfDafOYVGvDwgyhdZNII_D6TO01Zg6R6tOtY/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h7/h001.QKzDCLTtb0D8Kp52t5iGzhVTJDmUaVg5rA5v5qNEEns" rel="noopener noreferrer nofollow" style="text-decoration:none;" target="_blank"><img src="" alt="" height="auto" width="313" style="display:block;width:100%;" border="0"/></a></td></tr></table></td></tr><tr class="btn_row"><td valign="top" style="padding-bottom:14px;padding-left:28px;padding-right:28px;padding-top:14px;text-align:left;width:100%;word-break:break-word;" class="dd"><table width="100%" role="none" border="0" cellspacing="0" cellpadding="0" style="margin:14px auto 14px auto;"><tr><td align="left" valign="middle"><table role="none" border="0" cellspacing="0" cellpadding="0"><tr><td style="background-color:#2C81E5;border-radius:8px;mso-padding-alt:14px 20px;" class="btn"><a 
href="https://elink4f7.mail.bycloud.ai/ss/c/u001.c6q0w4g5sodbtO4I1B_pxWc4htTObwdorovK0nFHVH-4pUdVE0ELYH5DsNemk732SjNwhPNJ25r0O8B5vYifsGNUqyW5TiZkyMsF1yreu0byy2KW36J1wDdpoLuXg2TU1F1OW8OHoHaU4-ZmrZpPU4RN-crQCEimD190CSn9fPuxpIRojBJyu1VfV5KtQD3QMVdSg2JrjEj5-xm4r4E12Whf08itqPCb9Q5W0X4rt3ubYkqCmWnLeZpmb3_RZcbIk0UE5wZnFLCQJHLFs0qZ0OGpXp89o1HU4mWIBur5Or4tQGm5M_Y8m5PvTEfYfxLRyrcRv7GyVs5oLtFfiySZ2SqtZypLA-h50h61p0uPiA7iA_PiMqlVLtM-87XL33VZi05_O3UTpWE_0nAzFRJ4TW1ayz3_vn4Zlp9IERdbnnD61McS5GXBelKUeBLoqNKgcYTm8jBGhEIGBJ873Uvp3cAjt7ndntRNWYvyp1zxe5a87sDDw-k3VXE1327VudgY00DQ3iwdssqDiTaJZnNUI5aqjOeHhuZO6Gu_0C8rNhKI18fsc9KMB8K3xkon8hwAVAKddNEGC59XqQUg2vpg0JM29VMz2BzXC8phjkdgISXcbZ78n13f_Bh6fN2HjWporYhB54KMfDafOYVGvDwgyhdZNII_D6TO01Zg6R6tOtY/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h8/h001.i2cmSC493C5-twAzsm5aiTWxxSxlbDssH-8xd2Gb5B8" target="_blank" rel="noopener noreferrer nofollow" style="background-color:#2C81E5;border-radius:8px;color:#FFFFFF;display:inline-block;font-family:'Open Sans','Segoe UI','Apple SD Gothic Neo','Lucida Grande','Lucida Sans Unicode',sans-serif;font-size:16px;font-weight:normal;line-height:18px;padding:14px 20px;text-decoration:none;"> Click to Share </a></td></tr></table></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> Or copy and paste this link to others: <a class="link" href="https://mail.bycloud.ai/subscribe?ref=6SqUHb8KiF&_bhlid=bf7a73b936aab597b0df9777ef50b28c5a049d32" target="_blank" rel="noopener noreferrer nofollow" clicktracking="off"><span>https://mail.bycloud.ai/subscribe?ref=6SqUHb8KiF</span></a></p></td></tr><tr><td align="center" valign="top" style="font-size:0px;line-height:0px;padding:30px 0px 30px;" class="dd"><table class="j" role="none" width="50%" border="0" cellspacing="0" cellpadding="0" align="center"><tr><td> </td></tr></table></td></tr></table></td></tr><tr class="btn_row"><td valign="top" 
style="padding-bottom:14px;padding-left:28px;padding-right:28px;padding-top:14px;text-align:center;width:100%;word-break:break-word;" class="dd"><table width="100%" role="none" border="0" cellspacing="0" cellpadding="0" style="margin:14px auto 14px auto;"><tr><td align="center" valign="middle"><table role="none" border="0" cellspacing="0" cellpadding="0"><tr><td style="background-color:#2C81E5;border-radius:8px;mso-padding-alt:14px 20px;" class="btn"><a href="https://elink4f7.mail.bycloud.ai/ss/c/u001.zNfxTwpJFmrsCuJJphGRkKSrCVph9-fOYkcjx4VfJRyUw-Iv7GHKoTyxc57iFdcabeJrUAXVgdJXAkTcc7bS82ZF6NEkQHkUBgqGaM66RDbyMBpTK8pOBl6aVCc1cb8u-t3pD0dZw7DwoSxp9xqCkawZYqRg4asGOqOcs6FCGYmxU9peR5UnvkkaBJahF8Wn1gqwRPttn22xr3hjD4_D5DKGQPSeokr0Y3joOkcmAg9KZmy7REOO1uHjq4-twoGFOs2LLnshxACAAp6AWvj0_A/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h9/h001.hVkxpAQqRcYzUH_2G7UCarGYp8WBRfVZVBkF1w1XupI" target="_blank" rel="noopener noreferrer nofollow" style="background-color:#2C81E5;border-radius:8px;color:#FFFFFF;display:inline-block;font-family:'Open Sans','Segoe UI','Apple SD Gothic Neo','Lucida Grande','Lucida Sans Unicode',sans-serif;font-size:16px;font-weight:normal;line-height:18px;padding:14px 20px;text-decoration:none;"> Check Out My Patreon </a></td></tr></table></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"><span style=""><a class="link" href="https://elink4f7.mail.bycloud.ai/ss/c/u001.tLfGW26lAwaS9gFg17HSoGymQ3NNPtd5dE5MV_8UgjLbPKYFbBPtV6oAT4VYSncNiXOMe0ETHKViEemkGKRuti97gDsqlNJXOC9cMEoZt4vqGEMzd3CYIoAvubE-GTMMAL1dvUxqvavfUMtVmTn-D9-px1H0hF-6GNLiNZYJGBiI4gap_dOWrNROSvlX91xqePyZw4YoYPCLatsyc58TnwdvkVko3YpqmHzNQ1-0QlgQTCOSCWLyBxQxLyfSS71Uou8sFJZVtNh2wehnXMIrUw/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h10/h001.gR3UQ7rX47ZXo_EIFVmpAXiTEsUTiTD-RDrU3FW0vMU" target="_blank" rel="noopener noreferrer nofollow"><span>Advertise with The AI Timeline! 
</span></a></span></p></td></tr></table></td></tr></table></td></tr><tr><td><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" style=""><tr><td bgcolor="#222222" style="background-color:#222222;padding:0.0px 0.0px 0.0px 0.0px;"><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0"><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"></p></td></tr></table></td></tr></table></td></tr><tr><td id="recursive-language-models" class="dd" align="left" valign="top" style="color:#2A2A2A;font-weight:Bold;padding:0px 28px;text-align:left;"><h2 style="color:#2A2A2A;font-weight:Bold;mso-line-height-alt:150.0%;">Recursive Language Models</h2></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"><i>Zhang et al. [MIT CSAIL]</i></p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"><span style="background-color:#e0e0e0;"><span style="color:rgb(255, 58, 58);font-size:0.6rem;"> ♥ 2k </span></span><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> </span><span style="background-color:#e0e0e0;"><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> LM Context </span></span><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> </span></p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> LLMs are making significant progress and can handle several complex tasks, but they struggle when we try to process massive amounts of information in a context window, like trying to read a library of books simultaneously without losing the plot. 
Even the most advanced models suffer from a phenomenon known as "context rot," where their reasoning ability degrades as the context is used up over time. </p></td></tr><tr><td align="center" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; " class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:626px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/e76afe45-4fcc-4250-93ce-2b85d5677ef1/CleanShot_2026-01-06_at_18.56.39_2x.png?t=1767706010" alt="" height="auto" width="626" style="display:block;width:100%;" border="0"/></td></tr><tr><td align="center" valign="top" class="t" style="width:626px; padding: 4px 0px 4px 0px;"><p>A Recursive Language Model (RLM) treats prompts as part of the environment.</p></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> This paper tries to determine if it is possible to enable AI to tackle long-horizon tasks involving millions of words without needing a bigger brain, but rather a smarter way to manage information. </p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> The team introduced a concept called Recursive Language Models (RLMs). Instead of forcing a neural network to ingest a massive document all at once, this approach treats the text as an external part of the environment, much like a reference book sitting on a desk rather than a memory in one's head. 
</p></td></tr><tr><td align="center" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; " class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:626px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/c35bac89-c7b3-455b-b7da-5e14b93437f9/CleanShot_2026-01-06_at_18.57.14_2x.png?t=1767706045" alt="" height="auto" width="626" style="display:block;width:100%;" border="0"/></td></tr><tr><td align="center" valign="top" class="t" style="width:626px; padding: 4px 0px 4px 0px;"><p>Performance comparison of different methods across long-context benchmarks of varying complexity.</p></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> The AI effectively acts as a programmer, writing code to peek into specific parts of the text, break complex problems into smaller chunks, and recursively call upon copies of itself to analyze those snippets. This strategy allowed models to successfully handle inputs up to two orders of magnitude larger than their designed limits. </p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> On complex reasoning tasks, this method dramatically <b>outperformed standard models</b> and summarization techniques, while maintaining high accuracy even as the information load grew immense. 
</p></td></tr><tr class="btn_row"><td valign="top" style="padding-bottom:14px;padding-left:28px;padding-right:28px;padding-top:14px;text-align:center;width:100%;word-break:break-word;" class="dd"><table width="100%" role="none" border="0" cellspacing="0" cellpadding="0" style="margin:14px auto 14px auto;"><tr><td align="center" valign="middle"><table role="none" border="0" cellspacing="0" cellpadding="0"><tr><td style="background-color:#2C81E5;border-radius:8px;mso-padding-alt:14px 20px;" class="btn"><a href="https://elink4f7.mail.bycloud.ai/ss/c/u001.DUiN96-Eq7pUHzwEhy5j28yjf9KIXZdsXoh1WlHvvKm9pWL7gLGYulIDeY5iXIFelDUbWJ2v2qgj6eLSj2kY2BJJv6Iqs1rbmAGdHMzME8yEqqRQJnjtPFX3SFek209rFWf3MVkm-kjQYaTdyvsH6bdlH-glC2TLgMTMafCqBJHvMZtJfQyP2lsFLzjo99gCTqXDZW0vg99VeG_bv8P7HvvaE49q2bWiZ-WSBZY20PcFLXwiYT5LzhhaIzW1wTkIGCq1sGdaXwskKqLOHRvazA/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h11/h001.oPyjZFeU1yakinEihd27DZEmkGm8S_ZGuCZ5tYLcQS0" target="_blank" rel="noopener noreferrer nofollow" style="background-color:#2C81E5;border-radius:8px;color:#FFFFFF;display:inline-block;font-family:'Open Sans','Segoe UI','Apple SD Gothic Neo','Lucida Grande','Lucida Sans Unicode',sans-serif;font-size:16px;font-weight:normal;line-height:18px;padding:14px 20px;text-decoration:none;"> Read Full Paper </a></td></tr></table></td></tr></table></td></tr><tr><td><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" style=""><tr><td bgcolor="#222222" style="background-color:#222222;padding:0.0px 0.0px 0.0px 0.0px;"><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0"><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"></p></td></tr></table></td></tr></table></td></tr><tr><td id="m-hc-manifold-constrained-hyper-con" class="dd" align="left" valign="top" style="color:#2A2A2A;font-weight:Bold;padding:0px 28px;text-align:left;"><h1 
style="color:#2A2A2A;font-weight:Bold;mso-line-height-alt:175.0%;"><b>mHC: Manifold-Constrained Hyper-Connections</b></h1></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> Xie<i> et al. [</i>DeepSeek AI<i>]</i></p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"><span style="background-color:#e0e0e0;"><span style="color:rgb(255, 58, 58);font-size:0.6rem;"> ♥ 3k </span></span><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> </span><span style="background-color:#e0e0e0;"><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> Residual Connection </span></span><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> </span><span style="background-color:#e0e0e0;"><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> bycloud’s pick </span></span><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> </span></p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> Transformers lean heavily on residual connections because they keep information and gradients flowing cleanly through many layers. Hyper-Connections (HC) try to push this idea further by widening the residual stream into multiple parallel “streams” and learning how to mix them, so the model can exchange information across depth without increasing the core layer FLOPs much. </p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> The problem is that the more freedom HC gives those cross-stream mixing matrices, the less it behaves like an identity path. 
When you stack many layers, the product of these unconstrained residual mixing matrices can amplify or shrink signals unpredictably, which shows up as training instability in large runs. In their 27B setup, the paper reports a loss surge for HC around 12k steps and extremely large composite “gain magnitudes” that can peak around 3000, a sign of exploding residual dynamics. </p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> Their fix is <b>Manifold-Constrained Hyper-Connections (mHC)</b>. Instead of letting the residual mixing matrix be anything, they project it onto the manifold of doubly stochastic matrices, meaning all entries are non-negative and every row and column sums to 1. That keeps the residual pathway closer to a stable identity-like behavior while still allowing streams to mix, since each stream becomes a convex combination of the others rather than an arbitrary linear remapping. 
</p></td></tr><tr><td align="center" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; " class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:626px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/68e2e976-8c5b-41ea-be3a-eb1fdde71892/CleanShot_2026-01-06_at_18.59.11_2x.png?t=1767706172" alt="" height="auto" width="626" style="display:block;width:100%;" border="0"/></td></tr><tr><td align="center" valign="top" class="t" style="width:626px; padding: 4px 0px 4px 0px;"><p>Illustrations of Residual Connection Paradigms.</p></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> Practically, they build this projection with the Sinkhorn-Knopp algorithm, running a limited number of iterations (they use 20) to turn an unconstrained matrix into an approximately doubly stochastic one. Because doubly stochastic matrices stay doubly stochastic under multiplication, the stability property should persist even when you multiply many layers’ residual mappings together, which is exactly where HC would tend to drift. 
</p></td></tr><tr><td align="center" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; " class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:626px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/8dfc6c2b-9827-4b95-9b6f-254704dba951/CleanShot_2026-01-06_at_19.00.20_2x.png?t=1767706233" alt="" height="auto" width="626" style="display:block;width:100%;" border="0"/></td></tr><tr><td align="center" valign="top" class="t" style="width:626px; padding: 4px 0px 4px 0px;"><p>Visualizations of Learnable Mappings.</p></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> They also treat systems cost as part of the method. Widening the residual stream increases memory traffic and activation storage, so they add fused kernels, mixed precision kernels, and selective recomputation, and adjust pipeline overlap. With expansion rate n = 4, they report only about a 6.7% training time overhead after these optimizations. 
</p></td></tr><tr><td align="center" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; " class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:626px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/0b439787-6306-4463-a4ce-910a14d863dc/CleanShot_2026-01-06_at_19.00.59_2x.png?t=1767706269" alt="" height="auto" width="626" style="display:block;width:100%;" border="0"/></td></tr><tr><td align="center" valign="top" class="t" style="width:626px; padding: 4px 0px 4px 0px;"><p>Training Stability of Manifold-Constrained Hyper-Connections (mHC).</p></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> On results, mHC appears to keep HC’s accuracy benefits while avoiding its instability. In the 27B run, mHC reaches a final training loss reduction of 0.021 versus the baseline and keeps gradient norms closer to baseline behavior. 
</p></td></tr><tr><td align="center" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; " class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:626px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/906b37b3-675b-43b5-a749-e82ec63cc1bb/image.png?t=1767719908" alt="" height="auto" width="626" style="display:block;width:100%;" border="0"/></td></tr><tr><td align="center" valign="top" class="t" style="width:626px; padding: 4px 0px 4px 0px;"><p>mHC benchmark against baseline</p></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> On downstream benchmarks, mHC beats the baseline across the board and usually edges out HC too, for example improving BBH and DROP relative to HC by about 2.1 and 2.3 points, respectively. On the stability metrics, the composite gain that could hit ~3000 in HC stays bounded around ~1.6 in mHC, which matches the paper’s story that constraining the residual topology can make this kind of widened residual stream scale more safely. 
</p></td></tr><tr class="btn_row"><td valign="top" style="padding-bottom:14px;padding-left:28px;padding-right:28px;padding-top:14px;text-align:center;width:100%;word-break:break-word;" class="dd"><table width="100%" role="none" border="0" cellspacing="0" cellpadding="0" style="margin:14px auto 14px auto;"><tr><td align="center" valign="middle"><table role="none" border="0" cellspacing="0" cellpadding="0"><tr><td style="background-color:#2C81E5;border-radius:8px;mso-padding-alt:14px 20px;" class="btn"><a href="https://elink4f7.mail.bycloud.ai/ss/c/u001.fUNb4GdFo9D3F8WuLArtoZr-f6keVrG1GKuVv1wQKvpRAu1w5EIFjqBvw_O83B36D47UwwwBK6e7HkdDuGGnLcB2AKa7UbswbIZ5EpaWLS6gcHLXCjHv64zHfigfHSRy1fX0W_1eIBpFqHp8lRYxWjuo6bclPUhCKXZaW1g_XDWlTYJPu4-KjawOMAbAhq55KHvVy8z0ucTPVKoExyGVKxOBARRFQ3KlCHbH5fXyabCWJBYCinngqihnyRBmyfN3HyI8hJBEtqD--7Cxn7ppSQ/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h12/h001.ehjT_LOHjL59_RoaXc0s2mx4dIqclIBdln16_wkjfiE" target="_blank" rel="noopener noreferrer nofollow" style="background-color:#2C81E5;border-radius:8px;color:#FFFFFF;display:inline-block;font-family:'Open Sans','Segoe UI','Apple SD Gothic Neo','Lucida Grande','Lucida Sans Unicode',sans-serif;font-size:16px;font-weight:normal;line-height:18px;padding:14px 20px;text-decoration:none;"> Read Full Paper </a></td></tr></table></td></tr></table></td></tr><tr><td><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" style=""><tr><td bgcolor="#222222" style="background-color:#222222;padding:0.0px 0.0px 0.0px 0.0px;"><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0"><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"></p></td></tr></table></td></tr></table></td></tr><tr><td id="efficient-context-scaling-with-long" class="dd" align="left" valign="top" style="color:#2A2A2A;font-weight:Bold;padding:0px 28px;text-align:left;"><h1 
style="color:#2A2A2A;font-weight:Bold;mso-line-height-alt:175.0%;"><b>Efficient Context Scaling with LongCat ZigZag Attention</b></h1></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> Zhang<i> et al. [</i>Meituan<i>]</i></p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"><span style="background-color:#e0e0e0;"><span style="color:rgb(255, 58, 58);font-size:0.6rem;"> ♥ 211 </span></span><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> </span><span style="background-color:#e0e0e0;"><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> LLM Attention </span></span><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> </span></p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> There is a bottleneck in how AI processes information: as models try to "read" longer documents (like entire books, legal archives, or massive codebases), the computational cost skyrockets because the system traditionally tries to pay equal attention to every single connection between every word. </p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> The research team sought a way to break this inefficient cycle, aiming to create a model that can handle up to one million tokens of context without the computational weight that comes with it. 
</p></td></tr><tr><td align="center" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; " class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:626px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/a3787feb-b2f5-4ab2-aabd-bd36da2fb43f/CleanShot_2026-01-06_at_19.20.26_2x.png?t=1767707437" alt="" height="auto" width="626" style="display:block;width:100%;" border="0"/></td></tr><tr><td align="center" valign="top" class="t" style="width:626px; padding: 4px 0px 4px 0px;"><p>The illustration of LongCat ZigZag Attention (LoZA), which involves first calibration and then training for realizing the sparsity.</p></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> The team discovered a method called <b>LongCat ZigZag Attention (LoZA)</b>, which effectively teaches the model how to "skim" intelligently without missing the details. By carefully calibrating the system, researchers identified which layers of the network were doing the most important work and which could be optimized. 
</p></td></tr><tr><td align="center" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; " class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:626px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/b1df88f2-cc3f-49bf-bed1-84c241ee91da/CleanShot_2026-01-06_at_19.21.19_2x.png?t=1767707493" alt="" height="auto" width="626" style="display:block;width:100%;" border="0"/></td></tr><tr><td align="center" valign="top" class="t" style="width:626px; padding: 4px 0px 4px 0px;"><p>The efficiency of LoZA. The relative cost and speed-up are practically measured on H20 clusters.</p></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> They found a streamlined structure hidden inside the larger model, converting about half of the attention mechanisms to a "sparse" mode that focuses only on essential information. They found that by retraining the model mid-process after this switch, they could lock in significant speed improvements while maintaining the same high level of intelligence and accuracy as the heavier, original models. 
</p></td></tr><tr><td align="center" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; " class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:626px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/18d69597-1672-4cab-a28d-cc440dfe229a/CleanShot_2026-01-06_at_19.21.54_2x.png?t=1767707523" alt="" height="auto" width="626" style="display:block;width:100%;" border="0"/></td></tr><tr><td align="center" valign="top" class="t" style="width:626px; padding: 4px 0px 4px 0px;"><p>The effectiveness of LongCat-Flash-Exp-Chat across different context lengths on MRCR. </p></td></tr></table></td></tr><tr class="btn_row"><td valign="top" style="padding-bottom:14px;padding-left:28px;padding-right:28px;padding-top:14px;text-align:center;width:100%;word-break:break-word;" class="dd"><table width="100%" role="none" border="0" cellspacing="0" cellpadding="0" style="margin:14px auto 14px auto;"><tr><td align="center" valign="middle"><table role="none" border="0" cellspacing="0" cellpadding="0"><tr><td style="background-color:#2C81E5;border-radius:8px;mso-padding-alt:14px 20px;" class="btn"><a href="https://elink4f7.mail.bycloud.ai/ss/c/u001.fUNb4GdFo9D3F8WuLArtoZr-f6keVrG1GKuVv1wQKvqgNEL01EOU6GQub1AdkhEVAFvnuW_r7BGlt-GRD7nN_qLXqes3a4sEgQ4w_mKahKb71NgDCXSAhptGdEwx-1B7h692eU_5wDUQIFVmsdJhPAX5pXfeYL7Mp3FRSZT8dQcJ0nk2dsL2TvpJmJLGk2hupdX-0phu6XzafBkRU-kkdRYdCAcRN0TFAMeOCLFqmd4_CKY1_n8T8bLrbFDFt-JosjV3kg4bb5iwYPXNSugl4w/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h13/h001._spBs5y2H6fhor2sI0l_l7Z5KSm0QtYFpISnlDxvUQc" target="_blank" rel="noopener noreferrer nofollow" style="background-color:#2C81E5;border-radius:8px;color:#FFFFFF;display:inline-block;font-family:'Open Sans','Segoe UI','Apple SD Gothic Neo','Lucida Grande','Lucida Sans 
Unicode',sans-serif;font-size:16px;font-weight:normal;line-height:18px;padding:14px 20px;text-decoration:none;"> Read Full Paper </a></td></tr></table></td></tr></table></td></tr><tr><td><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" style=""><tr><td bgcolor="#222222" style="background-color:#222222;padding:0.0px 0.0px 0.0px 0.0px;"><table role="none" width="100%" border="0" cellspacing="0" cellpadding="0"><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"></p></td></tr></table></td></tr></table></td></tr><tr><td id="evaluating-parameter-efficient-meth" class="dd" align="left" valign="top" style="color:#2A2A2A;font-weight:Bold;padding:0px 28px;text-align:left;"><h1 style="color:#2A2A2A;font-weight:Bold;mso-line-height-alt:175.0%;"><b>Evaluating Parameter Efficient Methods for RLVR</b></h1></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> Yin<i> et al. [</i>Zhejiang University, HKUST, WUST, USTC, Brown University, Hong Kong Polytechnic University, INSAIT<i>]</i></p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"><span style="background-color:#e0e0e0;"><span style="color:rgb(255, 58, 58);font-size:0.6rem;"> ♥ 433 </span></span><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> </span><span style="background-color:#e0e0e0;"><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> LLM RLVR </span></span><span style="color:rgb(44, 129, 229);font-size:0.6rem;"> </span></p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> As artificial intelligence moves from simply predicting the next word to solving complex mathematical problems, the training process has evolved. 
Researchers are increasingly relying on <b>Reinforcement Learning with Verifiable Rewards (RLVR)</b>, a method where models improve by receiving a simple "correct" or "incorrect" signal on their reasoning. While this approach is powerful, retraining an entire massive model is incredibly expensive. </p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> To save cost and time, the industry has largely settled on a specific efficiency shortcut known as <b>LoRA (Low-Rank Adaptation)</b>. However, is this tool that everyone uses actually the best one for this specific type of learning, or are we leaving performance on the table by ignoring better alternatives? </p></td></tr><tr><td align="center" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; " class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:626px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/64fac71e-fa13-4e03-91e6-eeb2a226f193/CleanShot_2026-01-06_at_19.22.43_2x.png?t=1767707583" alt="" height="auto" width="626" style="display:block;width:100%;" border="0"/></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> The team discovered that the industry standard is suboptimal for reinforcement learning. By testing over a dozen different efficiency methods, they found that newer "structural" variants (approaches that change how weight updates are structured rather than just adding a simple adapter) consistently outperformed the default method. In some cases, these structural variants even surpassed the performance of full-parameter training, which is typically considered the gold standard. 
</p></td></tr><tr><td align="center" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; " class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:626px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/0384ea49-6284-4356-bda5-0902d01b2b1e/CleanShot_2026-01-06_at_19.23.12_2x.png?t=1767707604" alt="" height="auto" width="626" style="display:block;width:100%;" border="0"/></td></tr><tr><td align="center" valign="top" class="t" style="width:626px; padding: 4px 0px 4px 0px;"><p>A variety of PEFT methods are listed, each with its specific update formulation and initialization strategy. LN denotes Layernorm.</p></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> The study also revealed a fascinating mismatch in how models learn. Some advanced methods try to initialize training by focusing on the model's "loudest" or most significant existing features. The researchers found this causes the training to collapse because reinforcement learning actually thrives by tweaking the quieter, less dominant parts of the network. </p></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> Additionally, the team identified a strict limit to efficiency. While it is possible to freeze large portions of a model, attempting extreme compression bottlenecks the system. To learn complex reasoning, the model retains a need for a minimum amount of "plasticity," or trainable parameters, without which its ability to evolve stalls completely. 
</p></td></tr><tr><td align="center" valign="top" style="padding-bottom:20px;padding-left:15px;padding-right:15px;padding-top:20px; " class="dd"><table role="none" border="0" cellspacing="0" cellpadding="0" style="margin:0 auto 0 auto;"><tr><td align="center" valign="top" style="width:626px;"><img src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/uploads/asset/file/c692261a-315e-42e5-af10-0e4394156a8a/CleanShot_2026-01-06_at_19.24.05_2x.png?t=1767707657" alt="" height="auto" width="626" style="display:block;width:100%;" border="0"/></td></tr><tr><td align="center" valign="top" class="t" style="width:626px; padding: 4px 0px 4px 0px;"><p>Comparison of accuracy and pass scores (all values are reported in percentages).</p></td></tr></table></td></tr><tr><td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"> By moving away from the default adoption of standard LoRA and using structural variants like DoRA, engineers can build models that are not only computationally cheaper but also significantly smarter at math and logic. 
</p></td></tr>
<!-- Call-to-action button ("Read Full Paper"). -->
<tr class="btn_row">
  <td valign="top" style="padding-bottom:14px;padding-left:28px;padding-right:28px;padding-top:14px;text-align:center;width:100%;word-break:break-word;" class="dd">
    <table width="100%" role="none" border="0" cellspacing="0" cellpadding="0" style="margin:14px auto 14px auto;">
      <tr>
        <td align="center" valign="middle">
          <table role="none" border="0" cellspacing="0" cellpadding="0">
            <tr>
              <td style="background-color:#2C81E5;border-radius:8px;mso-padding-alt:14px 20px;" class="btn"><a href="https://elink4f7.mail.bycloud.ai/ss/c/u001.DUiN96-Eq7pUHzwEhy5j28yjf9KIXZdsXoh1WlHvvKmw3nQ2ZdDXZmFwSGL8HqXRCuKNVmhmtIpg_L7a7gZ1sAyrwWjJu6D9MEUSzmUoohngY410YVBx4vaa0hidBDVL8rAaflV5OiuST6npxQLuZMelxDkGB48kgiOkeu_r4RaDxM1QLVN6Q2CcrWHyoPfejSmc4C3UTDHOYdgvBk21vLP-26vkhpNzSL3gzyNSMXkrdCKeqGufcSIRvKmYyH_1ED326suXvEPH8VyPXf4woA/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h14/h001.OtS6J6qulv4mqaPX-KTCY1UQV3AH2cbvjaigI8gne44" target="_blank" rel="noopener noreferrer nofollow" style="background-color:#2C81E5;border-radius:8px;color:#FFFFFF;display:inline-block;font-family:'Open Sans','Segoe UI','Apple SD Gothic Neo','Lucida Grande','Lucida Sans Unicode',sans-serif;font-size:16px;font-weight:normal;line-height:18px;padding:14px 20px;text-decoration:none;"> Read Full Paper </a></td>
            </tr>
          </table>
        </td>
      </tr>
    </table>
  </td>
</tr>
<!-- Divider row: an empty paragraph inside a #222222 cell. -->
<tr>
  <td>
    <table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" style="">
      <tr>
        <td bgcolor="#222222" style="background-color:#222222;padding:0.0px 0.0px 0.0px 0.0px;">
          <table role="none" width="100%" border="0" cellspacing="0" cellpadding="0">
            <tr>
              <td class="dd" align="left" style="padding:0px 28px;text-align:left;word-break:break-word;"><p style="mso-line-height-alt:150.0%;"></p></td>
            </tr>
          </table>
        </td>
      </tr>
    </table>
  </td>
</tr>
<!-- Video card: play-icon overlay, linked thumbnail and caption. -->
<!-- NOTE(review): the anchor wrapping the card contains a second anchor around the thumbnail, which the HTML content model for <a> does not allow. Left unchanged because the two hrefs differ; confirm which link should win before flattening. -->
<tr>
  <td class="dd" align="center" valign="top" style="padding:20px;"><a href="https://elink4f7.mail.bycloud.ai/ss/c/u001.amatuKKICSickUKplYJXmM0F_Ptg_K-gzvQTp820Ae25HaDgcbgnsryxsusW510mRJ4bdxJNEROV7EUkvJTcqtSNMsiZyR2CVE5JbJWZbyzvVsu4uVTGr2SGVkda_6m7ta5C7SQheYe9WcigrCLsmlGdRW6Aek60xtFOLoIgE2BApeRcfuGHj6HM1zGDPv1_VAvFHc1WUEKA-nBvD6HUAHmPP9hF1aaX_k7zwkna1n1xHiK5sUgeksOdrPxm5hEmH-Q27TIcJZq2-Fi8OHZt6DureMThkuGPXetwfMbOyf4/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h15/h001.ujOUks0kikZw3Rtp8IIY11X-i1bht2bsFcFLKoGzWyo" style="text-decoration:none;"><table align="center" width="100%" cellpadding="0" cellspacing="0" border="0" role="none" style="max-width:520px;margin:0 auto;">
      <tr>
        <td class="p" width="100%" style="padding:2px;border:none;">
          <table width="100%" cellpadding="0" cellspacing="0" border="0" role="none">
            <tr>
              <td align="center" valign="top" style="width:100%;"><div style="max-height:0;position:relative;opacity:0.999;width:100%;mso-hide:all;"><div style="display:inline-block;width:100%;padding-top:25%;"><img width="20%" height="auto" loading="lazy" alt="" style="border:0;" src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/static_assets/youtube_play_icon.png"/></div></div><a href="https://elink4f7.mail.bycloud.ai/ss/c/u001.amatuKKICSickUKplYJXmM0F_Ptg_K-gzvQTp820Ae25HaDgcbgnsryxsusW510mRJ4bdxJNEROV7EUkvJTcqtSNMsiZyR2CVE5JbJWZbyzvVsu4uVTGr2SGVkda_6m7ta5C7SQheYe9WcigrCLsmlGdRW6Aek60xtFOLoIgE2BApeRcfuGHj6HM1zGDPv1_VAvFHc1WUEKA-nBvD6HUAHmPP9hF1aaX_k7zwkna1n0fqtyBT7TCKTK7JXWRannFNm58vH3pecHEt1qdw8VVSFZwOhVdH3G5q2HJdg967rc/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h16/h001.ADoTUYXDo6scc0tis64LdFNHp62g2cY-m41XqT0zKoQ" style="text-decoration:none;"><img src="https://i.ytimg.com/vi/ZgwHaI2C-9s/maxresdefault.jpg" width="480" height="auto" loading="lazy" alt="YouTube video by bycloud" style="display:block;height:auto;border:0;outline:none;text-decoration:none;background-color:#000000;width:100%;"/></a></td>
            </tr>
            <tr>
              <td><p style="font-size:12px;font-weight:500;font-style:italic;font-family:Helvetica, Calibri, sans-serif;color: #686a6d; padding-top:0 !important;padding-bottom:6px !important; padding-left:4px !important;"> How did a 27M Model even beat ChatGPT? </p></td>
            </tr>
          </table>
        </td>
      </tr>
    </table></a></td>
</tr>
<!-- The next closing tags end containers that were opened earlier in the document. -->
</table></td></tr></table></td></tr>
<!-- Footer. -->
<tr>
  <td align="center" valign="top">
    <table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" align="center">
      <!-- A stray <tr><td> wrapper (a row opened directly inside a cell) used to sit here; it and its unmatched closing tags were removed. -->
      <tr>
        <td class="b" align="center" valign="top" bgcolor="#2a2a2a" style="padding:0px 0px 0px 0px;border-style:solid;border-width: 0px 0px 0px 0px;border-color: #2a2a2a;border-bottom-left-radius:10px;border-bottom-right-radius:10px;">
          <table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" align="center">
            <!-- Social icon links. -->
            <tr>
              <td align="center" valign="top" bgcolor="#73ddff" style="padding:12px">
                <table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" align="center">
                  <tr>
                    <td><span style="padding-left:1px;"></span></td>
                    <td align="center" valign="middle" width="75" style="width:75px;"><a href="https://elink4f7.mail.bycloud.ai/ss/c/u001.1muhFWIqieRYpaJ-FbWSCQqcWoV4NNHHr5SkP9THApWUO4S9eWSDBFDMKQ83N4CY1l4kXQTU9YnEEqXRrg_2uhS94rQOKDl60C6UO57Zu1mJCFi_zhfD-a_hnJHdTQ7ETFy7sNYcLlR33s8U8GEdxWA9Nh7h9TbkSgy4yfLZMes1bNpoIynBHCXou4H2Bj_GSTJPl8UmV30YTlXxfLDCSSrBKzvHkvdQWu81-kiohesmKXhrRWMpLRysKtpLg9456xshWUH2HenU6LQ1YUkhdQ/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h17/h001.8OTszKx1nGBKUQxeXn7hHX4Q7vOId2Jh9Z9HBRsGhYo" style="text-decoration:none;"><img width="22" height="22" alt="X (Twitter)" border="0" style="display:block;max-width:22px;" src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/static_assets/x_dark.png"/></a></td>
                    <td align="center" valign="middle" width="75" style="width:75px;"><a href="https://elink4f7.mail.bycloud.ai/ss/c/u001.amatuKKICSickUKplYJXmBoQnQ9VXnB2zTxBG4HeHBi5iti4l06m5fR1UTFq_vFgQaGMmutCjJbuBFU8WHbRj6heToGsiZHlry3dxu5DEimeQbpBAMyhKdSbaWrmIf3bVsliDpYY7zgp96oJEjCcq-vkRw3o0CBSqK1Av7jCUVaCI3CnoCJAV60jHLc3ePMDSaP486nOzLSrCyxhDujb92SZ-7efOV8_dxFak-8plpOkcxK4zMzlRtdpY3y8ua8vGQQipv5R9embLlgkJxePWA/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h18/h001.UkR4xUEHX1FMbWlW3wQdZFXqSQRCURiOIzAEGXpu1lc" style="text-decoration:none;"><img width="22" height="16" alt="YouTube" border="0" style="display:block;max-width:22px;" src="https://media.beehiiv.com/cdn-cgi/image/fit=scale-down,format=auto,onerror=redirect,quality=80/static_assets/youtube_dark.png"/></a></td>
                    <td><span style="padding-left:1px;"></span></td>
                  </tr>
                </table>
              </td>
            </tr>
            <!-- 10px vertical spacer. -->
            <tr>
              <td height="10" style="line-height:1px;font-size:1px;height:10px;"> </td>
            </tr>
            <tr>
              <td class="w" align="center" valign="top" style="padding:15px 15px 15px 15px;">
                <table role="none" width="100%" border="0" cellspacing="0" cellpadding="0" align="center">
                  <!-- Preferences/unsubscribe link, copyright line and postal address. -->
                  <tr>
                    <td align="center" valign="top">
                      <p style="font-family:'Verdana',Geneva,sans-serif;color:#FFFFFF!important;"> Update your email preferences or unsubscribe <a class="link" href="https://elink4f7.mail.bycloud.ai/ss/c/u001.c6q0w4g5sodbtO4I1B_pxWc4htTObwdorovK0nFHVH-4pUdVE0ELYH5DsNemk732SjNwhPNJ25r0O8B5vYifsBhEpz-DJgyVFmavJPa0OyKRRnvw4o7XGyvIv7PRofnmnFTsMWDozp8OEKBZL4uFEizxJm8teheEskWxdQUbEIzd1MbE9P2cF8DHwCrfPpDicAoV7b7vJ3M4OlJN8jS4yUKCgwICDOTmQMqlrfTxTFtRgk9kymy-HeXwJVykDeR_dEMZ5Khuff-ma6_KE1rTRKqPVXXxfaQUPxOz1jeOrAfHIcxVdQocidzdyiLYkyrvhHebuf4ofqwvxvX77RdpzG-8G94WoQOrBRRs9SBJ-wQJ72xkGGsV_KSZCL02O_ZB_yk9HNSQCNubLmGKwN_vEJvaOWZXyRsUr_QPn3j7YVfX45TWbyZKxSDoVIcTMVMNqFjLC5lZAwFi-CEJQRdC0Yf95jn28G92Q2Cn5Ma1CZuSMBZGySlgjBCN49CoZNZ7VvZ36OnEE1Wh4nRIkhHZHDJ_8L_MrWJ_hIO-sHRMCza1HLlteBH6JQhBiUVLw9BtrwkfH6ivfVEx5GsH4DrOKeyoBIlPPcosVQe1Hmy1oJ-z7Dy_unQIePG05Dg399pKD1a4NmUt8LE-1Wna7C4wq6vHlg5l-q3qDETob5lCHxBIvtNgSnUC0k6xPeRCs6GxfXXFlE-lim-qGZkZ0o0OLpJeC8ELoBLz3fWMeMOKMFDrb67wYom4avz4A-UBtgvH2rUUUy2rhi9Xg8mFVKIIP7qFUfFa48WTCgpe0KkqlFG_xVuzr6jhQokWvuR6CD5gsfooI30POEccJgbJetq2gdLzCT_d432_wfxUJxtbu3vPRCUClG47fXIQDU-MHRBVH_eigmNwSMs473nAQQP4TMVwhZVb2ZcyVKteeqwab309J83IqqsLtXDScshhRR7C_9TZk615_hSGfV9wgyDeQOtcR2DUmhF21GBDJEshHHXTjVSOR-pmKklHgTyU-jWSoTD7OpdFGNfDB_yVLDLYXJmkk101-lElRLhu2PNm6ZM/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h19/h001.U6iwrV2SrtVm3gzhlfsNccsHcetzLLnfVzMRX86CDFU" style="text-decoration:underline;text-decoration-color:#FFFFFF!important;color:#FFFFFF!important;"> here</a></p>
                      <p class="copyright" style="font-family:'Verdana',Geneva,sans-serif;color:#FFFFFF!important;"> © 2026 bycloudai </p>
                      <p style="font-family:'Verdana',Geneva,sans-serif;color:#FFFFFF!important;"> 228 Park Ave S, #29976, New York, New York 10003, United States </p>
                    </td>
                  </tr>
                  <!-- "Powered by beehiiv" badge. Every level restates its display value with !important (presumably so client or filter CSS cannot hide the badge; confirm). The wrapper cell previously carried two style attributes, so its display declaration was dropped by the parser; they are merged into one here. -->
                  <tr style="display: table-row !important;">
                    <td align="center" valign="top" style="padding-top:20px;display:table-cell !important;">
                      <table role="none" border="0" cellspacing="0" cellpadding="0" align="center" style="display:table !important;">
                        <tr style="display:table-row !important;">
                          <td class="u" align="center" valign="middle" height="32" style="height:32px;display:table-cell !important; max-height: 32px !important;margin:0px !important; background-color: #ffffff !important;"><a style="line-height:32px !important;text-decoration:none;display:block !important;" href="https://elink4f7.mail.bycloud.ai/ss/c/u001.DUiN96-Eq7pUHzwEhy5j28olDWFpV5DDKfdk_OdOKOiYO1IemX6_pzctsWh1ijBIPLFNQundXNKs9MS-Jc7H1C8WtwsPim97oo9zQ21gFlcEIDG9QyLc_EG04iireG6guSzz8jGXfBxVTHvXdOt21xvpLSAhOAY4cudxZZ9g55Zv9cLd5Z7yFRrl1-4bAKLp35RYfpjAfHb6_qPXdgts5Jl9ngumAk_rqwCOHzO3g3n9AFGv7HLtWljSp0r_MFqw/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h20/h001.AeDC-03AuNLfTssGMkyZcSHR-cUOdn7ybSoBgiSRI2s"><img src="https://media.beehiiv.com/output-onlinepngtools.png" width="16" alt="beehiiv logo" style="display:inline-block !important;max-width:16px !important; vertical-align:-3px !important;width: 16px !important;" border="0"/><span style="padding-left:11px !important;display: inline-block !important;">Powered by beehiiv</span></a></td>
                        </tr>
                      </table>
                    </td>
                  </tr>
                  <!-- Two 2px-high rows: a 1px "Terms of Service" link coloured #2a2a2a, and an empty anchor to a beehiivstatus.com "hclick" URL. -->
                  <tr>
                    <td align="left" valign="top" height="2" style="height:2px;"><a href="https://elink4f7.mail.bycloud.ai/ss/c/u001.CxDkkVpJsBdVoe83c_tBWsHIaP4XNp0WgUYqLvHcKk_3uqk_KIkz4ddLinhFbud6JuxLFdSUhYnR7b1NSsmbtzXNGNblnEEMKUtkCAjkn8Y/4n2/b1HjxW_sTXWv5GsEHVrZdQ/h21/h001.I8ToSn4Tquzk85MvMQCByr0thApWdhJ4xId_cZepYMo" style="color: #2a2a2a !important; cursor: default; font-size: 1px; text-decoration: none;"> Terms of Service </a></td>
                  </tr>
                  <tr>
                    <td align="left" valign="top" height="2" style="height:2px;"><a href="https://email.beehiivstatus.com/96d3dcc3836c4a40a9a4c896ca75f4c1f2d07056/hclick" clicktracking="off" style="color: #2a2a2a !important; cursor: default; font-size: 1px; text-decoration: none;"></a></td>
                  </tr>
                </table>
              </td>
            </tr>
          </table>
        </td>
      </tr>
    </table>
  </td>
</tr>
<!-- Close the containers opened earlier in the document. -->
</table></td></tr></table></td></tr></table></div></body></html>