<?xml version="1.0" encoding="utf-8" standalone="yes" ?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <!--
    RSS 2.0 feed for the "Foundation Model" tag listing.
    NOTE(review): every URL in this feed uses the host http://localhost:1313.
    This looks like output from a local development server; confirm the
    intended public base URL before this file is published.
  -->
  <channel>
    <!-- Channel metadata -->
    <title>Foundation Model | Yequan's Academic</title>
    <link>http://localhost:1313/tag/foundation-model/</link>
    <!-- Self-reference to this feed document (rel="self") -->
    <atom:link href="http://localhost:1313/tag/foundation-model/index.xml" rel="self" type="application/rss+xml" />
    <description>Foundation Model</description>
    <generator>Wowchemy (https://wowchemy.com)</generator>
    <language>en-us</language>
    <lastBuildDate>Sat, 16 Aug 2025 00:00:00 +0000</lastBuildDate>

    <!-- Channel image; its title and link repeat the channel's description and link values -->
    <image>
      <url>http://localhost:1313/media/icon_hu041b0395efa72cb92c3618e7883e8354_359622_512x512_fill_lanczos_center_3.png</url>
      <title>Foundation Model</title>
      <link>http://localhost:1313/tag/foundation-model/</link>
    </image>

    <!--
      Entries, listed newest first by pubDate. In every entry the guid equals
      the link, and the description element is present but empty.
    -->
    <item>
      <title>Not All Layers of LLMs Are Necessary During Inference</title>
      <link>http://localhost:1313/publication/ijcai2025-adainfer/</link>
      <pubDate>Sat, 16 Aug 2025 00:00:00 +0000</pubDate>
      <guid>http://localhost:1313/publication/ijcai2025-adainfer/</guid>
      <description></description>
    </item>

    <item>
      <title>Few-Shot Learner Generalizes Across AI-Generated Image Detection</title>
      <link>http://localhost:1313/publication/icml2025/</link>
      <pubDate>Tue, 15 Jul 2025 00:00:00 +0000</pubDate>
      <guid>http://localhost:1313/publication/icml2025/</guid>
      <description></description>
    </item>

    <item>
      <title>52B to 1T: Lessons Learned via Tele-FLM Series</title>
      <link>http://localhost:1313/publication/arxiv2024-tele-flm-1t/</link>
      <pubDate>Wed, 03 Jul 2024 00:00:00 +0000</pubDate>
      <guid>http://localhost:1313/publication/arxiv2024-tele-flm-1t/</guid>
      <description></description>
    </item>

    <item>
      <title>Masked Structural Growth for 2x Faster Language Model Pre-training</title>
      <link>http://localhost:1313/publication/iclr2024-msg/</link>
      <pubDate>Tue, 07 May 2024 00:00:00 +0000</pubDate>
      <guid>http://localhost:1313/publication/iclr2024-msg/</guid>
      <description></description>
    </item>

    <item>
      <title>Research without Re-search: Maximal Update Parametrization Yields Accurate Loss Prediction across Scales</title>
      <link>http://localhost:1313/publication/arxiv2023-mu-scaling/</link>
      <pubDate>Fri, 14 Apr 2023 00:00:00 +0000</pubDate>
      <guid>http://localhost:1313/publication/arxiv2023-mu-scaling/</guid>
      <description></description>
    </item>

  </channel>
</rss>
