<?xml version="1.0" encoding="utf-8" standalone="yes" ?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <!-- Channel metadata for the "Pre-trained Language Model" tag feed. -->
    <!-- NOTE(review): the URLs below use http://localhost:1313, which looks like a local
         development server address; confirm the feed is rebuilt with the production
         base URL before it is published. -->
    <title>Pre-trained Language Model | Yequan's Academic</title>
    <link>http://localhost:1313/tag/pre-trained-language-model/</link>
    <atom:link href="http://localhost:1313/tag/pre-trained-language-model/index.xml"
               rel="self"
               type="application/rss+xml"/>
    <description>Pre-trained Language Model</description>
    <generator>Wowchemy (https://wowchemy.com)</generator>
    <language>en-us</language>
    <lastBuildDate>Wed, 03 Jul 2024 00:00:00 +0000</lastBuildDate>
    <image>
      <url>http://localhost:1313/media/icon_hu041b0395efa72cb92c3618e7883e8354_359622_512x512_fill_lanczos_center_3.png</url>
      <!-- RSS 2.0: the image title and link should carry the same values as the channel's. -->
      <title>Pre-trained Language Model | Yequan's Academic</title>
      <link>http://localhost:1313/tag/pre-trained-language-model/</link>
    </image>
    
    <!-- Publication entry; the feed carries no summary text for it. -->
    <item>
      <title>52B to 1T: Lessons Learned via Tele-FLM Series</title>
      <link>http://localhost:1313/publication/arxiv2024-tele-flm-1t/</link>
      <pubDate>Wed, 03 Jul 2024 00:00:00 +0000</pubDate>
      <guid>http://localhost:1313/publication/arxiv2024-tele-flm-1t/</guid>
      <description/>
    </item>
    
    <!-- Publication entry; the feed carries no summary text for it. -->
    <item>
      <title>Masked Structural Growth for 2x Faster Language Model Pre-training</title>
      <link>http://localhost:1313/publication/iclr2024-msg/</link>
      <pubDate>Tue, 07 May 2024 00:00:00 +0000</pubDate>
      <guid>http://localhost:1313/publication/iclr2024-msg/</guid>
      <description/>
    </item>
    
    <!-- Publication entry; the feed carries no summary text for it. -->
    <item>
      <title>Research without Re-search: Maximal Update Parametrization Yields Accurate Loss Prediction across Scales</title>
      <link>http://localhost:1313/publication/arxiv2023-mu-scaling/</link>
      <pubDate>Fri, 14 Apr 2023 00:00:00 +0000</pubDate>
      <guid>http://localhost:1313/publication/arxiv2023-mu-scaling/</guid>
      <description/>
    </item>
    
    <!-- Talk entry; the description is entity-escaped HTML, so its whitespace is part of the data. -->
    <item>
      <title>The overview of Big Language Model and ChatGPT</title>
      <link>http://localhost:1313/talk/the-overview-of-big-language-model-and-chatgpt/</link>
      <pubDate>Thu, 23 Feb 2023 09:00:00 +0000</pubDate>
      <guid>http://localhost:1313/talk/the-overview-of-big-language-model-and-chatgpt/</guid>
      <description>&lt;p&gt;This talk aims to clearly reveal the challenge and the powerful abilities of ChatGPT and the GPT series language models it uses. More importantly, we hope to discuss the future direction of both academia and industry.&lt;/p&gt;
&lt;p&gt;Specifically, we introduce the language model, Wudao 2.0, and academic research on language models. The slides will be released after the anonymous appraisal stage.&lt;/p&gt;
</description>
    </item>
    
  </channel>
</rss>
