<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <title>某位老王的小窝</title>
    <link>https://mars160.github.io/</link>
    <description>Recent content on 某位老王的小窝</description>
    <generator>Hugo -- gohugo.io</generator>
    <language>zh-cn</language>
    <copyright>© 2026 Abanana</copyright>
    <lastBuildDate>Sat, 06 Dec 2025 17:02:12 +0800</lastBuildDate><atom:link href="https://mars160.github.io/index.xml" rel="self" type="application/rss+xml" />
    
    <item>
      <title>面向大语言模型的门控注意力机制：非线性、稀疏性和Attention-Sink-Free</title>
      <link>https://mars160.github.io/posts/%E9%9D%A2%E5%90%91%E5%A4%A7%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E7%9A%84%E9%97%A8%E6%8E%A7%E6%B3%A8%E6%84%8F%E5%8A%9B%E6%9C%BA%E5%88%B6%E9%9D%9E%E7%BA%BF%E6%80%A7%E7%A8%80%E7%96%8F%E6%80%A7%E5%92%8Cattention-sink-free/</link>
      <pubDate>Sat, 06 Dec 2025 17:02:12 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/%E9%9D%A2%E5%90%91%E5%A4%A7%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E7%9A%84%E9%97%A8%E6%8E%A7%E6%B3%A8%E6%84%8F%E5%8A%9B%E6%9C%BA%E5%88%B6%E9%9D%9E%E7%BA%BF%E6%80%A7%E7%A8%80%E7%96%8F%E6%80%A7%E5%92%8Cattention-sink-free/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;面向大语言模型的门控注意力机制：非线性、稀疏性和 Attention-Sink-Free
    &lt;div id=&#34;面向大语言模型的门控注意力机制非线性稀疏性和-attention-sink-free&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#%e9%9d%a2%e5%90%91%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e9%97%a8%e6%8e%a7%e6%b3%a8%e6%84%8f%e5%8a%9b%e6%9c%ba%e5%88%b6%e9%9d%9e%e7%ba%bf%e6%80%a7%e7%a8%80%e7%96%8f%e6%80%a7%e5%92%8c-attention-sink-free&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;&lt;figure&gt;&lt;img
    class=&#34;my-0 rounded-md&#34;
    loading=&#34;lazy&#34;
    decoding=&#34;async&#34;
    fetchpriority=&#34;low&#34;
    alt=&#34;&#34;
    src=&#34;https://mars160.github.io/post_imgs/%E9%9D%A2%E5%90%91%E5%A4%A7%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E7%9A%84%E9%97%A8%E6%8E%A7%E6%B3%A8%E6%84%8F%E5%8A%9B%E6%9C%BA%E5%88%B6%EF%BC%9A%E9%9D%9E%E7%BA%BF%E6%80%A7%E3%80%81%E7%A8%80%E7%96%8F%E6%80%A7%E5%92%8CAttention-Sink-Free/VeBEbQu4tokbLoxifqrc69bJnjh.png&#34;
    &gt;&lt;/figure&gt;
&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/%E9%9D%A2%E5%90%91%E5%A4%A7%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E7%9A%84%E9%97%A8%E6%8E%A7%E6%B3%A8%E6%84%8F%E5%8A%9B%E6%9C%BA%E5%88%B6%E9%9D%9E%E7%BA%BF%E6%80%A7%E7%A8%80%E7%96%8F%E6%80%A7%E5%92%8Cattention-sink-free/featured.png" />
    </item>
    
    <item>
      <title>Saber：一种针对扩散语言模型的自适应加速与回溯增强的高效采样方法</title>
      <link>https://mars160.github.io/posts/saber%E4%B8%80%E7%A7%8D%E9%92%88%E5%AF%B9%E6%89%A9%E6%95%A3%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E7%9A%84%E8%87%AA%E9%80%82%E5%BA%94%E5%8A%A0%E9%80%9F%E4%B8%8E%E5%9B%9E%E6%BA%AF%E5%A2%9E%E5%BC%BA%E7%9A%84%E9%AB%98%E6%95%88%E9%87%87%E6%A0%B7%E6%96%B9%E6%B3%95/</link>
      <pubDate>Fri, 07 Nov 2025 15:56:05 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/saber%E4%B8%80%E7%A7%8D%E9%92%88%E5%AF%B9%E6%89%A9%E6%95%A3%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E7%9A%84%E8%87%AA%E9%80%82%E5%BA%94%E5%8A%A0%E9%80%9F%E4%B8%8E%E5%9B%9E%E6%BA%AF%E5%A2%9E%E5%BC%BA%E7%9A%84%E9%AB%98%E6%95%88%E9%87%87%E6%A0%B7%E6%96%B9%E6%B3%95/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;Saber：一种针对扩散语言模型的自适应加速与回溯增强的高效采样方法
    &lt;div id=&#34;saber一种针对扩散语言模型的自适应加速与回溯增强的高效采样方法&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#saber%e4%b8%80%e7%a7%8d%e9%92%88%e5%af%b9%e6%89%a9%e6%95%a3%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e8%87%aa%e9%80%82%e5%ba%94%e5%8a%a0%e9%80%9f%e4%b8%8e%e5%9b%9e%e6%ba%af%e5%a2%9e%e5%bc%ba%e7%9a%84%e9%ab%98%e6%95%88%e9%87%87%e6%a0%b7%e6%96%b9%e6%b3%95&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Saber: An Efficient Sampling with Adaptive Acceleration and Backtracking Enhanced Remasking for Diffusion Language Model&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/saber%E4%B8%80%E7%A7%8D%E9%92%88%E5%AF%B9%E6%89%A9%E6%95%A3%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E7%9A%84%E8%87%AA%E9%80%82%E5%BA%94%E5%8A%A0%E9%80%9F%E4%B8%8E%E5%9B%9E%E6%BA%AF%E5%A2%9E%E5%BC%BA%E7%9A%84%E9%AB%98%E6%95%88%E9%87%87%E6%A0%B7%E6%96%B9%E6%B3%95/featured.png" />
    </item>
    
    <item>
      <title>R-STITCH：用于高效推理的动态轨迹拼接</title>
      <link>https://mars160.github.io/posts/r-stitch%E7%94%A8%E4%BA%8E%E9%AB%98%E6%95%88%E6%8E%A8%E7%90%86%E7%9A%84%E5%8A%A8%E6%80%81%E8%BD%A8%E8%BF%B9%E6%8B%BC%E6%8E%A5/</link>
      <pubDate>Fri, 07 Nov 2025 15:55:51 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/r-stitch%E7%94%A8%E4%BA%8E%E9%AB%98%E6%95%88%E6%8E%A8%E7%90%86%E7%9A%84%E5%8A%A8%E6%80%81%E8%BD%A8%E8%BF%B9%E6%8B%BC%E6%8E%A5/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;R-STITCH：用于高效推理的动态轨迹拼接
    &lt;div id=&#34;r-stitch用于高效推理的动态轨迹拼接&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#r-stitch%e7%94%a8%e4%ba%8e%e9%ab%98%e6%95%88%e6%8e%a8%e7%90%86%e7%9a%84%e5%8a%a8%e6%80%81%e8%bd%a8%e8%bf%b9%e6%8b%bc%e6%8e%a5&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;R-STITCH: DYNAMIC TRAJECTORY STITCHING FOR EFFICIENT REASONING&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/r-stitch%E7%94%A8%E4%BA%8E%E9%AB%98%E6%95%88%E6%8E%A8%E7%90%86%E7%9A%84%E5%8A%A8%E6%80%81%E8%BD%A8%E8%BF%B9%E6%8B%BC%E6%8E%A5/featured.png" />
    </item>
    
    <item>
      <title>真-Self-Spec-DLM</title>
      <link>https://mars160.github.io/posts/%E7%9C%9F-self-spec-dlm/</link>
      <pubDate>Fri, 07 Nov 2025 15:55:28 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/%E7%9C%9F-self-spec-dlm/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;真-Self-Spec-DLM
    &lt;div id=&#34;真-self-spec-dlm&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#%e7%9c%9f-self-spec-dlm&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;SELF SPECULATIVE DECODING FOR DIFFUSION LARGE LANGUAGE MODELS&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/%E7%9C%9F-self-spec-dlm/featured.png" />
    </item>
    
    <item>
      <title>SlowFast采样加速DLM</title>
      <link>https://mars160.github.io/posts/slowfast%E9%87%87%E6%A0%B7%E5%8A%A0%E9%80%9Fdlm/</link>
      <pubDate>Fri, 07 Nov 2025 15:55:08 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/slowfast%E9%87%87%E6%A0%B7%E5%8A%A0%E9%80%9Fdlm/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;SlowFast 采样加速 DLM
    &lt;div id=&#34;slowfast-采样加速-dlm&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#slowfast-%e9%87%87%e6%a0%b7%e5%8a%a0%e9%80%9f-dlm&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;ACCELERATING DIFFUSION LARGE LANGUAGE MODELS WITH SLOWFAST SAMPLING: THE THREE GOLDEN PRINCIPLES&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/slowfast%E9%87%87%E6%A0%B7%E5%8A%A0%E9%80%9Fdlm/featured.png" />
    </item>
    
    <item>
      <title>简洁提示：通过生成过程中的连续简洁提示提升推理效率</title>
      <link>https://mars160.github.io/posts/%E7%AE%80%E6%B4%81%E6%8F%90%E7%A4%BA%E9%80%9A%E8%BF%87%E7%94%9F%E6%88%90%E8%BF%87%E7%A8%8B%E4%B8%AD%E7%9A%84%E8%BF%9E%E7%BB%AD%E7%AE%80%E6%B4%81%E6%8F%90%E7%A4%BA%E6%8F%90%E5%8D%87%E6%8E%A8%E7%90%86%E6%95%88%E7%8E%87/</link>
      <pubDate>Fri, 10 Oct 2025 15:59:21 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/%E7%AE%80%E6%B4%81%E6%8F%90%E7%A4%BA%E9%80%9A%E8%BF%87%E7%94%9F%E6%88%90%E8%BF%87%E7%A8%8B%E4%B8%AD%E7%9A%84%E8%BF%9E%E7%BB%AD%E7%AE%80%E6%B4%81%E6%8F%90%E7%A4%BA%E6%8F%90%E5%8D%87%E6%8E%A8%E7%90%86%E6%95%88%E7%8E%87/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;简洁提示：通过生成过程中的连续简洁提示提升推理效率
    &lt;div id=&#34;简洁提示通过生成过程中的连续简洁提示提升推理效率&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#%e7%ae%80%e6%b4%81%e6%8f%90%e7%a4%ba%e9%80%9a%e8%bf%87%e7%94%9f%e6%88%90%e8%bf%87%e7%a8%8b%e4%b8%ad%e7%9a%84%e8%bf%9e%e7%bb%ad%e7%ae%80%e6%b4%81%e6%8f%90%e7%a4%ba%e6%8f%90%e5%8d%87%e6%8e%a8%e7%90%86%e6%95%88%e7%8e%87&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;ConciseHint: Boosting Efficient Reasoning via Continuous Concise Hints during Generation&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/%E7%AE%80%E6%B4%81%E6%8F%90%E7%A4%BA%E9%80%9A%E8%BF%87%E7%94%9F%E6%88%90%E8%BF%87%E7%A8%8B%E4%B8%AD%E7%9A%84%E8%BF%9E%E7%BB%AD%E7%AE%80%E6%B4%81%E6%8F%90%E7%A4%BA%E6%8F%90%E5%8D%87%E6%8E%A8%E7%90%86%E6%95%88%E7%8E%87/featured.png" />
    </item>
    
    <item>
      <title>Prophet：Diffusion模型基于置信度的Decoding早停</title>
      <link>https://mars160.github.io/posts/prophetdiffusion%E6%A8%A1%E5%9E%8B%E5%9F%BA%E4%BA%8E%E7%BD%AE%E4%BF%A1%E5%BA%A6%E7%9A%84decoding%E6%97%A9%E5%81%9C/</link>
      <pubDate>Fri, 10 Oct 2025 15:58:42 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/prophetdiffusion%E6%A8%A1%E5%9E%8B%E5%9F%BA%E4%BA%8E%E7%BD%AE%E4%BF%A1%E5%BA%A6%E7%9A%84decoding%E6%97%A9%E5%81%9C/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;Prophet：Diffusion 模型基于置信度的 Decoding 早停
    &lt;div id=&#34;prophetdiffusion-模型基于置信度的-decoding-早停&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#prophetdiffusion-%e6%a8%a1%e5%9e%8b%e5%9f%ba%e4%ba%8e%e7%bd%ae%e4%bf%a1%e5%ba%a6%e7%9a%84-decoding-%e6%97%a9%e5%81%9c&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Prophet: Fast Decoding for Diffusion Language Models&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/prophetdiffusion%E6%A8%A1%E5%9E%8B%E5%9F%BA%E4%BA%8E%E7%BD%AE%E4%BF%A1%E5%BA%A6%E7%9A%84decoding%E6%97%A9%E5%81%9C/featured.png" />
    </item>
    
    <item>
      <title>SpecDiff：使用扩散模型作为Draft模型</title>
      <link>https://mars160.github.io/posts/specdiff%E4%BD%BF%E7%94%A8%E6%89%A9%E6%95%A3%E6%A8%A1%E5%9E%8B%E4%BD%9C%E4%B8%BAdraft%E6%A8%A1%E5%9E%8B/</link>
      <pubDate>Fri, 10 Oct 2025 15:57:40 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/specdiff%E4%BD%BF%E7%94%A8%E6%89%A9%E6%95%A3%E6%A8%A1%E5%9E%8B%E4%BD%9C%E4%B8%BAdraft%E6%A8%A1%E5%9E%8B/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;SpecDiff：使用扩散模型作为 Draft 模型
    &lt;div id=&#34;specdiff使用扩散模型作为-draft-模型&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#specdiff%e4%bd%bf%e7%94%a8%e6%89%a9%e6%95%a3%e6%a8%a1%e5%9e%8b%e4%bd%9c%e4%b8%ba-draft-%e6%a8%a1%e5%9e%8b&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Speculative Diffusion Decoding: Accelerating Language Generation through Diffusion&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/specdiff%E4%BD%BF%E7%94%A8%E6%89%A9%E6%95%A3%E6%A8%A1%E5%9E%8B%E4%BD%9C%E4%B8%BAdraft%E6%A8%A1%E5%9E%8B/featured.png" />
    </item>
    
    <item>
      <title>DiffuSpec：解锁DLM做投机采样</title>
      <link>https://mars160.github.io/posts/diffuspec%E8%A7%A3%E9%94%81dlm%E5%81%9A%E6%8A%95%E6%9C%BA%E9%87%87%E6%A0%B7/</link>
      <pubDate>Fri, 10 Oct 2025 13:11:36 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/diffuspec%E8%A7%A3%E9%94%81dlm%E5%81%9A%E6%8A%95%E6%9C%BA%E9%87%87%E6%A0%B7/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;DiffuSpec：解锁 DLM 做投机采样
    &lt;div id=&#34;diffuspec解锁-dlm-做投机采样&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#diffuspec%e8%a7%a3%e9%94%81-dlm-%e5%81%9a%e6%8a%95%e6%9c%ba%e9%87%87%e6%a0%b7&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;DIFFUSPEC: UNLOCKING DIFFUSION LANGUAGE MODELS FOR SPECULATIVE DECODING&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/diffuspec%E8%A7%A3%E9%94%81dlm%E5%81%9A%E6%8A%95%E6%9C%BA%E9%87%87%E6%A0%B7/featured.png" />
    </item>
    
    <item>
      <title>后端部署第二步：本地到公网——如何使用 Nginx 发布 FastAPI 服务</title>
      <link>https://mars160.github.io/posts/%E5%90%8E%E7%AB%AF%E9%83%A8%E7%BD%B2%E7%AC%AC%E4%BA%8C%E6%AD%A5%E6%9C%AC%E5%9C%B0%E5%88%B0%E5%85%AC%E7%BD%91%E5%A6%82%E4%BD%95%E4%BD%BF%E7%94%A8-nginx-%E5%8F%91%E5%B8%83-fastapi-%E6%9C%8D%E5%8A%A1/</link>
      <pubDate>Fri, 05 Sep 2025 18:40:15 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/%E5%90%8E%E7%AB%AF%E9%83%A8%E7%BD%B2%E7%AC%AC%E4%BA%8C%E6%AD%A5%E6%9C%AC%E5%9C%B0%E5%88%B0%E5%85%AC%E7%BD%91%E5%A6%82%E4%BD%95%E4%BD%BF%E7%94%A8-nginx-%E5%8F%91%E5%B8%83-fastapi-%E6%9C%8D%E5%8A%A1/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;后端部署第二步：本地到公网——如何使用 Nginx 发布 FastAPI 服务
    &lt;div id=&#34;后端部署第二步本地到公网如何使用-nginx-发布-fastapi-服务&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#%e5%90%8e%e7%ab%af%e9%83%a8%e7%bd%b2%e7%ac%ac%e4%ba%8c%e6%ad%a5%e6%9c%ac%e5%9c%b0%e5%88%b0%e5%85%ac%e7%bd%91%e5%a6%82%e4%bd%95%e4%bd%bf%e7%94%a8-nginx-%e5%8f%91%e5%b8%83-fastapi-%e6%9c%8d%e5%8a%a1&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;在当今的开发环境中，快速构建和部署后端服务变得至关重要。FastAPI 作为一个高性能、现代化的 Python 异步 Web 框架，广受开发者喜爱。而 Nginx 则是部署 Web 应用最常见也是最稳定的解决方案之一。&lt;/p&gt;</description>
      
    </item>
    
    <item>
      <title>Fast-dLLM：通过KV Cache和并行Decoding加速dLLM</title>
      <link>https://mars160.github.io/posts/fast-dllm%E9%80%9A%E8%BF%87kv-cache%E5%92%8C%E5%B9%B6%E8%A1%8Cdecoding%E5%8A%A0%E9%80%9Fdllm/</link>
      <pubDate>Fri, 05 Sep 2025 02:24:01 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/fast-dllm%E9%80%9A%E8%BF%87kv-cache%E5%92%8C%E5%B9%B6%E8%A1%8Cdecoding%E5%8A%A0%E9%80%9Fdllm/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;Fast-dLLM：通过 KV Cache 和并行 Decoding 加速 dLLM
    &lt;div id=&#34;fast-dllm通过-kv-cache-和并行-decoding-加速-dllm&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#fast-dllm%e9%80%9a%e8%bf%87-kv-cache-%e5%92%8c%e5%b9%b6%e8%a1%8c-decoding-%e5%8a%a0%e9%80%9f-dllm&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Fast-dLLM: Training-free Acceleration of Diffusion LLM by Enabling KV Cache and Parallel Decoding&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/fast-dllm%E9%80%9A%E8%BF%87kv-cache%E5%92%8C%E5%B9%B6%E8%A1%8Cdecoding%E5%8A%A0%E9%80%9Fdllm/featured.png" />
    </item>
    
    <item>
      <title>后端部署第一步：Nginx 发布服务前的万全准备</title>
      <link>https://mars160.github.io/posts/%E5%90%8E%E7%AB%AF%E9%83%A8%E7%BD%B2%E7%AC%AC%E4%B8%80%E6%AD%A5nginx-%E5%8F%91%E5%B8%83%E6%9C%8D%E5%8A%A1%E5%89%8D%E7%9A%84%E4%B8%87%E5%85%A8%E5%87%86%E5%A4%87/</link>
      <pubDate>Wed, 03 Sep 2025 02:36:15 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/%E5%90%8E%E7%AB%AF%E9%83%A8%E7%BD%B2%E7%AC%AC%E4%B8%80%E6%AD%A5nginx-%E5%8F%91%E5%B8%83%E6%9C%8D%E5%8A%A1%E5%89%8D%E7%9A%84%E4%B8%87%E5%85%A8%E5%87%86%E5%A4%87/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;后端部署第一步：Nginx 发布服务前的准备工作
    &lt;div id=&#34;后端部署第一步nginx-发布服务前的准备工作&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#%e5%90%8e%e7%ab%af%e9%83%a8%e7%bd%b2%e7%ac%ac%e4%b8%80%e6%ad%a5nginx-%e5%8f%91%e5%b8%83%e6%9c%8d%e5%8a%a1%e5%89%8d%e7%9a%84%e5%87%86%e5%a4%87%e5%b7%a5%e4%bd%9c&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;你是不是刚刚用 Java、Python 或 Go 写出了第一个后端程序？它在本地跑得飞快，通过
&lt;code&gt;localhost:8080&lt;/code&gt; 就能访问，功能也都挺顺畅。接下来，自然而然会冒出一个念头：&lt;strong&gt;“我要怎样才能让别人也能访问到它？”&lt;/strong&gt;&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/%E5%90%8E%E7%AB%AF%E9%83%A8%E7%BD%B2%E7%AC%AC%E4%B8%80%E6%AD%A5nginx-%E5%8F%91%E5%B8%83%E6%9C%8D%E5%8A%A1%E5%89%8D%E7%9A%84%E4%B8%87%E5%85%A8%E5%87%86%E5%A4%87/featured.png" />
    </item>
    
    <item>
      <title>自信地深度思考</title>
      <link>https://mars160.github.io/posts/%E8%87%AA%E4%BF%A1%E5%9C%B0%E6%B7%B1%E5%BA%A6%E6%80%9D%E8%80%83/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:48 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/%E8%87%AA%E4%BF%A1%E5%9C%B0%E6%B7%B1%E5%BA%A6%E6%80%9D%E8%80%83/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;自信地深度思考
    &lt;div id=&#34;自信地深度思考&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#%e8%87%aa%e4%bf%a1%e5%9c%b0%e6%b7%b1%e5%ba%a6%e6%80%9d%e8%80%83&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;DEEP THINK WITH CONFIDENCE&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/%E8%87%AA%E4%BF%A1%E5%9C%B0%E6%B7%B1%E5%BA%A6%E6%80%9D%E8%80%83/featured.png" />
    </item>
    
    <item>
      <title>TriangleMix：无损且高效的用于预填充阶段的注意力模式</title>
      <link>https://mars160.github.io/posts/trianglemix%E6%97%A0%E6%8D%9F%E4%B8%94%E9%AB%98%E6%95%88%E7%9A%84%E7%94%A8%E4%BA%8E%E9%A2%84%E5%A1%AB%E5%85%85%E9%98%B6%E6%AE%B5%E7%9A%84%E6%B3%A8%E6%84%8F%E5%8A%9B%E6%A8%A1%E5%BC%8F/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:45 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/trianglemix%E6%97%A0%E6%8D%9F%E4%B8%94%E9%AB%98%E6%95%88%E7%9A%84%E7%94%A8%E4%BA%8E%E9%A2%84%E5%A1%AB%E5%85%85%E9%98%B6%E6%AE%B5%E7%9A%84%E6%B3%A8%E6%84%8F%E5%8A%9B%E6%A8%A1%E5%BC%8F/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;TriangleMix：无损且高效的用于预填充阶段的注意力模式
    &lt;div id=&#34;trianglemix无损且高效的用于预填充阶段的注意力模式&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#trianglemix%e6%97%a0%e6%8d%9f%e4%b8%94%e9%ab%98%e6%95%88%e7%9a%84%e7%94%a8%e4%ba%8e%e9%a2%84%e5%a1%ab%e5%85%85%e9%98%b6%e6%ae%b5%e7%9a%84%e6%b3%a8%e6%84%8f%e5%8a%9b%e6%a8%a1%e5%bc%8f&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;TriangleMix: A Lossless and Efficient Attention Pattern for Long Context Prefilling&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/trianglemix%E6%97%A0%E6%8D%9F%E4%B8%94%E9%AB%98%E6%95%88%E7%9A%84%E7%94%A8%E4%BA%8E%E9%A2%84%E5%A1%AB%E5%85%85%E9%98%B6%E6%AE%B5%E7%9A%84%E6%B3%A8%E6%84%8F%E5%8A%9B%E6%A8%A1%E5%BC%8F/featured.png" />
    </item>
    
    <item>
      <title>ASC：CoT压缩的激活引导 Training free</title>
      <link>https://mars160.github.io/posts/asccot%E5%8E%8B%E7%BC%A9%E7%9A%84%E6%BF%80%E6%B4%BB%E5%BC%95%E5%AF%BC-training-free/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:41 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/asccot%E5%8E%8B%E7%BC%A9%E7%9A%84%E6%BF%80%E6%B4%BB%E5%BC%95%E5%AF%BC-training-free/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;ASC：CoT 压缩的激活引导 Training free
    &lt;div id=&#34;asccot-压缩的激活引导-training-free&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#asccot-%e5%8e%8b%e7%bc%a9%e7%9a%84%e6%bf%80%e6%b4%bb%e5%bc%95%e5%af%bc-training-free&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Activation Steering for Chain-of-Thought Compression&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/asccot%E5%8E%8B%E7%BC%A9%E7%9A%84%E6%BF%80%E6%B4%BB%E5%BC%95%E5%AF%BC-training-free/featured.png" />
    </item>
    
    <item>
      <title>SEAL：大语言模型的可操控推理 Training Free</title>
      <link>https://mars160.github.io/posts/seal%E5%A4%A7%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E7%9A%84%E5%8F%AF%E6%93%8D%E6%8E%A7%E6%8E%A8%E7%90%86-traning-free/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:36 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/seal%E5%A4%A7%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E7%9A%84%E5%8F%AF%E6%93%8D%E6%8E%A7%E6%8E%A8%E7%90%86-traning-free/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;SEAL：大语言模型的可操控推理 Training Free
    &lt;div id=&#34;seal大语言模型的可操控推理-traning-free&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#seal%e5%a4%a7%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e7%9a%84%e5%8f%af%e6%93%8d%e6%8e%a7%e6%8e%a8%e7%90%86-traning-free&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;SEAL: Steerable Reasoning Calibration of Large Language Models for Free&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/seal%E5%A4%A7%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E7%9A%84%E5%8F%AF%E6%93%8D%E6%8E%A7%E6%8E%A8%E7%90%86-traning-free/featured.png" />
    </item>
    
    <item>
      <title>Hmm等Token影响模型推理能力</title>
      <link>https://mars160.github.io/posts/hmm%E7%AD%89token%E5%BD%B1%E5%93%8D%E6%A8%A1%E5%9E%8B%E6%8E%A8%E7%90%86%E8%83%BD%E5%8A%9B/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:33 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/hmm%E7%AD%89token%E5%BD%B1%E5%93%8D%E6%A8%A1%E5%9E%8B%E6%8E%A8%E7%90%86%E8%83%BD%E5%8A%9B/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;Hmm 等 Token 影响模型推理能力
    &lt;div id=&#34;hmm-等-token-影响模型推理能力&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#hmm-%e7%ad%89-token-%e5%bd%b1%e5%93%8d%e6%a8%a1%e5%9e%8b%e6%8e%a8%e7%90%86%e8%83%bd%e5%8a%9b&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Demystifying Reasoning Dynamics with Mutual Information: Thinking Tokens are Information Peaks in LLM Reasoning&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/hmm%E7%AD%89token%E5%BD%B1%E5%93%8D%E6%A8%A1%E5%9E%8B%E6%8E%A8%E7%90%86%E8%83%BD%E5%8A%9B/featured.png" />
    </item>
    
    <item>
      <title>AdaCoT：通过强化学习实现的帕累托最优自适应链式思维触发器</title>
      <link>https://mars160.github.io/posts/adacot%E9%80%9A%E8%BF%87%E5%BC%BA%E5%8C%96%E5%AD%A6%E4%B9%A0%E5%AE%9E%E7%8E%B0%E7%9A%84%E5%B8%95%E7%B4%AF%E6%89%98%E6%9C%80%E4%BC%98%E8%87%AA%E9%80%82%E5%BA%94%E9%93%BE%E5%BC%8F%E6%80%9D%E7%BB%B4%E8%A7%A6%E5%8F%91%E5%99%A8/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:28 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/adacot%E9%80%9A%E8%BF%87%E5%BC%BA%E5%8C%96%E5%AD%A6%E4%B9%A0%E5%AE%9E%E7%8E%B0%E7%9A%84%E5%B8%95%E7%B4%AF%E6%89%98%E6%9C%80%E4%BC%98%E8%87%AA%E9%80%82%E5%BA%94%E9%93%BE%E5%BC%8F%E6%80%9D%E7%BB%B4%E8%A7%A6%E5%8F%91%E5%99%A8/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;AdaCoT：通过强化学习实现的帕累托最优自适应链式思维触发器
    &lt;div id=&#34;adacot通过强化学习实现的帕累托最优自适应链式思维触发器&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#adacot%e9%80%9a%e8%bf%87%e5%bc%ba%e5%8c%96%e5%ad%a6%e4%b9%a0%e5%ae%9e%e7%8e%b0%e7%9a%84%e5%b8%95%e7%b4%af%e6%89%98%e6%9c%80%e4%bc%98%e8%87%aa%e9%80%82%e5%ba%94%e9%93%be%e5%bc%8f%e6%80%9d%e7%bb%b4%e8%a7%a6%e5%8f%91%e5%99%a8&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;AdaCoT: Pareto-Optimal Adaptive Chain-of-Thought Triggering via Reinforcement
Learning&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/adacot%E9%80%9A%E8%BF%87%E5%BC%BA%E5%8C%96%E5%AD%A6%E4%B9%A0%E5%AE%9E%E7%8E%B0%E7%9A%84%E5%B8%95%E7%B4%AF%E6%89%98%E6%9C%80%E4%BC%98%E8%87%AA%E9%80%82%E5%BA%94%E9%93%BE%E5%BC%8F%E6%80%9D%E7%BB%B4%E8%A7%A6%E5%8F%91%E5%99%A8/featured.png" />
    </item>
    
    <item>
      <title>AdaptThink: 让模型决定是否思考</title>
      <link>https://mars160.github.io/posts/adaptthink_-%E8%AE%A9%E6%A8%A1%E5%9E%8B%E5%86%B3%E5%AE%9A%E6%98%AF%E5%90%A6%E6%80%9D%E8%80%83/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:25 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/adaptthink_-%E8%AE%A9%E6%A8%A1%E5%9E%8B%E5%86%B3%E5%AE%9A%E6%98%AF%E5%90%A6%E6%80%9D%E8%80%83/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;AdaptThink: 让模型决定是否思考
    &lt;div id=&#34;adaptthink-让模型决定是否思考&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#adaptthink-%e8%ae%a9%e6%a8%a1%e5%9e%8b%e5%86%b3%e5%ae%9a%e6%98%af%e5%90%a6%e6%80%9d%e8%80%83&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;AdaptThink: Reasoning Models Can Learn When to Think&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/adaptthink_-%E8%AE%A9%E6%A8%A1%E5%9E%8B%E5%86%B3%E5%AE%9A%E6%98%AF%E5%90%A6%E6%80%9D%E8%80%83/featured.png" />
    </item>
    
    <item>
      <title>SpecReason：使用推测性推理实现加速推理</title>
      <link>https://mars160.github.io/posts/specreason%E4%BD%BF%E7%94%A8%E6%8E%A8%E6%B5%8B%E6%80%A7%E6%8E%A8%E7%90%86%E5%AE%9E%E7%8E%B0%E5%8A%A0%E9%80%9F%E6%8E%A8%E7%90%86/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:21 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/specreason%E4%BD%BF%E7%94%A8%E6%8E%A8%E6%B5%8B%E6%80%A7%E6%8E%A8%E7%90%86%E5%AE%9E%E7%8E%B0%E5%8A%A0%E9%80%9F%E6%8E%A8%E7%90%86/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;SpecReason：使用推测性推理实现加速推理
    &lt;div id=&#34;specreason使用推测性推理实现加速推理&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#specreason%e4%bd%bf%e7%94%a8%e6%8e%a8%e6%b5%8b%e6%80%a7%e6%8e%a8%e7%90%86%e5%ae%9e%e7%8e%b0%e5%8a%a0%e9%80%9f%e6%8e%a8%e7%90%86&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;SpecReason: Fast and Accurate Inference-Time Compute via Speculative Reasoning&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/specreason%E4%BD%BF%E7%94%A8%E6%8E%A8%E6%B5%8B%E6%80%A7%E6%8E%A8%E7%90%86%E5%AE%9E%E7%8E%B0%E5%8A%A0%E9%80%9F%E6%8E%A8%E7%90%86/featured.png" />
    </item>
    
    <item>
      <title>ThinkLess：一种无需训练的推理高效方法，用于减少推理冗余</title>
      <link>https://mars160.github.io/posts/thinkless%E4%B8%80%E7%A7%8D%E6%97%A0%E9%9C%80%E8%AE%AD%E7%BB%83%E7%9A%84%E6%8E%A8%E7%90%86%E9%AB%98%E6%95%88%E6%96%B9%E6%B3%95%E7%94%A8%E4%BA%8E%E5%87%8F%E5%B0%91%E6%8E%A8%E7%90%86%E5%86%97%E4%BD%99/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:20 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/thinkless%E4%B8%80%E7%A7%8D%E6%97%A0%E9%9C%80%E8%AE%AD%E7%BB%83%E7%9A%84%E6%8E%A8%E7%90%86%E9%AB%98%E6%95%88%E6%96%B9%E6%B3%95%E7%94%A8%E4%BA%8E%E5%87%8F%E5%B0%91%E6%8E%A8%E7%90%86%E5%86%97%E4%BD%99/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;ThinkLess：一种无需训练的推理高效方法，用于减少推理冗余
    &lt;div id=&#34;thinkless一种无需训练的推理高效方法用于减少推理冗余&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#thinkless%e4%b8%80%e7%a7%8d%e6%97%a0%e9%9c%80%e8%ae%ad%e7%bb%83%e7%9a%84%e6%8e%a8%e7%90%86%e9%ab%98%e6%95%88%e6%96%b9%e6%b3%95%e7%94%a8%e4%ba%8e%e5%87%8f%e5%b0%91%e6%8e%a8%e7%90%86%e5%86%97%e4%bd%99&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;ThinkLess: A Training-Free Inference-Efficient Method for Reducing Reasoning Redundancy&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/thinkless%E4%B8%80%E7%A7%8D%E6%97%A0%E9%9C%80%E8%AE%AD%E7%BB%83%E7%9A%84%E6%8E%A8%E7%90%86%E9%AB%98%E6%95%88%E6%96%B9%E6%B3%95%E7%94%A8%E4%BA%8E%E5%87%8F%E5%B0%91%E6%8E%A8%E7%90%86%E5%86%97%E4%BD%99/featured.png" />
    </item>
    
    <item>
      <title>Thinkless: LLM Learns When to Think</title>
      <link>https://mars160.github.io/posts/thinkless_-llm-learns-when-to-think/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:19 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/thinkless_-llm-learns-when-to-think/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;Thinkless: LLM Learns When to Think
    &lt;div id=&#34;thinkless-llm-learns-when-to-think&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#thinkless-llm-learns-when-to-think&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Thinkless: LLM Learns When to Think&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/thinkless_-llm-learns-when-to-think/featured.png" />
    </item>
    
    <item>
      <title>🧠思维操控：外部CoT辅助大模型推理</title>
      <link>https://mars160.github.io/posts/%E6%80%9D%E7%BB%B4%E6%93%8D%E6%8E%A7%E5%A4%96%E9%83%A8cot%E8%BE%85%E5%8A%A9%E5%A4%A7%E6%A8%A1%E5%9E%8B%E6%8E%A8%E7%90%86/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:16 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/%E6%80%9D%E7%BB%B4%E6%93%8D%E6%8E%A7%E5%A4%96%E9%83%A8cot%E8%BE%85%E5%8A%A9%E5%A4%A7%E6%A8%A1%E5%9E%8B%E6%8E%A8%E7%90%86/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;🧠 思维操控：外部 CoT 辅助大模型推理
    &lt;div id=&#34;-思维操控外部-cot-辅助大模型推理&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#-%e6%80%9d%e7%bb%b4%e6%93%8d%e6%8e%a7%e5%a4%96%e9%83%a8-cot-%e8%be%85%e5%8a%a9%e5%a4%a7%e6%a8%a1%e5%9e%8b%e6%8e%a8%e7%90%86&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Thought Manipulation: External Thought Can Be Efficient for Large  Reasoning Models&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/%E6%80%9D%E7%BB%B4%E6%93%8D%E6%8E%A7%E5%A4%96%E9%83%A8cot%E8%BE%85%E5%8A%A9%E5%A4%A7%E6%A8%A1%E5%9E%8B%E6%8E%A8%E7%90%86/featured.png" />
    </item>
    
    <item>
      <title>⏰开始作答：弹性推理实现的可扩展的CoT</title>
      <link>https://mars160.github.io/posts/%E5%BC%80%E5%A7%8B%E4%BD%9C%E7%AD%94%E5%BC%B9%E6%80%A7%E6%8E%A8%E7%90%86%E5%AE%9E%E7%8E%B0%E7%9A%84%E5%8F%AF%E6%89%A9%E5%B1%95%E7%9A%84cot/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:15 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/%E5%BC%80%E5%A7%8B%E4%BD%9C%E7%AD%94%E5%BC%B9%E6%80%A7%E6%8E%A8%E7%90%86%E5%AE%9E%E7%8E%B0%E7%9A%84%E5%8F%AF%E6%89%A9%E5%B1%95%E7%9A%84cot/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;⏰ 开始作答：弹性推理实现的可扩展的 CoT
    &lt;div id=&#34;-开始作答弹性推理实现的可扩展的-cot&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#-%e5%bc%80%e5%a7%8b%e4%bd%9c%e7%ad%94%e5%bc%b9%e6%80%a7%e6%8e%a8%e7%90%86%e5%ae%9e%e7%8e%b0%e7%9a%84%e5%8f%af%e6%89%a9%e5%b1%95%e7%9a%84-cot&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Scalable Chain of Thoughts via Elastic Reasoning&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/%E5%BC%80%E5%A7%8B%E4%BD%9C%E7%AD%94%E5%BC%B9%E6%80%A7%E6%8E%A8%E7%90%86%E5%AE%9E%E7%8E%B0%E7%9A%84%E5%8F%AF%E6%89%A9%E5%B1%95%E7%9A%84cot/featured.png" />
    </item>
    
    <item>
      <title>DEER：基于Trial置信度的推理早停</title>
      <link>https://mars160.github.io/posts/deer%E5%9F%BA%E4%BA%8Etrial%E7%BD%AE%E4%BF%A1%E5%BA%A6%E7%9A%84%E6%8E%A8%E7%90%86%E6%97%A9%E5%81%9C/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:12 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/deer%E5%9F%BA%E4%BA%8Etrial%E7%BD%AE%E4%BF%A1%E5%BA%A6%E7%9A%84%E6%8E%A8%E7%90%86%E6%97%A9%E5%81%9C/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;DEER：基于 Trial 置信度的推理早停
    &lt;div id=&#34;deer基于-trial-置信度的推理早停&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#deer%e5%9f%ba%e4%ba%8e-trial-%e7%bd%ae%e4%bf%a1%e5%ba%a6%e7%9a%84%e6%8e%a8%e7%90%86%e6%97%a9%e5%81%9c&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;DYNAMIC EARLY EXIT IN REASONING MODELS&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/deer%E5%9F%BA%E4%BA%8Etrial%E7%BD%AE%E4%BF%A1%E5%BA%A6%E7%9A%84%E6%8E%A8%E7%90%86%E6%97%A9%E5%81%9C/featured.png" />
    </item>
    
    <item>
      <title>SoftCoT：Prompt➡️SLM➡️LLM</title>
      <link>https://mars160.github.io/posts/softcotprompt%EF%B8%8Fslm%EF%B8%8Fllm/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:09 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/softcotprompt%EF%B8%8Fslm%EF%B8%8Fllm/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;SoftCoT：Prompt➡️SLM➡️LLM
    &lt;div id=&#34;softcotpromptslmllm&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#softcotpromptslmllm&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;SoftCoT: Soft Chain-of-Thought for Efficient Reasoning with LLMs&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/softcotprompt%EF%B8%8Fslm%EF%B8%8Fllm/featured.png" />
    </item>
    
    <item>
      <title>CODI: 通过自蒸馏将CoT压缩到连续空间中</title>
      <link>https://mars160.github.io/posts/codi_-%E9%80%9A%E8%BF%87%E8%87%AA%E8%92%B8%E9%A6%8F%E5%B0%86cot%E5%8E%8B%E7%BC%A9%E5%88%B0%E8%BF%9E%E7%BB%AD%E7%A9%BA%E9%97%B4%E4%B8%AD/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:06 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/codi_-%E9%80%9A%E8%BF%87%E8%87%AA%E8%92%B8%E9%A6%8F%E5%B0%86cot%E5%8E%8B%E7%BC%A9%E5%88%B0%E8%BF%9E%E7%BB%AD%E7%A9%BA%E9%97%B4%E4%B8%AD/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;CODI: 通过自蒸馏将 CoT 压缩到连续空间中
    &lt;div id=&#34;codi-通过自蒸馏将-cot-压缩到连续空间中&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#codi-%e9%80%9a%e8%bf%87%e8%87%aa%e8%92%b8%e9%a6%8f%e5%b0%86-cot-%e5%8e%8b%e7%bc%a9%e5%88%b0%e8%bf%9e%e7%bb%ad%e7%a9%ba%e9%97%b4%e4%b8%ad&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;CODI: Compressing Chain-of-Thought into Continuous Space via Self-Distillation&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/codi_-%E9%80%9A%E8%BF%87%E8%87%AA%E8%92%B8%E9%A6%8F%E5%B0%86cot%E5%8E%8B%E7%BC%A9%E5%88%B0%E8%BF%9E%E7%BB%AD%E7%A9%BA%E9%97%B4%E4%B8%AD/featured.png" />
    </item>
    
    <item>
      <title>HAWKEYE：大小模型协作实现精简CoT</title>
      <link>https://mars160.github.io/posts/hawkeye%E5%A4%A7%E5%B0%8F%E6%A8%A1%E5%9E%8B%E5%8D%8F%E4%BD%9C%E5%AE%9E%E7%8E%B0%E7%B2%BE%E7%AE%80cot/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:04 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/hawkeye%E5%A4%A7%E5%B0%8F%E6%A8%A1%E5%9E%8B%E5%8D%8F%E4%BD%9C%E5%AE%9E%E7%8E%B0%E7%B2%BE%E7%AE%80cot/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;HAWKEYE：大小模型协作实现精简 CoT
    &lt;div id=&#34;hawkeye大小模型协作实现精简-cot&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#hawkeye%e5%a4%a7%e5%b0%8f%e6%a8%a1%e5%9e%8b%e5%8d%8f%e4%bd%9c%e5%ae%9e%e7%8e%b0%e7%b2%be%e7%ae%80-cot&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Hawkeye:Efficient Reasoning with Model Collaboration&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/hawkeye%E5%A4%A7%E5%B0%8F%E6%A8%A1%E5%9E%8B%E5%8D%8F%E4%BD%9C%E5%AE%9E%E7%8E%B0%E7%B2%BE%E7%AE%80cot/featured.png" />
    </item>
    
    <item>
      <title>LCIRC: 长文档循环压缩方法 （LLM Training Free）</title>
      <link>https://mars160.github.io/posts/lcirc_-%E9%95%BF%E6%96%87%E6%A1%A3%E5%BE%AA%E7%8E%AF%E5%8E%8B%E7%BC%A9%E6%96%B9%E6%B3%95-llm-training-free/</link>
      <pubDate>Tue, 02 Sep 2025 07:22:00 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/lcirc_-%E9%95%BF%E6%96%87%E6%A1%A3%E5%BE%AA%E7%8E%AF%E5%8E%8B%E7%BC%A9%E6%96%B9%E6%B3%95-llm-training-free/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;LCIRC: 长文档循环压缩方法 （LLM Training Free）
    &lt;div id=&#34;lcirc-长文档循环压缩方法-llm-training-free&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#lcirc-%e9%95%bf%e6%96%87%e6%a1%a3%e5%be%aa%e7%8e%af%e5%8e%8b%e7%bc%a9%e6%96%b9%e6%b3%95-llm-training-free&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;LCIRC: A Recurrent Compression Approach for Efficient Long-form Context and Query Dependent Modeling in LLMs&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/lcirc_-%E9%95%BF%E6%96%87%E6%A1%A3%E5%BE%AA%E7%8E%AF%E5%8E%8B%E7%BC%A9%E6%96%B9%E6%B3%95-llm-training-free/featured.png" />
    </item>
    
    <item>
      <title>LLM在连续Latent空间中推理</title>
      <link>https://mars160.github.io/posts/llm%E5%9C%A8%E8%BF%9E%E7%BB%ADlatent%E7%A9%BA%E9%97%B4%E4%B8%AD%E6%8E%A8%E7%90%86/</link>
      <pubDate>Tue, 02 Sep 2025 07:21:57 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/llm%E5%9C%A8%E8%BF%9E%E7%BB%ADlatent%E7%A9%BA%E9%97%B4%E4%B8%AD%E6%8E%A8%E7%90%86/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;LLM 在连续 Latent 空间中推理
    &lt;div id=&#34;llm-在连续-latent-空间中推理&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#llm-%e5%9c%a8%e8%bf%9e%e7%bb%ad-latent-%e7%a9%ba%e9%97%b4%e4%b8%ad%e6%8e%a8%e7%90%86&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Training Large Language Models to Reason in a Continuous Latent Space&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/llm%E5%9C%A8%E8%BF%9E%E7%BB%ADlatent%E7%A9%BA%E9%97%B4%E4%B8%AD%E6%8E%A8%E7%90%86/featured.png" />
    </item>
    
    <item>
      <title>Pause Token：隐式CoT</title>
      <link>https://mars160.github.io/posts/pause-token%E9%9A%90%E5%BC%8Fcot/</link>
      <pubDate>Tue, 02 Sep 2025 07:21:55 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/pause-token%E9%9A%90%E5%BC%8Fcot/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;Pause Token：隐式 CoT
    &lt;div id=&#34;pause-token隐式-cot&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#pause-token%e9%9a%90%e5%bc%8f-cot&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Think before you speak: Training Language Models With Pause Tokens&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/pause-token%E9%9A%90%E5%BC%8Fcot/featured.png" />
    </item>
    
    <item>
      <title>面向模型推理思考优化的Test time scaling</title>
      <link>https://mars160.github.io/posts/%E9%9D%A2%E5%90%91%E6%A8%A1%E5%9E%8B%E6%8E%A8%E7%90%86%E6%80%9D%E8%80%83%E4%BC%98%E5%8C%96%E7%9A%84test-time-scaling/</link>
      <pubDate>Tue, 02 Sep 2025 07:21:53 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/%E9%9D%A2%E5%90%91%E6%A8%A1%E5%9E%8B%E6%8E%A8%E7%90%86%E6%80%9D%E8%80%83%E4%BC%98%E5%8C%96%E7%9A%84test-time-scaling/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;面向模型推理思考优化的 Test time scaling
    &lt;div id=&#34;面向模型推理思考优化的-test-time-scaling&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#%e9%9d%a2%e5%90%91%e6%a8%a1%e5%9e%8b%e6%8e%a8%e7%90%86%e6%80%9d%e8%80%83%e4%bc%98%e5%8c%96%e7%9a%84-test-time-scaling&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Towards Thinking-Optimal Scaling of Test-Time Compute for LLM Reasoning&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/%E9%9D%A2%E5%90%91%E6%A8%A1%E5%9E%8B%E6%8E%A8%E7%90%86%E6%80%9D%E8%80%83%E4%BC%98%E5%8C%96%E7%9A%84test-time-scaling/featured.png" />
    </item>
    
    <item>
      <title>CCoT：通过密集表示实现高效推理</title>
      <link>https://mars160.github.io/posts/ccot%E9%80%9A%E8%BF%87%E5%AF%86%E9%9B%86%E8%A1%A8%E7%A4%BA%E5%AE%9E%E7%8E%B0%E9%AB%98%E6%95%88%E6%8E%A8%E7%90%86/</link>
      <pubDate>Tue, 02 Sep 2025 07:21:49 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/ccot%E9%80%9A%E8%BF%87%E5%AF%86%E9%9B%86%E8%A1%A8%E7%A4%BA%E5%AE%9E%E7%8E%B0%E9%AB%98%E6%95%88%E6%8E%A8%E7%90%86/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;CCoT：通过密集表示实现高效推理
    &lt;div id=&#34;ccot通过密集表示实现高效推理&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#ccot%e9%80%9a%e8%bf%87%e5%af%86%e9%9b%86%e8%a1%a8%e7%a4%ba%e5%ae%9e%e7%8e%b0%e9%ab%98%e6%95%88%e6%8e%a8%e7%90%86&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Compressed Chain of Thought: Efficient Reasoning Through Dense Representations&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/ccot%E9%80%9A%E8%BF%87%E5%AF%86%E9%9B%86%E8%A1%A8%E7%A4%BA%E5%AE%9E%E7%8E%B0%E9%AB%98%E6%95%88%E6%8E%A8%E7%90%86/featured.png" />
    </item>
    
    <item>
      <title>Token预算意识的llm推理</title>
      <link>https://mars160.github.io/posts/token%E9%A2%84%E7%AE%97%E6%84%8F%E8%AF%86%E7%9A%84llm%E6%8E%A8%E7%90%86/</link>
      <pubDate>Tue, 02 Sep 2025 07:21:47 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/token%E9%A2%84%E7%AE%97%E6%84%8F%E8%AF%86%E7%9A%84llm%E6%8E%A8%E7%90%86/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;Token 预算意识的 llm 推理
    &lt;div id=&#34;token-预算意识的-llm-推理&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#token-%e9%a2%84%e7%ae%97%e6%84%8f%e8%af%86%e7%9a%84-llm-%e6%8e%a8%e7%90%86&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;Token-Budget-Aware LLM Reasoning&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/token%E9%A2%84%E7%AE%97%E6%84%8F%E8%AF%86%E7%9A%84llm%E6%8E%A8%E7%90%86/featured.png" />
    </item>
    
    <item>
      <title>INFTYTHINK：打破大型语言模型长上下文推理长度限制</title>
      <link>https://mars160.github.io/posts/inftythink%E6%89%93%E7%A0%B4%E5%A4%A7%E5%9E%8B%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E9%95%BF%E4%B8%8A%E4%B8%8B%E6%96%87%E6%8E%A8%E7%90%86%E9%95%BF%E5%BA%A6%E9%99%90%E5%88%B6/</link>
      <pubDate>Tue, 02 Sep 2025 07:21:43 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/inftythink%E6%89%93%E7%A0%B4%E5%A4%A7%E5%9E%8B%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E9%95%BF%E4%B8%8A%E4%B8%8B%E6%96%87%E6%8E%A8%E7%90%86%E9%95%BF%E5%BA%A6%E9%99%90%E5%88%B6/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;INFTYTHINK：打破大型语言模型长上下文推理长度限制
    &lt;div id=&#34;inftythink打破大型语言模型长上下文推理长度限制&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#inftythink%e6%89%93%e7%a0%b4%e5%a4%a7%e5%9e%8b%e8%af%ad%e8%a8%80%e6%a8%a1%e5%9e%8b%e9%95%bf%e4%b8%8a%e4%b8%8b%e6%96%87%e6%8e%a8%e7%90%86%e9%95%bf%e5%ba%a6%e9%99%90%e5%88%b6&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;InftyThink: Breaking the Length Limits of Long-Context Reasoning in Large Language Models&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/inftythink%E6%89%93%E7%A0%B4%E5%A4%A7%E5%9E%8B%E8%AF%AD%E8%A8%80%E6%A8%A1%E5%9E%8B%E9%95%BF%E4%B8%8A%E4%B8%8B%E6%96%87%E6%8E%A8%E7%90%86%E9%95%BF%E5%BA%A6%E9%99%90%E5%88%B6/featured.png" />
    </item>
    
    <item>
      <title>TokenSkip:可控的CoT压缩 in LLMs</title>
      <link>https://mars160.github.io/posts/tokenskip_%E5%8F%AF%E6%8E%A7%E7%9A%84cot%E5%8E%8B%E7%BC%A9-in-llms/</link>
      <pubDate>Tue, 02 Sep 2025 07:21:38 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/tokenskip_%E5%8F%AF%E6%8E%A7%E7%9A%84cot%E5%8E%8B%E7%BC%A9-in-llms/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;TokenSkip:可控的 CoT 压缩 in LLMs
    &lt;div id=&#34;tokenskip可控的-cot-压缩-in-llms&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#tokenskip%e5%8f%af%e6%8e%a7%e7%9a%84-cot-%e5%8e%8b%e7%bc%a9-in-llms&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;TokenSkip: Controllable Chain-of-Thought Compression in LLMs&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/tokenskip_%E5%8F%AF%E6%8E%A7%E7%9A%84cot%E5%8E%8B%E7%BC%A9-in-llms/featured.png" />
    </item>
    
    <item>
      <title>LightThinker: 每个想法压缩成两个token</title>
      <link>https://mars160.github.io/posts/lightthinker_-%E6%AF%8F%E4%B8%AA%E6%83%B3%E6%B3%95%E5%8E%8B%E7%BC%A9%E6%88%90%E4%B8%A4%E4%B8%AAtoken/</link>
      <pubDate>Tue, 02 Sep 2025 07:21:35 +0800</pubDate>
      
      <guid>https://mars160.github.io/posts/lightthinker_-%E6%AF%8F%E4%B8%AA%E6%83%B3%E6%B3%95%E5%8E%8B%E7%BC%A9%E6%88%90%E4%B8%A4%E4%B8%AAtoken/</guid>
      <description>&lt;h2 class=&#34;relative group&#34;&gt;LightThinker: 每个想法压缩成两个 token
    &lt;div id=&#34;lightthinker-每个想法压缩成两个-token&#34; class=&#34;anchor&#34;&gt;&lt;/div&gt;
    
    &lt;span
        class=&#34;absolute top-0 w-6 transition-opacity opacity-0 -start-6 not-prose group-hover:opacity-100 select-none&#34;&gt;
        &lt;a class=&#34;text-primary-300 dark:text-neutral-700 !no-underline&#34; href=&#34;#lightthinker-%e6%af%8f%e4%b8%aa%e6%83%b3%e6%b3%95%e5%8e%8b%e7%bc%a9%e6%88%90%e4%b8%a4%e4%b8%aa-token&#34; aria-label=&#34;锚点&#34;&gt;#&lt;/a&gt;
    &lt;/span&gt;
    
&lt;/h2&gt;
&lt;p&gt;如果 lt 确实靠谱&lt;/p&gt;</description>
      <media:content xmlns:media="http://search.yahoo.com/mrss/" url="https://mars160.github.io/posts/lightthinker_-%E6%AF%8F%E4%B8%AA%E6%83%B3%E6%B3%95%E5%8E%8B%E7%BC%A9%E6%88%90%E4%B8%A4%E4%B8%AAtoken/featured.png" />
    </item>
    
  </channel>
</rss>
