<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<!--
  RSS 2.0 feed for the "attention" tag listing on answer.freetools.me.
  The atom prefix is used once, for the channel's self-link. The content
  prefix is declared on the root but no content:* element appears in this
  document.
-->
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom" xmlns:content="http://purl.org/rss/1.0/modules/content/">
  <channel>
    <!-- Channel metadata: feed title, the HTML tag page this feed belongs to,
         a short description, the generating tool, and the content language. -->
    <title>Attention on Answer</title>
    <link>https://answer.freetools.me/tags/attention/</link>
    <description>Recent content in Attention on Answer</description>
    <generator>Hugo -- 0.152.2</generator>
    <language>zh-cn</language>
    <!-- Same timestamp as the pubDate of the first item below. -->
    <lastBuildDate>Thu, 12 Mar 2026 19:18:43 +0800</lastBuildDate>
    <!-- rel="self" marks this href as the feed document's own URL
         (the tag page link above with index.xml appended). -->
    <atom:link href="https://answer.freetools.me/tags/attention/index.xml" rel="self" type="application/rss+xml" />
    <!-- Items: two entries, listed in descending pubDate order. In each one the
         guid repeats the link URL verbatim and carries no isPermaLink
         attribute, which RSS 2.0 readers treat as isPermaLink="true". -->
    <!-- Item 1: article on the evolution of sequence-to-sequence learning,
         from statistical methods to the Transformer. -->
    <item>
      <title>序列到序列学习的二十年演进：从统计方法到Transformer的革命</title>
      <link>https://answer.freetools.me/%E5%BA%8F%E5%88%97%E5%88%B0%E5%BA%8F%E5%88%97%E5%AD%A6%E4%B9%A0%E7%9A%84%E4%BA%8C%E5%8D%81%E5%B9%B4%E6%BC%94%E8%BF%9B%E4%BB%8E%E7%BB%9F%E8%AE%A1%E6%96%B9%E6%B3%95%E5%88%B0transformer%E7%9A%84%E9%9D%A9%E5%91%BD/</link>
      <pubDate>Thu, 12 Mar 2026 19:18:43 +0800</pubDate>
      <guid>https://answer.freetools.me/%E5%BA%8F%E5%88%97%E5%88%B0%E5%BA%8F%E5%88%97%E5%AD%A6%E4%B9%A0%E7%9A%84%E4%BA%8C%E5%8D%81%E5%B9%B4%E6%BC%94%E8%BF%9B%E4%BB%8E%E7%BB%9F%E8%AE%A1%E6%96%B9%E6%B3%95%E5%88%B0transformer%E7%9A%84%E9%9D%A9%E5%91%BD/</guid>
      <description>深入解析Seq2Seq学习从统计机器翻译、RNN Encoder-Decoder、Attention机制到Transformer的完整技术演进历程，涵盖IBM Models、Phrase-based SMT、Bahdanau Attention、Teacher Forcing等核心技术，揭示现代大模型处理序列任务的技术根源。</description>
    </item>
    <!-- Item 2: article on self-attention versus cross-attention in the
         Transformer. -->
    <item>
      <title>自注意力与交叉注意力：Transformer如何用两种机制处理「同一序列」与「两个世界」</title>
      <link>https://answer.freetools.me/%E8%87%AA%E6%B3%A8%E6%84%8F%E5%8A%9B%E4%B8%8E%E4%BA%A4%E5%8F%89%E6%B3%A8%E6%84%8F%E5%8A%9Btransformer%E5%A6%82%E4%BD%95%E7%94%A8%E4%B8%A4%E7%A7%8D%E6%9C%BA%E5%88%B6%E5%A4%84%E7%90%86%E5%90%8C%E4%B8%80%E5%BA%8F%E5%88%97%E4%B8%8E%E4%B8%A4%E4%B8%AA%E4%B8%96%E7%95%8C/</link>
      <pubDate>Thu, 12 Mar 2026 03:15:16 +0800</pubDate>
      <guid>https://answer.freetools.me/%E8%87%AA%E6%B3%A8%E6%84%8F%E5%8A%9B%E4%B8%8E%E4%BA%A4%E5%8F%89%E6%B3%A8%E6%84%8F%E5%8A%9Btransformer%E5%A6%82%E4%BD%95%E7%94%A8%E4%B8%A4%E7%A7%8D%E6%9C%BA%E5%88%B6%E5%A4%84%E7%90%86%E5%90%8C%E4%B8%80%E5%BA%8F%E5%88%97%E4%B8%8E%E4%B8%A4%E4%B8%AA%E4%B8%96%E7%95%8C/</guid>
      <description>深入解析Transformer中Self-Attention和Cross-Attention的技术原理、数学公式、历史演进与实际应用。从GPT的自回归生成到机器翻译的编码器-解码器架构，揭示这两种注意力机制如何塑造现代大模型的设计哲学。</description>
    </item>
  </channel>
</rss>
