<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <title>Formalization on emsenn.net</title>
    <link>https://emsenn.net/tags/formalization/</link>
    <description>Recent content in Formalization on emsenn.net</description>
    <generator>Hugo</generator>
    <language>en</language>
    <lastBuildDate>Sat, 07 Mar 2026 00:00:00 +0000</lastBuildDate>
    <atom:link href="https://emsenn.net/tags/formalization/index.xml" rel="self" type="application/rss+xml" />
    <item>
      <title>Survey: AI Agents for Formal Mathematics (External Landscape, 2026)</title>
      <link>https://emsenn.net/library/domains/engineering/domains/tech/domains/computing/domains/artificial-intelligence/domains/agents/texts/ai-math-agents-survey-2026/</link>
      <pubDate>Sat, 07 Mar 2026 00:00:00 +0000</pubDate>
      <guid>https://emsenn.net/library/domains/engineering/domains/tech/domains/computing/domains/artificial-intelligence/domains/agents/texts/ai-math-agents-survey-2026/</guid>
      <description>&lt;h2 id=&#34;ai-agents-for-formal-mathematics-external-landscape-survey&#34;&gt;&lt;a href=&#34;#ai-agents-for-formal-mathematics-external-landscape-survey&#34; class=&#34;heading-anchor&#34; aria-label=&#34;Link to this section&#34;&gt;¶&lt;/a&gt;AI Agents for Formal Mathematics: External Landscape Survey&#xA;&lt;/h2&gt;&#xA;&lt;p&gt;Survey of external tools, research, and practices for LLM agents doing formal&#xA;mathematics with proof assistants. Focused on what exists outside this&#xA;repository that could improve agent mathematical capability here.&lt;/p&gt;&#xA;&lt;h2 id=&#34;1-llm-based-mathematical-reasoning-agents&#34;&gt;&lt;a href=&#34;#1-llm-based-mathematical-reasoning-agents&#34; class=&#34;heading-anchor&#34; aria-label=&#34;Link to this section&#34;&gt;¶&lt;/a&gt;1. LLM-Based Mathematical Reasoning Agents&#xA;&lt;/h2&gt;&#xA;&lt;h3 id=&#34;deepseek-prover-v2-deepseek-2025&#34;&gt;&lt;a href=&#34;#deepseek-prover-v2-deepseek-2025&#34; class=&#34;heading-anchor&#34; aria-label=&#34;Link to this section&#34;&gt;¶&lt;/a&gt;DeepSeek-Prover-V2 (DeepSeek, 2025)&#xA;&lt;/h3&gt;&#xA;&lt;p&gt;Formal theorem proving in Lean 4. Key innovation: subgoal decomposition —&#xA;the model writes an informal proof sketch first, decomposes into formal&#xA;subgoals, then proves each subgoal. Trained with GRPO (not PPO) reinforcement&#xA;learning. Achieved 88.9% on MiniF2F-test and solved 49 out of 658 problems on&#xA;PutnamBench. Open-weight (7B and 671B MoE variants).&lt;/p&gt;</description>
    </item>
  </channel>
</rss>
