Spaces:

zhiyuanhucs
/

Meta-Ability-Alignment

Running

App Files Files Community

zhiyuanhucs committed on May 15

Commit

d8b71b8

verified ·

1 Parent(s): a001de1

Update index.html

Browse files

Files changed (1) hide show

index.html +112 -139

index.html CHANGED Viewed

@@ -1,166 +1,139 @@
 <!DOCTYPE html>
-<html>
 <head>
-  <meta charset="utf-8">
-  <meta name="description"        content="Beyond ‘Aha!’: Toward Systematic Meta‑Abilities Alignment in Large Reasoning Models introduces a three‑stage recipe that explicitly teaches deduction, induction, and abduction to large language models, delivering state‑of‑the‑art reasoning performance.">
-  <meta name="keywords" content="Meta‑Abilities, Deduction, Induction, Abduction, Reinforcement Learning, Large Reasoning Models, LLM, Chain‑of‑Thought">
-  <meta name="viewport" content="width=device-width, initial-scale=1">
-  <title>Beyond ‘Aha!’: Meta‑Ability Alignment for Large Reasoning Models</title>
-  <!-- Fonts & Icons -->
-  <link href="https://fonts.googleapis.com/css?family=Google+Sans|Noto+Sans|Castoro" rel="stylesheet">
-  <!-- Bulma & Theme Assets (keep original Nerfies paths / copy to your static folder) -->
-  <link rel="stylesheet" href="./static/css/bulma.min.css">
-  <link rel="stylesheet" href="./static/css/bulma-carousel.min.css">
-  <link rel="stylesheet" href="./static/css/bulma-slider.min.css">
-  <link rel="stylesheet" href="./static/css/fontawesome.all.min.css">
-  <link rel="stylesheet" href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
-  <link rel="stylesheet" href="./static/css/index.css">
-  <link rel="icon" href="./static/images/favicon.svg">
-  <!-- JS -->
-  <script src="https://ajax.googleapis.com/ajax/libs/jquery/3.5.1/jquery.min.js"></script>
   <script defer src="./static/js/fontawesome.all.min.js"></script>
-  <script src="./static/js/bulma-carousel.min.js"></script>
-  <script src="./static/js/bulma-slider.min.js"></script>
-  <script src="./static/js/index.js"></script>
 </head>
 <body>
-<!-- ────────────────────────────── HERO ───────────────────────────── → -->
-<section class="hero">
-  <div class="hero-body">
-    <div class="container is-max-desktop">
-      <div class="columns is-centered">
-        <div class="column has-text-centered">
-          <h1 class="title is-1 publication-title">Beyond ‘Aha!’: Toward Systematic Meta‑Abilities Alignment in Large Reasoning Models</h1>
-          <div class="is-size-5 publication-authors">
-            <span class="author-block"><a href="#" target="_blank">Zhiyuan Hu</a><sup>1*</sup>,</span>
-            <span class="author-block"><a href="#" target="_blank">Yibo Wang</a><sup>2</sup>,</span>
-            <span class="author-block"><a href="#" target="_blank">Hanze Dong</a><sup>3</sup>,</span>
-            <span class="author-block"><a href="#" target="_blank">Yuhui Xu</a><sup>3</sup>,</span>
-            <span class="author-block"><a href="#" target="_blank">Amrita Saha</a><sup>3</sup>,</span>
-            <span class="author-block"><a href="#" target="_blank">Caiming Xiong</a><sup>3</sup>,</span>
-            <span class="author-block"><a href="#" target="_blank">Bryan Hooi</a><sup>1†</sup>,</span>
-            <span class="author-block"><a href="#" target="_blank">Junnan Li</a><sup>3†</sup></span>
-          </div>
-          <div class="is-size-5 publication-authors">
-            <span class="author-block"><sup>1</sup>National University of Singapore,</span>
-            <span class="author-block"><sup>2</sup>Tsinghua University,</span>
-            <span class="author-block"><sup>3</sup>Salesforce AI Research</span>
-          </div>
-          <!-- Links → -->
           <div class="column has-text-centered">
-            <div class="publication-links">
-              <!-- PDF -->
-              <span class="link-block">
-                <a href="./static/pdfs/meta_ability_alignment.pdf" target="_blank" class="external-link button is-normal is-rounded is-dark">
-                  <span class="icon"><i class="fas fa-file-pdf"></i></span>
-                  <span>Paper</span>
-                </a>
-              </span>
-              <!-- arXiv -->
-              <span class="link-block">
-                <a href="https://arxiv.org/abs/2505.00000" target="_blank" class="external-link button is-normal is-rounded is-dark">
-                  <span class="icon"><i class="ai ai-arxiv"></i></span>
-                  <span>arXiv</span>
-                </a>
-              </span>
-              <!-- Video (optional) -->
-              <span class="link-block">
-                <a href="https://youtu.be/your_video" target="_blank" class="external-link button is-normal is-rounded is-dark">
-                  <span class="icon"><i class="fab fa-youtube"></i></span>
-                  <span>Video</span>
-                </a>
-              </span>
-              <!-- Code -->
-              <span class="link-block">
-                <a href="https://github.com/zhiyuanhubj/Meta-Ability-Alignment" target="_blank" class="external-link button is-normal is-rounded is-dark">
-                  <span class="icon"><i class="fab fa-github"></i></span>
-                  <span>Code</span>
-                </a>
-              </span>
             </div>
           </div>
-          <!--/ Links -->
         </div>
       </div>
     </div>
-  </div>
-</section>
-<!-- ────────────────────────────── TEASER ──────────────────────────── → -->
-<section class="hero teaser">
-  <div class="container is-max-desktop">
-    <div class="hero-body">
-      <video id="teaser" autoplay muted loop playsinline height="100%">
-        <source src="./static/videos/meta_teaser.mp4" type="video/mp4">
-      </video>
-      <h2 class="subtitle has-text-centered">
-        <span class="dnerf">Meta‑Ability Alignment</span> systematically teaches deduction, induction, and abduction to large language models, turning unpredictable “aha” moments into reliable reasoning capabilities.
-      </h2>
-    </div>
-  </div>
-</section>
-<!-- ────────────────────────────── ABSTRACT ─────────────────────────── → -->
-<section class="section">
-  <div class="container is-max-desktop">
-    <div class="columns is-centered has-text-centered">
-      <div class="column is-four-fifths">
-        <h2 class="title is-3">Abstract</h2>
-        <div class="content has-text-justified">
-          <p>Large reasoning models (LRMs) possess a latent capacity for long chain‑of‑thought reasoning, but emergent “aha” behaviors are unpredictable and hard to control. We introduce an explicit <em>Meta‑Ability Alignment</em> strategy that separately trains deduction, induction, and abduction specialists on self‑verifiable tasks, then merges them in parameter space and continues domain‑specific RL. This three‑stage recipe boosts performance by &gt;10% over instruction‑tuned baselines and lifts the attainable ceiling after downstream RL, yielding consistent gains across math, coding, and science benchmarks.</p>
         </div>
       </div>
     </div>
-    <!-- Paper video (optional) → -->
-    <div class="columns is-centered has-text-centered">
-      <div class="column is-four-fifths">
-        <h2 class="title is-3">Video</h2>
-        <div class="publication-video">
-          <iframe src="https://www.youtube.com/embed/your_video?rel=0&amp;showinfo=0" frameborder="0" allow="autoplay; encrypted-media" allowfullscreen></iframe>
-        </div>
-      </div>
     </div>
-  </div>
-</section>
-<!-- ────────────────────────────── PIPELINE IMAGE / CAROUSEL (OPTIONAL) ───────────────────────────── → -->
-<!-- You can replace this section with evaluation figures or a carousel of task demonstrations. → -->
-<section class="section" id="BibTeX">
-  <div class="container is-max-desktop content">
-    <h2 class="title">BibTeX</h2>
-    <pre><code>@article{hu2025metaability,
-  author    = {Hu, Zhiyuan and Wang, Yibo and Dong, Hanze and Xu, Yuhui and Saha, Amrita and Xiong, Caiming and Hooi, Bryan and Li, Junnan},
-  title     = {Beyond \`Aha!\': Toward Systematic Meta‑Abilities Alignment in Large Reasoning Models},
-  journal   = {NeurIPS},
-  year      = {2025},
-  url       = {https://arxiv.org/abs/2505.00000}
 }</code></pre>
-  </div>
-</section>
-<footer class="footer">
-  <div class="container">
-    <div class="content has-text-centered">
-      <a class="icon-link" target="_blank" href="./static/pdfs/meta_ability_alignment.pdf"><i class="fas fa-file-pdf"></i></a>
-      <a class="icon-link" href="https://github.com/zhiyuanhubj/Meta-Ability-Alignment" target="_blank"><i class="fab fa-github"></i></a>
     </div>
-    <div class="columns is-centered">
-      <div class="column is-8">
-        <div class="content">
-          <p>This website template is adapted from the <a target="_blank" href="https://nerfies.github.io">Nerfies</a> project page and is licensed under a <a rel="license" target="_blank" href="http://creativecommons.org/licenses/by-sa/4.0/">CC BY‑SA 4.0</a> License. Please attribute appropriately.</p>
         </div>
       </div>
     </div>
-  </div>
-</footer>
 </body>
 </html>

 <!DOCTYPE html>
+<html lang="en">
 <head>
+  <meta charset="utf-8" />
+  <meta name="viewport" content="width=device-width, initial-scale=1" />
+  <meta name="description" content="Beyond ‘Aha!’ — Systematic Meta‑Ability Alignment in Large Reasoning Models presents a three‑stage recipe that explicitly teaches deduction, induction, and abduction, achieving state‑of‑the‑art reasoning performance." />
+  <meta name="keywords" content="Meta‑Abilities, Deduction, Induction, Abduction, Reinforcement Learning, Large Reasoning Models" />
+  <title>Beyond “Aha!” — Meta‑Ability Alignment for Reasoning Models</title>
+  <!-- Web fonts, CSS framework, icon fonts, then page-specific overrides -->
+  <link href="https://fonts.googleapis.com/css?family=Google+Sans|Noto+Sans|Castoro" rel="stylesheet" />
+  <link rel="stylesheet" href="./static/css/bulma.min.css" />
+  <link rel="stylesheet" href="./static/css/fontawesome.all.min.css" />
+  <!-- Academicons provides the "ai ai-arxiv" glyph used by the arXiv button; without it that icon renders empty -->
+  <link rel="stylesheet" href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css" />
+  <link rel="stylesheet" href="./static/css/index.css" />
+  <link rel="icon" href="./static/images/favicon.svg" />
   <script defer src="./static/js/fontawesome.all.min.js"></script>
 </head>
 <body>
+  <!-- Header / Title: paper title, author list, affiliations and resource buttons -->
+  <section class="hero">
+    <div class="hero-body">
+      <div class="container is-max-desktop">
+        <div class="columns is-centered">
           <div class="column has-text-centered">
+            <h1 class="title is-1 publication-title">Beyond “Aha!”: Systematic Meta‑Ability Alignment in Large Reasoning Models</h1>
+            <div class="is-size-5 publication-authors">
+              <!-- Update author list as needed; superscripts refer to the affiliations listed below -->
+              <span class="author-block"><a href="#" target="_blank">Zhiyuan Hu</a><sup>1</sup>,</span>
+              <span class="author-block"><a href="#" target="_blank">Yibo Wang</a><sup>2</sup>,</span>
+              <span class="author-block"><a href="#" target="_blank">Hanze Dong</a><sup>3</sup>,</span>
+              <span class="author-block"><a href="#" target="_blank">Yuhui Xu</a><sup>3</sup>,</span>
+              <span class="author-block"><strong>Amrita Saha</strong><sup>3</sup>,</span>
+              <span class="author-block"><strong>Caiming Xiong</strong><sup>3</sup>,</span>
+              <span class="author-block"><strong>Bryan Hooi</strong><sup>1</sup>,</span>
+              <span class="author-block"><strong>Junnan Li</strong><sup>3</sup></span>
+            </div>
+            <div class="is-size-5 publication-authors">
+              <span class="author-block"><sup>1</sup>National University of Singapore,</span>
+              <span class="author-block"><sup>2</sup>Tsinghua University,</span>
+              <span class="author-block"><sup>3</sup>Salesforce AI Research</span>
+            </div>
+            <!-- Links: every button opens in a new tab, so each carries rel="noopener noreferrer" -->
+            <div class="column has-text-centered">
+              <div class="publication-links">
+                <!-- Paper PDF hosted in the project repository -->
+                <span class="link-block">
+                  <a href="https://github.com/zhiyuanhubj/Meta-Ability-Alignment/blob/main/Paper.pdf" target="_blank" rel="noopener noreferrer" class="external-link button is-normal is-rounded is-dark">
+                    <span class="icon"><i class="fas fa-file-pdf"></i></span>
+                    <span>Paper</span>
+                  </a>
+                </span>
+                <!-- TODO(review): this still points at the same PDF as the Paper button; swap in the arXiv abstract URL once confirmed -->
+                <span class="link-block">
+                  <a href="https://github.com/zhiyuanhubj/Meta-Ability-Alignment/blob/main/Paper.pdf" target="_blank" rel="noopener noreferrer" class="external-link button is-normal is-rounded is-dark">
+                    <span class="icon"><i class="ai ai-arxiv"></i></span>
+                    <span>arXiv</span>
+                  </a>
+                </span>
+                <!-- Code: project repository (replaces the template placeholder URL) -->
+                <span class="link-block">
+                  <a href="https://github.com/zhiyuanhubj/Meta-Ability-Alignment" target="_blank" rel="noopener noreferrer" class="external-link button is-normal is-rounded is-dark">
+                    <span class="icon"><i class="fab fa-github"></i></span>
+                    <span>Code</span>
+                  </a>
+                </span>
+                <!-- Data: releases page of the project repository; presumably where data is published, verify before shipping -->
+                <span class="link-block">
+                  <a href="https://github.com/zhiyuanhubj/Meta-Ability-Alignment/releases" target="_blank" rel="noopener noreferrer" class="external-link button is-normal is-rounded is-dark">
+                    <span class="icon"><i class="far fa-images"></i></span>
+                    <span>Data</span>
+                  </a>
+                </span>
+              </div>
             </div>
           </div>
         </div>
       </div>
     </div>
+  </section>
+  <!-- Abstract: one-paragraph summary of the method and headline result -->
+  <section class="section">
+    <div class="container is-max-desktop">
+      <div class="columns is-centered has-text-centered">
+        <div class="column is-four-fifths">
+          <h2 class="title is-3">Abstract</h2>
+          <div class="content has-text-justified">
+            <p>Large reasoning models (LRMs) possess a latent capacity for long chain‑of‑thought reasoning, but the timing and consistency of emergent “aha” behaviors remain unpredictable. We explicitly align LRMs with three meta‑abilities—<strong>deduction, induction, and abduction</strong>—using automatically generated, self‑verifiable tasks. Our three‑stage pipeline (individual alignment, parameter‑space merging, and domain‑specific reinforcement learning) lifts performance ceilings by&nbsp;&gt;10% over instruction‑tuned baselines and delivers state‑of‑the‑art accuracy across math, coding, and science benchmarks.</p>
+          </div>
         </div>
       </div>
     </div>
+  </section>
+  <!-- Key results tables followed by the three-stage framework diagram -->
+  <section class="section is-light">
+    <div class="container is-max-desktop">
+      <h2 class="title is-3 has-text-centered">Key Results</h2>
+      <figure class="image">
+        <img
+          src="./static/images/results_tables.png"
+          alt="Performance tables showing consistent gains from meta‑ability alignment.">
+        <figcaption class="has-text-centered">Table&nbsp;1&nbsp;&amp;&nbsp;2: Meta‑ability alignment boosts reasoning performance at both 7B and 32B scales.</figcaption>
+      </figure>
+      <br>
+      <h2 class="title is-3 has-text-centered">Three‑Stage Training Framework</h2>
+      <figure class="image">
+        <img
+          src="./static/images/framework.png"
+          alt="Three‑stage meta‑ability alignment framework diagram.">
+        <figcaption class="has-text-centered">Stage A: Meta‑ability alignment &nbsp;⟶&nbsp; Stage B: Parameter‑space merging &nbsp;⟶&nbsp; Stage C: Domain‑specific RL.</figcaption>
+      </figure>
     </div>
+  </section>
+  <!-- BibTeX: citation entry for the paper; text inside <pre> is shown verbatim -->
+  <section class="section" id="BibTeX">
+    <div class="container is-max-desktop content">
+      <h2 class="title">BibTeX</h2>
+      <pre><code>@article{hu2025metaability,
+  author  = {Hu, Zhiyuan and Wang, Yibo and Dong, Hanze and Xu, Yuhui and Saha, Amrita and Xiong, Caiming and Hooi, Bryan and Li, Junnan},
+  title   = {Beyond “Aha!”: Systematic Meta‑Ability Alignment in Large Reasoning Models},
+  journal = {NeurIPS},
+  year    = {2025}
 }</code></pre>
     </div>
+  </section>
+  <!-- Footer: quick icon links to the paper and code, followed by licensing notes -->
+  <footer class="footer">
+    <div class="container">
+      <div class="content has-text-centered">
+        <!-- Icon-only links get an aria-label so assistive technology can announce their purpose -->
+        <a class="icon-link" target="_blank" rel="noopener noreferrer" href="https://github.com/zhiyuanhubj/Meta-Ability-Alignment/blob/main/Paper.pdf" aria-label="Paper (PDF)"><i class="fas fa-file-pdf"></i></a>
+        <a class="icon-link" target="_blank" rel="noopener noreferrer" href="https://github.com/zhiyuanhubj/Meta-Ability-Alignment" aria-label="Code on GitHub"><i class="fab fa-github"></i></a>
+      </div>
+      <div class="columns is-centered">
+        <div class="column is-8">
+          <div class="content">
+            <p>This website is licensed under a <a rel="license noopener noreferrer" target="_blank" href="https://creativecommons.org/licenses/by-sa/4.0/">Creative Commons Attribution‑ShareAlike 4.0 International License</a>.</p>
+            <p>You are free to reuse the <a target="_blank" rel="noopener noreferrer" href="https://github.com/nerfies/nerfies.github.io">source code</a>; please include a link back in the footer.</p>
+          </div>
         </div>
       </div>
     </div>
+  </footer>
 </body>
 </html>