tom cohere

celrm · celrm · commit e01db20e64ae · 2025-08-19T13:40:46.000+02:00
diff --git a/_bibliography/references.bib b/_bibliography/references.bib
@@ -5,8 +5,8 @@ @inproceedings{jacobs2025mirror
 author={Tom Jacobs and Chao Zhou and Rebekka Burkholz},
 booktitle={Forty-second International Conference on Machine Learning},
 year={2025},
-url={https://arxiv.org/abs/2504.12883},
-pdf={https://arxiv.org/pdf/2504.12883},
+url={https://openreview.net/forum?id=MLiR9LS5PW},
+pdf={https://openreview.net/pdf?id=MLiR9LS5PW},
 img={mirror-mirror.jpg},
 abstract={Implicit bias plays an important role in explaining how overparameterized models generalize well. Explicit regularization like weight decay is often employed in addition to prevent overfitting. While both concepts have been studied separately, in practice, they often act in tandem. Understanding their interplay is key to controlling the shape and strength of implicit bias, as it can be modified by explicit regularization. To this end, we incorporate explicit regularization into the mirror flow framework and analyze its lasting effects on the geometry of the training dynamics, covering three distinct effects: positional bias, type of bias, and range shrinking. Our analytical approach encompasses a broad class of problems, including sparse coding, matrix sensing, single-layer attention, and LoRA, for which we demonstrate the utility of our insights. To exploit the lasting effect of regularization and highlight the potential benefit of dynamic weight decay schedules, we propose to switch off weight decay during training, which can improve generalization, as we demonstrate in experiments.},
 }
diff --git a/_data/alumni_members.yml b/_data/alumni_members.yml
@@ -1,17 +1,4 @@
 
-
-- role: Research engineers
-  members:
-    - name: Nikita Vedeneev
-      last_name: Vedeneev
-      photo: c01mive.jpg
-      start_date: Dec 24
-      end_date: May 25
-      email: mikita.vedzeneyeu@cispa.de
-      url: https://github.com/nikitaved
-      description: "I am interesting in making modern AI models efficient. In particular, I work on discovering and exploiting structure in Neural Networks (sparsity, low-dimensional representations and similar) for efficient training, fine-tuning and inference. I am a former full-time core developer for [PyTorch](https://github.com/pytorch/pytorch) and [Lightning Thunder](https://github.com/Lightning-AI/lightning-thunder). Check my [GitHub](https://github.com/nikitaved) to see what I work on now."
-      next: Senior Engineer at NVIDIA
-      
 - role: Research assistants
   members:
     - name: Ben Horvath
@@ -42,6 +29,18 @@
       start_date: Dec 21
       end_date: Oct 22
 
+- role: Research engineers
+  members:
+    - name: Nikita Vedeneev
+      last_name: Vedeneev
+      photo: c01mive.jpg
+      start_date: Dec 24
+      end_date: May 25
+      email: mikita.vedzeneyeu@cispa.de
+      url: https://github.com/nikitaved
+      description: "I am interested in making modern AI models efficient. In particular, I work on discovering and exploiting structure in Neural Networks (sparsity, low-dimensional representations and similar) for efficient training, fine-tuning and inference. I am a former full-time core developer for [PyTorch](https://github.com/pytorch/pytorch) and [Lightning Thunder](https://github.com/Lightning-AI/lightning-thunder). Check my [GitHub](https://github.com/nikitaved) to see what I work on now."
+      next: Senior Engineer at NVIDIA
+
 - role: Visiting students
   members:
     - name: Otto Piramuthu
diff --git a/_data/news.yml b/_data/news.yml
@@ -2,7 +2,7 @@
   headline: "Rebekka and Celia are presenting at the Workshop on Mining and Learning with Graphs ([MLG](https://mlg-europe.github.io/2025/)) in Porto with a keynote and two posters, respectively."
 
 - date: 14. August 2025
-  headline: "Tom is [presenting](https://cohere.com/events/Cohere-Labs-Tom-Jacobs-2025) his work on implicit regularization at Cohere Labs: Open Science Community."
+  headline: "Tom is [presenting](https://cohere.com/events/Cohere-Labs-Tom-Jacobs-2025) his work on implicit regularization at Cohere Labs: Open Science Community ([video](/outreach#tom-jacobs--cohere-labs-aug-14-2025))."
 
 - date: 12. June 2025
   headline: "Tom is attending the AI & Mathematics Workshop ([AIM](https://aimath.nl/index.php/2025/03/13/4th-aim-cluster-event-tilburg/)) at Tilburg University."
diff --git a/_data/outreach.yml b/_data/outreach.yml
@@ -1,4 +1,18 @@
 videos:
+- title: "Weight Decay Controls Implicit Regularization: Insights on Generalization and Sparsity"
+  date: 2025-08-14
+  speaker: "Tom Jacobs"
+  venue: "Cohere Labs"
+  video: https://www.youtube.com/embed/KwxqXbgu78c?si=U-5CdYYuHwoP6r5o
+  papers:
+    - title: "Mask in the Mirror: Implicit Sparsification"
+      authors: "Tom Jacobs and Rebekka Burkholz"
+      conference: ICLR 2025
+      link: https://openreview.net/forum?id=U47ymTS3ut
+    - title: "Mirror, Mirror of the Flow: How Does Regularization Shape Implicit Bias?"
+      authors: "Tom Jacobs, Chao Zhou, and Rebekka Burkholz"
+      conference: ICML 2025
+      link: https://openreview.net/forum?id=MLiR9LS5PW
 - title: "Rewiring Graph Neural Networks: When Less is More and Structure Matters"
   date: 2025-02-13
   speaker: "Celia Rubio-Madrigal"
diff --git a/_site/index.html b/_site/index.html
@@ -136,7 +136,7 @@ <h3>News</h3>
 <hr/>
 
 <b>14 Aug 2025</b>
-<p>Tom is <a href="https://cohere.com/events/Cohere-Labs-Tom-Jacobs-2025">presenting</a> his work on implicit regularization at Cohere Labs: Open Science Community.</p>
+<p>Tom is <a href="https://cohere.com/events/Cohere-Labs-Tom-Jacobs-2025">presenting</a> his work on implicit regularization at Cohere Labs: Open Science Community (<a href="/outreach#tom-jacobs--cohere-labs-aug-14-2025">video</a>).</p>
 
 <hr/>
 
diff --git a/_site/news.html b/_site/news.html
@@ -83,7 +83,7 @@ <h4>15 September 2025</h4>
 <hr />
 
 <h4>14 August 2025</h4>
-<p>Tom is <a href="https://cohere.com/events/Cohere-Labs-Tom-Jacobs-2025">presenting</a> his work on implicit regularization at Cohere Labs: Open Science Community.</p>
+<p>Tom is <a href="https://cohere.com/events/Cohere-Labs-Tom-Jacobs-2025">presenting</a> his work on implicit regularization at Cohere Labs: Open Science Community (<a href="/outreach#tom-jacobs--cohere-labs-aug-14-2025">video</a>).</p>
 
 <hr />
 
diff --git a/_site/outreach/index.html b/_site/outreach/index.html
@@ -85,6 +85,38 @@ <h1 id="outreach">Outreach</h1>
 
 <h2 id="videos" class="anchor">Videos</h2>
 
+<h3 id="tom-jacobs--cohere-labs-aug-14-2025">Tom Jacobs @ Cohere Labs (Aug 14, 2025)</h3>
+<h4 id="weight-decay-controls-implicit-regularization-insights-on-generalization-and-sparsity">Weight Decay Controls Implicit Regularization: Insights on Generalization and Sparsity</h4>
+
+<div class="row">
+
+  <div class="col-sm-6 clearfix">
+
+    <p>Based on papers:</p>
+    <ul>
+
+<li>
+        <strong>Mask in the Mirror: Implicit Sparsification</strong>,
+        Tom Jacobs and Rebekka Burkholz,
+        <em>ICLR 2025</em>. (<a href="https://openreview.net/forum?id=U47ymTS3ut">Link to paper</a>)
+</li>
+
+<li>
+        <strong>Mirror, Mirror of the Flow: How Does Regularization Shape Implicit Bias?</strong>,
+        Tom Jacobs, Chao Zhou, and Rebekka Burkholz,
+        <em>ICML 2025</em>. (<a href="https://openreview.net/forum?id=MLiR9LS5PW">Link to paper</a>)
+</li>
+
+</ul>
+
+  </div>
+
+  <div class="col-sm-6 clearfix">
+    <iframe width="374" height="210" src="https://www.youtube.com/embed/KwxqXbgu78c?si=U-5CdYYuHwoP6r5o&amp;autoplay=0" title="video player" frameborder="0" allow="accelerometer; clipboard-write; encrypted-media; gyroscope; picture-in-picture; web-share" referrerpolicy="strict-origin-when-cross-origin" allowfullscreen=""></iframe>
+  </div>
+
+</div>
+
 <h3 id="celia-rubio-madrigal--cohere-labs-feb-13-2025">Celia Rubio-Madrigal @ Cohere Labs (Feb 13, 2025)</h3>
 <h4 id="rewiring-graph-neural-networks-when-less-is-more-and-structure-matters">Rewiring Graph Neural Networks: When Less is More and Structure Matters</h4>
 
diff --git a/_site/publications/index.html b/_site/publications/index.html
@@ -389,7 +389,7 @@ <h2 id="accepted-papers">Accepted papers</h2>
         <div id="jacobs2025mirror" class="col-sm-10">
         <!-- Title -->
         
-          <div class="title"><a href="https://arxiv.org/abs/2504.12883"><b>Mirror, Mirror of the Flow: How Does Regularization Shape Implicit Bias?</b></a></div>
+          <div class="title"><a href="https://openreview.net/forum?id=MLiR9LS5PW"><b>Mirror, Mirror of the Flow: How Does Regularization Shape Implicit Bias?</b></a></div>
         
         <!-- Author -->
         <div class="author">
@@ -410,7 +410,7 @@ <h2 id="accepted-papers">Accepted papers</h2>
           <!-- Links/Buttons -->
         <div class="links"><a class="conf btn btn-sm z-depth-0">ICML</a><a class="bibtex btn btn-sm z-depth-0" role="button">Bib</a>
             <a class="abstract btn btn-sm z-depth-0" role="button">Abs</a>
-            <!-- <a href="https://arxiv.org/pdf/2504.12883" class="btn btn-sm z-depth-0" role="button">PDF</a> -->
+            <!-- <a href="https://openreview.net/pdf?id=MLiR9LS5PW" class="btn btn-sm z-depth-0" role="button">PDF</a> -->
           </div>
           
 
@@ -424,7 +424,7 @@ <h2 id="accepted-papers">Accepted papers</h2>
   <span class="na">author</span> <span class="p">=</span> <span class="s">{Jacobs, Tom and Zhou, Chao and Burkholz, Rebekka}</span><span class="p">,</span>
   <span class="na">booktitle</span> <span class="p">=</span> <span class="s">{Forty-second International Conference on Machine Learning}</span><span class="p">,</span>
   <span class="na">year</span> <span class="p">=</span> <span class="s">{2025}</span><span class="p">,</span>
-  <span class="na">url</span> <span class="p">=</span> <span class="s">{https://arxiv.org/abs/2504.12883}</span><span class="p">,</span>
+  <span class="na">url</span> <span class="p">=</span> <span class="s">{https://openreview.net/forum?id=MLiR9LS5PW}</span><span class="p">,</span>
 <span class="p">}</span></code></pre></figure>
           </div>
         </div>
diff --git a/_site/team/index.html b/_site/team/index.html
@@ -264,20 +264,6 @@ <h2 id="alumni">Alumni</h2>
 
 <!--  -->
 
-<div class="row">
-  <div class="col-sm-12 clearfix">
-
-    <h3>Research engineers</h3>
-
-    <p><a href="https://github.com/nikitaved">Nikita Vedeneev</a>: 
-Dec 24-May 25. Next ⇢ Senior Engineer at NVIDIA.</p>
-
-  </div>
-
-</div>
-
-<!--  -->
-
 <div class="row">
   <div class="col-sm-12 clearfix">
 
@@ -301,6 +287,20 @@ <h3>Research assistants</h3>
 
 <!--  -->
 
+<div class="row">
+  <div class="col-sm-12 clearfix">
+
+    <h3>Research engineers</h3>
+
+    <p><a href="https://github.com/nikitaved">Nikita Vedeneev</a>: 
+Dec 24-May 25. Next ⇢ Senior Engineer at NVIDIA.</p>
+
+  </div>
+
+</div>
+
+<!--  -->
+
 <div class="row">
   <div class="col-sm-12 clearfix">