_bibliography/references.bib: 10 additions & 0 deletions
@@ -1,5 +1,15 @@
 ---
 ---
+@inproceedings{jacobs2025mirror,
+  title={Mirror, Mirror of the Flow: How Does Regularization Shape Implicit Bias?},
+  author={Tom Jacobs and Chao Zhou and Rebekka Burkholz},
+  booktitle={Forty-second International Conference on Machine Learning},
+  year={2025},
+  url={https://arxiv.org/abs/2504.12883},
+  pdf={https://arxiv.org/pdf/2504.12883},
+  img={mirror-mirror.jpg},
+  abstract={Implicit bias plays an important role in explaining how overparameterized models generalize well. Explicit regularization like weight decay is often employed in addition to prevent overfitting. While both concepts have been studied separately, in practice, they often act in tandem. Understanding their interplay is key to controlling the shape and strength of implicit bias, as it can be modified by explicit regularization. To this end, we incorporate explicit regularization into the mirror flow framework and analyze its lasting effects on the geometry of the training dynamics, covering three distinct effects: positional bias, type of bias, and range shrinking. Our analytical approach encompasses a broad class of problems, including sparse coding, matrix sensing, single-layer attention, and LoRA, for which we demonstrate the utility of our insights. To exploit the lasting effect of regularization and highlight the potential benefit of dynamic weight decay schedules, we propose to switch off weight decay during training, which can improve generalization, as we demonstrate in experiments.},
+}
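The proposal at the end of this abstract, switching weight decay off during training, is straightforward to prototype. Below is a minimal sketch of such a dynamic weight-decay schedule in PyTorch; it is not the paper's code, and the model, data, and switch epoch are placeholder assumptions.

```python
import torch
import torch.nn as nn

# Placeholder model and data; the paper analyzes settings such as sparse
# coding, matrix sensing, single-layer attention, and LoRA instead.
model = nn.Linear(10, 1)
optimizer = torch.optim.SGD(model.parameters(), lr=1e-2, weight_decay=1e-4)

SWITCH_EPOCH = 50  # hypothetical point at which weight decay is disabled

for epoch in range(100):
    if epoch == SWITCH_EPOCH:
        # Switch off weight decay for the rest of training; the bias the
        # regularization has induced so far persists in the dynamics.
        for group in optimizer.param_groups:
            group["weight_decay"] = 0.0
    x, y = torch.randn(32, 10), torch.randn(32, 1)  # stand-in batch
    optimizer.zero_grad()
    loss = nn.functional.mse_loss(model(x), y)
    loss.backward()
    optimizer.step()
```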
_data/alumni_members.yml: 10 additions & 0 deletions
@@ -15,6 +15,16 @@
       end_date: Jul 24
       url: https://nelaturuharsha.github.io/
 
+- role: Research engineers
+  members:
+    - name: Nikita (Nik) Vedeneev
+      last_name: Vedeneev
+      photo: c01mive.jpg
+      start_date: Dec 24
+      end_date: May 25
+      email: mikita.vedzeneyeu@cispa.de
+      description: "I am interested in making modern AI models efficient. In particular, I work on discovering and exploiting structure in Neural Networks (sparsity, low-dimensional representations and similar) for efficient training, fine-tuning and inference. I am a former full-time core developer for [PyTorch](https://github.com/pytorch/pytorch) and [Lightning Thunder](https://github.com/Lightning-AI/lightning-thunder). Check my [GitHub](https://github.com/nikitaved) to see what I work on now."
_data/news.yml: 11 additions & 2 deletions
@@ -1,11 +1,20 @@
+- date: 2. June 2025
+  headline: "Rebekka and Celia are presenting at the International Network Science Conference ([NetSci](https://netsci2025.github.io/)) in Maastricht."
+
+- date: 1. June 2025
+  headline: Welcome Baraah!
+
+- date: 1. May 2025
+  headline: "Our paper on [implicit bias](https://arxiv.org/pdf/2504.12883) has been accepted at ICML 2025."
+
 - date: 24. March 2025
   headline: "Rebekka is at [CPAL](https://cpal.cc/spotlight_track/) in Stanford presenting three of our [papers](/publications) as recent spotlights."
 
 - date: 22. January 2025
   headline: "Two papers
     [(1)](https://openreview.net/forum?id=g6v09VxgFw)
     [(2)](https://openreview.net/forum?id=U47ymTS3ut)
-    have been accepted at ICLR 2025 (see [publications](/publications))."
+    have been accepted at ICLR 2025."
 
 - date: 1. December 2024
   headline: "Welcome to Gowtham and Nik!"
@@ -21,7 +30,7 @@
   headline: "Welcome to Chao, Rahul, and Dong!"
 
 - date: 14. June 2024
-  headline: "Celia, Advait and Adarsh are presenting at the Helmholtz AI Conference: AI for Science ([HAICON](https://eventclass.it/haic2024/scientific/external-program/session?s=S-05a))."
+  headline: "Celia, Advait and Adarsh are presenting at the Helmholtz AI Conference: AI for Science ([HAICON](https://eventclass.it/haic2024/scientific/external-program/session?s=S-05a)) in Düsseldorf."
 
 - date: 1. May 2024
   headline: "Our paper on [improving GATs](https://openreview.net/forum?id=Sjv5RcqfuH) has been accepted at ICML 2024."
_data/team_members.yml: 6 additions & 9 deletions
@@ -74,12 +74,9 @@
       url: https://cispa.de/en/people/c01dosu
       description: "My current research focuses on theoretically elucidating the superior performance of Mixture of Experts models, with an emphasis on their generalization performance, sample complexity, training dynamics, and robustness to adversarial noises."
 
-- role: Research engineers
-  members:
-    - name: Nikita (Nik) Vedeneev
-      last_name: Vedeneev
-      photo: c01mive.jpg
-      start_date: Dec 2024
-      email: mikita.vedzeneyeu@cispa.de
-      url: https://cispa.de/en/people/c01mive
-      description: "I am interesting in making modern AI models efficient. In particular, I work on discovering and exploiting structure in Neural Networks (sparsity, low-dimensional representations and similar) for efficient training, fine-tuning and inference. I am a former full-time core developer for [PyTorch](https://github.com/pytorch/pytorch) and [Lightning Thunder](https://github.com/Lightning-AI/lightning-thunder). Check my [GitHub](https://github.com/nikitaved) to see what I work on now."
_site/index.html: 10 additions & 10 deletions
@@ -120,28 +120,28 @@ <h1 id="relational-ml-lab">Relational ML Lab</h1>
 <h3>News</h3>
 <div class="well">
 
-<b>24 Mar 2025</b>
-<p>Rebekka is at <a href="https://cpal.cc/spotlight_track/">CPAL</a> in Stanford presenting three of our <a href="/publications">papers</a> as recent spotlights.</p>
+<b>02 Jun 2025</b>
+<p>Rebekka and Celia are presenting at the International Network Science Conference (<a href="https://netsci2025.github.io/">NetSci</a>) in Maastricht.</p>
 
 <hr/>
 
-<b>22 Jan 2025</b>
-<p>Two papers <a href="https://openreview.net/forum?id=g6v09VxgFw">(1)</a> <a href="https://openreview.net/forum?id=U47ymTS3ut">(2)</a> have been accepted at ICLR 2025 (see <a href="/publications">publications</a>).</p>
+<b>01 Jun 2025</b>
+<p>Welcome Baraah!</p>
 
 <hr/>
 
-<b>01 Dec 2024</b>
-<p>Welcome to Gowtham and Nik!</p>
+<b>01 May 2025</b>
+<p>Our paper on <a href="https://arxiv.org/pdf/2504.12883">implicit bias</a> has been accepted at ICML 2025.</p>
 
 <hr/>
 
-<b>25 Sep 2024</b>
-<p>Three papers <a href="https://openreview.net/forum?id=EMkrwJY2de">(1)</a> <a href="https://openreview.net/forum?id=IfZwSRpqHl">(2)</a> <a href="https://openreview.net/forum?id=FNtsZLwkGr">(3)</a> have been accepted at NeurIPS 2024.</p>
+<b>24 Mar 2025</b>
+<p>Rebekka is at <a href="https://cpal.cc/spotlight_track/">CPAL</a> in Stanford presenting three of our <a href="/publications">papers</a> as recent spotlights.</p>
 
 <hr/>
 
-<b>01 Jul 2024</b>
-<p>Welcome to Chao, Rahul, and Dong!</p>
+<b>22 Jan 2025</b>
+<p>Two papers <a href="https://openreview.net/forum?id=g6v09VxgFw">(1)</a> <a href="https://openreview.net/forum?id=U47ymTS3ut">(2)</a> have been accepted at ICLR 2025.</p>
_site/news.html: 17 additions & 2 deletions
@@ -71,13 +71,28 @@ <h1 id="news">News</h1>
 
 <hr/>
 
+<h4>02 June 2025</h4>
+<p>Rebekka and Celia are presenting at the International Network Science Conference (<a href="https://netsci2025.github.io/">NetSci</a>) in Maastricht.</p>
+
+<hr/>
+
+<h4>01 June 2025</h4>
+<p>Welcome Baraah!</p>
+
+<hr/>
+
+<h4>01 May 2025</h4>
+<p>Our paper on <a href="https://arxiv.org/pdf/2504.12883">implicit bias</a> has been accepted at ICML 2025.</p>
+
+<hr/>
+
 <h4>24 March 2025</h4>
 <p>Rebekka is at <a href="https://cpal.cc/spotlight_track/">CPAL</a> in Stanford presenting three of our <a href="/publications">papers</a> as recent spotlights.</p>
 
 <hr/>
 
 <h4>22 January 2025</h4>
-<p>Two papers <a href="https://openreview.net/forum?id=g6v09VxgFw">(1)</a> <a href="https://openreview.net/forum?id=U47ymTS3ut">(2)</a> have been accepted at ICLR 2025 (see <a href="/publications">publications</a>).</p>
+<p>Two papers <a href="https://openreview.net/forum?id=g6v09VxgFw">(1)</a> <a href="https://openreview.net/forum?id=U47ymTS3ut">(2)</a> have been accepted at ICLR 2025.</p>
 
 <hr/>
 
@@ -97,7 +112,7 @@ <h4>01 July 2024</h4>
 <hr/>
 
 <h4>14 June 2024</h4>
-<p>Celia, Advait and Adarsh are presenting at the Helmholtz AI Conference: AI for Science (<a href="https://eventclass.it/haic2024/scientific/external-program/session?s=S-05a">HAICON</a>).</p>
+<p>Celia, Advait and Adarsh are presenting at the Helmholtz AI Conference: AI for Science (<a href="https://eventclass.it/haic2024/scientific/external-program/session?s=S-05a">HAICON</a>) in Düsseldorf.</p>
@@ (truncated: further hunks from the generated _site pages) @@
+<p>Implicit bias plays an important role in explaining how overparameterized models generalize well. Explicit regularization like weight decay is often employed in addition to prevent overfitting. While both concepts have been studied separately, in practice, they often act in tandem. Understanding their interplay is key to controlling the shape and strength of implicit bias, as it can be modified by explicit regularization. To this end, we incorporate explicit regularization into the mirror flow framework and analyze its lasting effects on the geometry of the training dynamics, covering three distinct effects: positional bias, type of bias, and range shrinking. Our analytical approach encompasses a broad class of problems, including sparse coding, matrix sensing, single-layer attention, and LoRA, for which we demonstrate the utility of our insights. To exploit the lasting effect of regularization and highlight the potential benefit of dynamic weight decay schedules, we propose to switch off weight decay during training, which can improve generalization, as we demonstrate in experiments.</p>
+<span class="na">title</span><span class="p">=</span><span class="s">{Mirror, Mirror of the Flow: How Does Regularization Shape Implicit Bias?}</span><span class="p">,</span>
+<span class="na">author</span><span class="p">=</span><span class="s">{Jacobs, Tom and Zhou, Chao and Burkholz, Rebekka}</span><span class="p">,</span>
+<span class="na">booktitle</span><span class="p">=</span><span class="s">{Forty-second International Conference on Machine Learning}</span><span class="p">,</span>
+<p>I am interested in making modern AI models efficient. In particular, I work on discovering and exploiting structure in Neural Networks (sparsity, low-dimensional representations and similar) for efficient training, fine-tuning and inference. I am a former full-time core developer for <a href="https://github.com/pytorch/pytorch">PyTorch</a> and <a href="https://github.com/Lightning-AI/lightning-thunder">Lightning Thunder</a>. Check my <a href="https://github.com/nikitaved">GitHub</a> to see what I work on now.</p>