
Commit c10e1ca

Committed on 2024-11-26
1 parent: b25006a

2 files changed: 31 additions & 12 deletions

papers/list.json

Lines changed: 14 additions & 5 deletions
@@ -1,7 +1,16 @@
 [
+    {
+        "title": "A Simple Early Exiting Framework for Accelerating Sampling in Diffusion Models",
+        "author": "Taehong Moon et al",
+        "year": "2024",
+        "topic": "diffusion, early exit",
+        "venue": "ICML",
+        "description": "This paper presents Adaptive Score Estimation (ASE), a novel framework that accelerates diffusion model sampling by adaptively allocating computational resources based on the time step being processed. The authors observe that score estimation near the noise distribution (t→1) requires less computational power than estimation near the data distribution (t→0), leading them to develop a time-dependent early-exiting scheme where more neural network blocks are skipped during the noise-phase sampling steps. Their approach differs between architectures - for DiT models they skip entire blocks, while for U-ViT models they preserve the linear layers connected to skip connections while dropping other block components to maintain the residual pathway information. The authors fine-tune their models using a specially designed training procedure that employs exponential moving averages and weighted coefficients to ensure minimal information updates near t→0 while allowing more updates near t→1.",
+        "link": "https://arxiv.org/pdf/2408.05927"
+    },
     {
         "title": "Active Prompting with Chain-of-Thought for Large Language Models",
-        "author": "Shizhe Diao, et al",
+        "author": "Shizhe Diao et al",
         "year": "2023",
         "topic": "prompting, cot",
         "venue": "Arxiv",
@@ -10,7 +19,7 @@
     },
     {
         "title": "RAFT: Reward rAnked FineTuning for Generative Foundation Model Alignment",
-        "author": "Hanze Dong, et al",
+        "author": "Hanze Dong et al",
         "year": "2023",
         "topic": "watermark, offset learning",
         "venue": "TMLR",
@@ -19,7 +28,7 @@
     },
     {
         "title": "Finding needles in a haystack: A Black-Box Approach to Invisible Watermark Detection",
-        "author": "Minzhou Pan, et al",
+        "author": "Minzhou Pan et al",
         "year": "2024",
         "topic": "watermark, offset learning",
         "venue": "Arxiv",
@@ -28,7 +37,7 @@
     },
     {
         "title": "Mitigating the Alignment Tax of RLHF",
-        "author": "Yong Lin, et al",
+        "author": "Yong Lin et al",
         "year": "2024",
         "topic": "rlhf, alignment",
         "venue": "Arxiv",
@@ -37,7 +46,7 @@
     },
     {
         "title": "AsyncDiff: Parallelizing Diffusion Models by Asynchronous Denoising",
-        "author": "Zigeng Chen, et al",
+        "author": "Zigeng Chen et al",
         "year": "2024",
         "topic": "diffusion, parallelization, denoising",
         "venue": "Arxiv",

papers_read.html

Lines changed: 17 additions & 7 deletions
@@ -75,10 +75,10 @@ <h1>Here's where I keep a list of papers I have read.</h1>
             I typically use this to organize papers I found interesting. Please feel free to do whatever you want with it. Note that this is not every single paper I have ever read, just a collection of ones that I remember to put down.
         </p>
         <p id="paperCount">
-            So far, we have read 180 papers. Let's keep it up!
+            So far, we have read 181 papers. Let's keep it up!
         </p>
         <small id="searchCount">
-            Your search returned 180 papers. Nice!
+            Your search returned 181 papers. Nice!
         </small>

         <div class="search-inputs">
@@ -105,9 +105,19 @@ <h1>Here's where I keep a list of papers I have read.</h1>
             </thead>
             <tbody>

+                <tr>
+                    <td>A Simple Early Exiting Framework for Accelerating Sampling in Diffusion Models</td>
+                    <td>Taehong Moon et al</td>
+                    <td>2024</td>
+                    <td>diffusion, early exit</td>
+                    <td>ICML</td>
+                    <td>This paper presents Adaptive Score Estimation (ASE), a novel framework that accelerates diffusion model sampling by adaptively allocating computational resources based on the time step being processed. The authors observe that score estimation near the noise distribution (t→1) requires less computational power than estimation near the data distribution (t→0), leading them to develop a time-dependent early-exiting scheme where more neural network blocks are skipped during the noise-phase sampling steps. Their approach differs between architectures - for DiT models they skip entire blocks, while for U-ViT models they preserve the linear layers connected to skip connections while dropping other block components to maintain the residual pathway information. The authors fine-tune their models using a specially designed training procedure that employs exponential moving averages and weighted coefficients to ensure minimal information updates near t→0 while allowing more updates near t→1.</td>
+                    <td><a href="https://arxiv.org/pdf/2408.05927" target="_blank">Link</a></td>
+                </tr>
+
                 <tr>
                     <td>Active Prompting with Chain-of-Thought for Large Language Models</td>
-                    <td>Shizhe Diao, et al</td>
+                    <td>Shizhe Diao et al</td>
                     <td>2023</td>
                     <td>prompting, cot</td>
                     <td>Arxiv</td>
@@ -117,7 +127,7 @@ <h1>Here's where I keep a list of papers I have read.</h1>

                 <tr>
                     <td>RAFT: Reward rAnked FineTuning for Generative Foundation Model Alignment</td>
-                    <td>Hanze Dong, et al</td>
+                    <td>Hanze Dong et al</td>
                     <td>2023</td>
                     <td>watermark, offset learning</td>
                     <td>TMLR</td>
@@ -127,7 +137,7 @@ <h1>Here's where I keep a list of papers I have read.</h1>

                 <tr>
                     <td>Finding needles in a haystack: A Black-Box Approach to Invisible Watermark Detection</td>
-                    <td>Minzhou Pan, et al</td>
+                    <td>Minzhou Pan et al</td>
                     <td>2024</td>
                     <td>watermark, offset learning</td>
                     <td>Arxiv</td>
@@ -137,7 +147,7 @@ <h1>Here's where I keep a list of papers I have read.</h1>

                 <tr>
                     <td>Mitigating the Alignment Tax of RLHF</td>
-                    <td>Yong Lin, et al</td>
+                    <td>Yong Lin et al</td>
                     <td>2024</td>
                     <td>rlhf, alignment</td>
                     <td>Arxiv</td>
@@ -147,7 +157,7 @@ <h1>Here's where I keep a list of papers I have read.</h1>

                 <tr>
                     <td>AsyncDiff: Parallelizing Diffusion Models by Asynchronous Denoising</td>
-                    <td>Zigeng Chen, et al</td>
+                    <td>Zigeng Chen et al</td>
                     <td>2024</td>
                     <td>diffusion, parallelization, denoising</td>
                     <td>Arxiv</td>

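Aside on the newly added entry: its description outlines ASE's time-dependent early exiting, where fewer denoiser blocks run at noisy time steps (t→1) than at clean ones (t→0). Below is a minimal, hypothetical PyTorch sketch of that idea for a DiT-style block stack. It is not the authors' code; the names (TinyDiT, blocks_to_run) and the linear keep-fraction schedule are illustrative assumptions, and the U-ViT variant (keeping the linear layers tied to skip connections while dropping the rest of a block) is not modeled here.

# Hypothetical sketch, not the authors' implementation: time-dependent early
# exit over a stack of transformer blocks, DiT-style (whole blocks skipped).
import torch
import torch.nn as nn


class TinyDiTBlock(nn.Module):
    def __init__(self, dim: int):
        super().__init__()
        self.norm1 = nn.LayerNorm(dim)
        self.attn = nn.MultiheadAttention(dim, num_heads=4, batch_first=True)
        self.norm2 = nn.LayerNorm(dim)
        self.mlp = nn.Sequential(nn.Linear(dim, 4 * dim), nn.GELU(), nn.Linear(4 * dim, dim))

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        h = self.norm1(x)
        x = x + self.attn(h, h, h, need_weights=False)[0]
        x = x + self.mlp(self.norm2(x))
        return x


class TinyDiT(nn.Module):
    def __init__(self, dim: int = 64, depth: int = 12):
        super().__init__()
        self.blocks = nn.ModuleList(TinyDiTBlock(dim) for _ in range(depth))
        self.depth = depth

    def blocks_to_run(self, t: float) -> int:
        # Early-exit schedule: run every block near the data distribution
        # (t -> 0), skip a growing suffix near the noise distribution (t -> 1).
        # The linear schedule is an assumption; the paper tunes this per model.
        keep_frac = 1.0 - 0.5 * t  # keep 100% of blocks at t=0, 50% at t=1
        return max(1, int(round(keep_frac * self.depth)))

    def forward(self, x: torch.Tensor, t: float) -> torch.Tensor:
        # Only the leading blocks run; the remainder are "exited" early.
        for block in self.blocks[: self.blocks_to_run(t)]:
            x = block(x)
        return x


if __name__ == "__main__":
    model = TinyDiT()
    tokens = torch.randn(2, 16, 64)    # (batch, tokens, dim)
    out_noisy = model(tokens, t=0.95)  # few blocks: cheap score estimate
    out_clean = model(tokens, t=0.05)  # all blocks: full-capacity estimate
    print(out_noisy.shape, out_clean.shape)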