|
---
title: 'Exploiting Distribution Constraints for Scalable and Efficient Image Retrieval'
description: ICLR 2025 paper
categories: blog
---

*By Mohammad Omama*


# Exploiting Distribution Constraints for Scalable and Efficient Image Retrieval

> Proceedings of the International Conference on Learning Representations (ICLR) 2025

`TLDR:` Image Retrieval with Foundation Models: Better, Faster, Distribution-Aware!

[ArXiv](https://arxiv.org/abs/2410.07022)

[Project Website](https://mohdomama.github.io/IRDC-Project-Website/)

## Motivation

Image retrieval is pivotal in many real-world applications, from visual place recognition in robotics to personalized recommendations in e-commerce. However, current state-of-the-art (SOTA) image retrieval methods face two significant problems:

1. **Scalability Issue**: SOTA image retrieval methods train large models separately for each dataset. This is __not scalable__.

2. **Efficiency Issue**: SOTA image retrieval methods use large embeddings, and since retrieval time grows directly with embedding size, this is __not efficient__.

Our research targets these challenges with two key questions:
- **Q1 (Scalability)**: Can we enhance the performance of universal off-the-shelf models in an entirely unsupervised way?
- **Q2 (Efficiency)**: Is it possible to design an effective unsupervised dimensionality reduction method that preserves the similarity structure and can adaptively perform well at varying embedding sizes?

## Contributions

To tackle the scalability and efficiency challenges, our work introduces the following novel ideas:

- **Autoencoders with Strong Variance Constraints (AE-SVC)**: Addressing scalability, AE-SVC significantly improves off-the-shelf foundation model embeddings through three rigorously enforced constraints: orthogonality, mean-centering, and unit variance in the latent space. We both empirically demonstrate and mathematically prove that these constraints reshape the cosine-similarity distribution, making embeddings more discriminative (a minimal sketch of these constraints follows this list).

- **Single Shot Similarity Space Distillation ((SS)<sub>2</sub>D)**: To tackle efficiency, (SS)<sub>2</sub>D provides dimensionality reduction that preserves the similarity structure and further allows embeddings to adaptively scale without retraining. This enables smaller segments of the embedding to retain high retrieval performance, significantly speeding up retrieval.
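
Here is a minimal PyTorch sketch of the AE-SVC idea, assuming the three constraints are enforced as soft penalties on the latent batch statistics; the layer sizes, single-layer encoder/decoder, and penalty weight are illustrative assumptions, not the configuration used in the paper.

```python
import torch
import torch.nn as nn

class AESVC(nn.Module):
    """Toy autoencoder; a single linear encoder/decoder and the dimensions are placeholders."""
    def __init__(self, in_dim=768, latent_dim=512):
        super().__init__()
        self.encoder = nn.Linear(in_dim, latent_dim)
        self.decoder = nn.Linear(latent_dim, in_dim)

    def forward(self, x):
        z = self.encoder(x)
        return z, self.decoder(z)

def ae_svc_loss(model, x, lam=1.0):
    """Reconstruction loss plus soft penalties for mean-centering, unit variance,
    and orthogonality (decorrelation) of the latent dimensions over a batch."""
    z, x_hat = model(x)
    recon = ((x - x_hat) ** 2).mean()

    z_mean = z.mean(dim=0)
    mean_pen = (z_mean ** 2).mean()                       # push latent mean to zero

    zc = z - z_mean
    cov = (zc.T @ zc) / (x.shape[0] - 1)                  # latent covariance over the batch
    var_pen = ((torch.diagonal(cov) - 1.0) ** 2).mean()   # unit variance per dimension
    orth_pen = (cov - torch.diag(torch.diagonal(cov))).pow(2).mean()  # zero off-diagonals

    return recon + lam * (mean_pen + var_pen + orth_pen)

# Hypothetical usage: x is a batch of foundation-model features (e.g. DINO), shape [B, 768].
# After training, the encoder's latent output serves as the improved embedding.
```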
| 41 | + |
| 42 | +## Methodology |
| 43 | + |
| 44 | +Our proposed approach follows a two-step pipeline: |
| 45 | + |
| 46 | +1. **AE-SVC** first trains an autoencoder with the constraints mentioned to enhance the embeddings from foundation models. |
| 47 | +2. The improved embeddings from AE-SVC are then distilled using **(SS)<sub>2</sub>D**, producing embeddings that are both efficient and adaptive at various sizes. |
| 48 | + |
| 49 | +The training process ensures that the resulting embeddings, even at smaller sizes, preserve similarity relationships, making them highly effective for retrieval tasks. |
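
The following is a minimal sketch of a single-shot similarity-space distillation objective, under the assumption that adaptivity comes from supervising nested prefixes of one student embedding against the pairwise cosine similarities of the AE-SVC embeddings; the linear student, the prefix schedule, and the squared-error loss are illustrative assumptions rather than the paper's exact formulation.

```python
import torch
import torch.nn as nn
import torch.nn.functional as F

def pairwise_cosine(x):
    """Pairwise cosine-similarity matrix of a [B, D] tensor."""
    x = F.normalize(x, dim=-1)
    return x @ x.T

def ss2d_loss(student, teacher_z, prefix_dims=(32, 64, 128, 256)):
    """Train one student projection so that every prefix of its output
    reproduces the teacher's pairwise cosine-similarity matrix."""
    z = student(teacher_z)                          # student embedding, [B, max(prefix_dims)]
    target = pairwise_cosine(teacher_z).detach()    # similarity structure to preserve
    loss = torch.zeros((), device=teacher_z.device)
    for d in prefix_dims:
        loss = loss + ((pairwise_cosine(z[:, :d]) - target) ** 2).mean()
    return loss / len(prefix_dims)

# Hypothetical usage: teacher_z is a batch of AE-SVC embeddings, e.g. shape [B, 512].
# At query time, any prefix z[:, :d] can be indexed directly for faster retrieval.
student = nn.Linear(512, 256)
```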
| 50 | + |
| 51 | + |
| 52 | + |
| 53 | +## Impact on Cosine Similarity Distribution |
| 54 | + |
| 55 | +Our AE-SVC method profoundly impacts cosine similarity distributions, significantly reducing their variance. |
| 56 | +Lower variance in similarity distributions correlates with improved discriminative power as we mathematically prove in our paper. |
| 57 | +Our method shows remarkable benefits, particularly for general-purpose foundation models like DINO, compared to already optimized dataset-specific models such as Cosplace. |
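
To make the claim above concrete, here is a small helper that measures the statistic in question, assuming it is the variance of the off-diagonal pairwise cosine similarities within a set of embeddings; the variable names in the usage comment are hypothetical.

```python
import torch
import torch.nn.functional as F

def cosine_similarity_variance(emb):
    """Variance of off-diagonal pairwise cosine similarities for an [N, D] embedding set."""
    e = F.normalize(emb, dim=-1)
    sims = e @ e.T
    mask = ~torch.eye(emb.shape[0], dtype=torch.bool, device=emb.device)  # drop self-similarities
    return sims[mask].var().item()

# Hypothetical comparison: raw foundation-model embeddings vs. their AE-SVC outputs.
# A lower value indicates the tighter, more discriminative distribution discussed above.
# cosine_similarity_variance(dino_embeddings)     # e.g. raw DINO features
# cosine_similarity_variance(ae_svc_embeddings)   # after AE-SVC
```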


## Results

Our experimental validation demonstrates:

- **AE-SVC** consistently surpasses baseline PCA methods across multiple datasets, offering an average improvement of 15.5% in retrieval performance.
- **(SS)<sub>2</sub>D**, building upon AE-SVC, achieves up to a 10% further improvement at smaller embedding sizes, outperforming traditional dimensionality reduction methods such as VAEs and approaching the theoretical upper bound set by SSD.

This advancement represents a significant step towards more practical, scalable, and efficient image retrieval, improving both speed and accuracy.