|
1 | 1 | - title: "The Fragile Truth of Saliency: Improving LLM Input Attribution via Attention Bias Optimization" |
2 | 2 | image: dummy.png |
3 | 3 | description: |
4 | | - authors: "<span style='color:blue'>Yihua Zhang</span>, <span style='color:blue'>Changsheng Wang</span>, <span style='color:blue'>Yiwei Chen</span>, <span style='color:blue'>Chongyu Fan</span>, <span style='color:blue'>Jinghan Jia</span>, <span style='color:blue'>Sijia Liu</span>" |
| 4 | + authors: "<span style='color:blue'>Y. Zhang</span>, <span style='color:blue'>C. Wang</span>, <span style='color:blue'>Y. Chen</span>, <span style='color:blue'>C. Fan</span>, <span style='color:blue'>J. Jia</span>, <span style='color:blue'>S. Liu</span>" |
5 | 5 | link: |
6 | 6 | url: https://neurips.cc/virtual/2025/poster/119184 |
7 | 7 | display: NeurIPS'25 (<span style='color:red'><b>Spotlight</b>, acceptance rate 3.2%</span>) |
8 | 8 | highlight: 0 |
9 | 9 | news2: |
10 | 10 | post: |
11 | 11 |
|
| 12 | +- title: "Simplicity Prevails: Rethinking Negative Preference Optimization for LLM Unlearning" |
| 13 | + image: dummy.png |
| 14 | + description: |
| 15 | + authors: "<span style='color:blue'>C. Fan*</span>, <span style='color:blue'>J. Liu*</span>, L. Lin*, <span style='color:blue'>J. Jia</span>, S. Mei, <span style='color:blue'>S. Liu</span>" |
| 16 | + link: |
| 17 | + url: https://arxiv.org/abs/2410.07163 |
| 18 | + display: NeurIPS'25 |
| 19 | + highlight: 0 |
| 20 | + news2: |
| 21 | + post: |
| 22 | + |
| 23 | +- title: "LLM Unlearning on Noisy Forget Sets: A Study of Incomplete, Rewritten, and Watermarked Data" |
| 24 | + image: dummy.png |
| 25 | + description: |
| 26 | + authors: "<span style='color:blue'>C. Wang</span>, <span style='color:blue'>Y. Zhang</span>, D. Wei, <span style='color:blue'>J. Jia</span>, P.-Y. Chen, <span style='color:blue'>S. Liu</span>" |
| 27 | + link: |
| 28 | + url: https://arxiv.org/abs/2510.09007 |
| 29 | + display: CCS AISec'25 |
| 30 | + highlight: 0 |
| 31 | + news2: |
| 32 | + post: |
| 33 | + |
| 34 | +- title: "One Token Embedding Is Enough to Deadlock Your Large Reasoning Model" |
| 35 | + image: dummy.png |
| 36 | + description: |
| 37 | + authors: "M. Zhang*, <span style='color:blue'>Y. Zhang*</span>, <span style='color:blue'>J. Jia</span>, Z. Wang, <span style='color:blue'>S. Liu</span>, T. Chen" |
| 38 | + link: |
| 39 | + url: https://arxiv.org/abs/2510.15965 |
| 40 | + display: NeurIPS'25 |
| 41 | + highlight: 0 |
| 42 | + news2: |
| 43 | + post: |
| 44 | + |
| 45 | +- title: "Reasoning Model Unlearning: Forgetting Traces, Not Just Answers, While Preserving Reasoning Skills" |
| 46 | + image: dummy.png |
| 47 | + description: |
| 48 | + authors: "<span style='color:blue'>C. Wang*</span>, <span style='color:blue'>C. Fan*</span>, <span style='color:blue'>Y. Zhang</span>, <span style='color:blue'>J. Jia</span>, D. Wei, P. Ram, N. Baracaldo, <span style='color:blue'>S. Liu</span>" |
| 49 | + link: |
| 50 | + url: https://arxiv.org/abs/2506.12963 |
| 51 | + display: EMNLP'25 (Main Track) |
| 52 | + highlight: 0 |
| 53 | + news2: |
| 54 | + post: |
| 55 | + |
| 56 | +- title: "LLM Unlearning Reveals a Stronger-Than-Expected Coreset Effect in Current Benchmarks" |
| 57 | + image: dummy.png |
| 58 | + description: |
| 59 | + authors: "<span style='color:blue'>S. Pal*</span>, <span style='color:blue'>C. Wang*</span>, J. Diffenderfer, B. Kailkhura, <span style='color:blue'>S. Liu</span>" |
| 60 | + link: |
| 61 | + url: https://arxiv.org/abs/2504.10185 |
| 62 | + display: COLM'25 |
| 63 | + highlight: 0 |
| 64 | + news2: |
| 65 | + post: |
| 66 | + |
| 67 | +- title: "Invisible Watermarks, Visible Gains: Steering Machine Unlearning with Bi-Level Watermarking Design" |
| 68 | + image: dummy.png |
| 69 | + description: |
| 70 | + authors: "<span style='color:blue'>Y. Sun*</span>, <span style='color:blue'>Y. Zhang*</span>, G. Liu, H. Xie, <span style='color:blue'>S. Liu</span>" |
| 71 | + link: |
| 72 | + url: https://arxiv.org/abs/2508.10065 |
| 73 | + display: ICCV'25 |
| 74 | + highlight: 0 |
| 75 | + news2: |
| 76 | + post: |
| 77 | + |
12 | 78 | - title: "Towards LLM Unlearning Resilient to Relearning Attacks: A Sharpness-Aware Minimization Perspective and Beyond" |
13 | 79 | image: dummy.png |
14 | 80 | description: |
|
0 commit comments