Skip to content

Commit 78544b4

Browse files
author
Nora
committed
docs: update papers
1 parent 74063e1 commit 78544b4

File tree

14 files changed

+161
-25
lines changed

14 files changed

+161
-25
lines changed

.github/ISSUE_TEMPLATE/missing_paper.yml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -71,6 +71,7 @@ body:
7171
- data_synthesis
7272
- data_analysis
7373
- methods_analysis
74+
- others
7475
validations:
7576
required: true
7677
- type: input

README.md

Lines changed: 12 additions & 7 deletions
Large diffs are not rendered by default.

app/data/papers_data_collection.yaml

Lines changed: 30 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -10,6 +10,28 @@
1010
arxiv: https://arxiv.org/abs/2603.13023
1111
github: https://github.com/GAIR-NLP/OpenSWE
1212
huggingface: https://huggingface.co/datasets/GAIR/OpenSWE
13+
- short_name: SWE-Next
14+
title: 'SWE-Next: Scalable Real-World Software Engineering Tasks for Agents'
15+
authors: Jiarong Liang, Zhiheng Lyu, Zijie Liu, Xiangchao Chen, Ping Nie, Kai Zou,
16+
Wenhu Chen
17+
year: '2026'
18+
venue: arXiv preprint arXiv:2603.20691
19+
month: 2026-03
20+
links:
21+
arxiv: https://arxiv.org/abs/2603.20691
22+
github: https://github.com/TIGER-AI-Lab/SWE-Next
23+
- short_name: RepoLaunch
24+
title: 'RepoLaunch: Automating Build&Test Pipeline of Code Repositories on ANY Language
25+
and ANY Platform'
26+
authors: Kenan Li, Rongzhi Li, Linghao Zhang, Qirui Jin, Liao Zhu, Xiaosong Huang,
27+
Geng Zhang, Yikai Zhang, Shilin He, Chengxing Xie, Xin Zhang, Zijian Jin, Bowen
28+
Li, Chaoyun Zhang, Yu Kang, Yufan Huang, Elsie Nallipogu, Saravan Rajmohan, Qingwei
29+
Lin, Dongmei Zhang
30+
year: '2026'
31+
venue: arXiv preprint arXiv:2603.05026
32+
month: 2026-03
33+
links:
34+
arxiv: https://arxiv.org/abs/2603.05026
1335
- short_name: DockSmith
1436
title: 'DockSmith: Scaling Reliable Coding Environments via an Agentic Docker Builder'
1537
authors: Jiaran Zhang, Luck Ma, Yanhao Li, Fanqi Wan, Di Qi, Xu Zhao, Jieyi Hou,
@@ -104,3 +126,11 @@
104126
links:
105127
arxiv: https://arxiv.org/abs/2505.20411v2
106128
openreview: https://openreview.net/forum?id=nMpJoVmRy1
129+
- short_name: SetUpAgent, SWEE-bench, SWA-bench
130+
title: Automated Benchmark Generation for Repository-Level Coding Tasks
131+
authors: Konstantinos Vergopoulos, Mark Niklas Müller, Martin Vechev
132+
year: '2025'
133+
venue: arXiv preprint arXiv:2503.07701
134+
month: 2025-03
135+
links:
136+
arxiv: https://arxiv.org/abs/2503.07701

app/data/papers_evaluation_datasets.yaml

Lines changed: 17 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -40,6 +40,15 @@
4040
links:
4141
arxiv: https://arxiv.org/abs/2603.15401
4242
github: https://github.com/GeniusHTX/SWE-Skills-Bench
43+
- short_name: MobileDev-Bench
44+
title: 'MobileDev-Bench: A Comprehensive Benchmark for Evaluating Language Models
45+
on Mobile Application Development'
46+
authors: Moshood A. Fakorede, Krishna Upadhyay, A. B. Siddique, Umar Farooq
47+
year: '2026'
48+
venue: arXiv preprint arXiv:2603.24946
49+
month: 2026-03
50+
links:
51+
arxiv: https://arxiv.org/abs/2603.24946
4352
- short_name: SWE Context Bench
4453
title: 'SWE Context Bench: A Benchmark for Context Learning in Coding'
4554
authors: Jared Zhu, Minhao Hu, Junde Wu
@@ -219,6 +228,14 @@
219228
month: 2025-03
220229
links:
221230
arxiv: https://arxiv.org/abs/2503.06680v2
231+
- short_name: SetUpAgent, SWEE-bench, SWA-bench
232+
title: Automated Benchmark Generation for Repository-Level Coding Tasks
233+
authors: Konstantinos Vergopoulos, Mark Niklas Müller, Martin Vechev
234+
year: '2025'
235+
venue: arXiv preprint arXiv:2503.07701
236+
month: 2025-03
237+
links:
238+
arxiv: https://arxiv.org/abs/2503.07701
222239
- short_name: SWE-Lancer
223240
title: "SWE-Lancer: Can Frontier LLMs Earn $1 Million from Real-World\n \
224241
\ Freelance Software Engineering?"

app/data/papers_others.yaml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1 @@
1+
[]

app/data/papers_rl.yaml

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,12 @@
1+
- short_name: SWE-Fuse
2+
title: 'SWE-Fuse: Empowering Software Agents via Issue-free Trajectory Learning
3+
and Entropy-aware RLVR Training'
4+
authors: Xin-Cheng Wen, Binbin Chen, Haoxuan Lan, Hang Yu, Peng Di, Cuiyun Gao
5+
year: '2026'
6+
venue: arXiv preprint arXiv:2603.07927
7+
month: 2026-03
8+
links:
9+
arxiv: https://arxiv.org/abs/2603.07927
110
- short_name: SWE-Master
211
title: 'SWE-Master: Unleashing the Potential of Software Engineering Agents via
312
Post-Training'

app/docs/admin/data.json

Lines changed: 65 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,12 +1,61 @@
11
{
2-
"generated": "2026-03-28",
2+
"generated": "2026-04-01",
33
"stats": {
4-
"total": 204,
5-
"data": 53,
6-
"methods": 130,
4+
"total": 209,
5+
"data": 57,
6+
"methods": 131,
77
"analysis": 23
88
},
99
"papers": [
10+
{
11+
"id": 210,
12+
"short_name": "RepoLaunch",
13+
"title": "RepoLaunch: Automating Build&Test Pipeline of Code Repositories on ANY Language and ANY Platform",
14+
"authors": "Kenan Li, Rongzhi Li, Linghao Zhang, Qirui Jin, Liao Zhu, Xiaosong Huang, Geng Zhang, Yikai Zhang, Shilin He, Chengxing Xie, Xin Zhang, Zijian Jin, Bowen Li, Chaoyun Zhang, Yu Kang, Yufan Huang, Elsie Nallipogu, Saravan Rajmohan, Qingwei Lin, Dongmei Zhang",
15+
"venue": "arXiv preprint arXiv:2603.05026",
16+
"month": "2026-03",
17+
"category": "data_collection",
18+
"links": {
19+
"arxiv": "https://arxiv.org/abs/2603.05026"
20+
}
21+
},
22+
{
23+
"id": 209,
24+
"short_name": "SWE-Fuse",
25+
"title": "SWE-Fuse: Empowering Software Agents via Issue-free Trajectory Learning and Entropy-aware RLVR Training",
26+
"authors": "Xin-Cheng Wen, Binbin Chen, Haoxuan Lan, Hang Yu, Peng Di, Cuiyun Gao",
27+
"venue": "arXiv preprint arXiv:2603.07927",
28+
"month": "2026-03",
29+
"category": "rl",
30+
"links": {
31+
"arxiv": "https://arxiv.org/abs/2603.07927"
32+
}
33+
},
34+
{
35+
"id": 208,
36+
"short_name": "MobileDev-Bench",
37+
"title": "MobileDev-Bench: A Comprehensive Benchmark for Evaluating Language Models on Mobile Application Development",
38+
"authors": "Moshood A. Fakorede, Krishna Upadhyay, A. B. Siddique, Umar Farooq",
39+
"venue": "arXiv preprint arXiv:2603.24946",
40+
"month": "2026-03",
41+
"category": "evaluation_datasets",
42+
"links": {
43+
"arxiv": "https://arxiv.org/abs/2603.24946"
44+
}
45+
},
46+
{
47+
"id": 207,
48+
"short_name": "SWE-Next",
49+
"title": "SWE-Next: Scalable Real-World Software Engineering Tasks for Agents",
50+
"authors": "Jiarong Liang, Zhiheng Lyu, Zijie Liu, Xiangchao Chen, Ping Nie, Kai Zou, Wenhu Chen",
51+
"venue": "arXiv preprint arXiv:2603.20691",
52+
"month": "2026-03",
53+
"category": "data_collection",
54+
"links": {
55+
"arxiv": "https://arxiv.org/abs/2603.20691",
56+
"github": "https://github.com/TIGER-AI-Lab/SWE-Next"
57+
}
58+
},
1059
{
1160
"id": 206,
1261
"short_name": "RepoRepair",
@@ -1791,6 +1840,18 @@
17911840
"doi": "http://dx.doi.org/10.1109/ICSE-Companion66252.2025.00075"
17921841
}
17931842
},
1843+
{
1844+
"id": 211,
1845+
"short_name": "SetUpAgent, SWEE-bench, SWA-bench",
1846+
"title": "Automated Benchmark Generation for Repository-Level Coding Tasks",
1847+
"authors": "Konstantinos Vergopoulos, Mark Niklas Müller, Martin Vechev",
1848+
"venue": "arXiv preprint arXiv:2503.07701",
1849+
"month": "2025-03",
1850+
"category": "data_collection,evaluation_datasets",
1851+
"links": {
1852+
"arxiv": "https://arxiv.org/abs/2503.07701"
1853+
}
1854+
},
17941855
{
17951856
"id": 160,
17961857
"short_name": "CoSIL",

app/docs/index.md

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -30,7 +30,7 @@
3030
<a href="https://github.com/DeepSoftwareAnalytics/Awesome-Issue-Resolution/graphs/contributors" target="_blank">
3131
<img src="https://img.shields.io/github/contributors/DeepSoftwareAnalytics/Awesome-Issue-Resolution?style=for-the-badge&color=green&logo=github" alt="Contributors">
3232
</a>
33-
<img src="https://img.shields.io/badge/papers-204-green?style=for-the-badge&logo=googlescholar&logoColor=white" alt="Papers Count">
33+
<img src="https://img.shields.io/badge/papers-209-green?style=for-the-badge&logo=googlescholar&logoColor=white" alt="Papers Count">
3434
</div>
3535

3636
<!-- Interactive Exploration Badges -->
@@ -392,6 +392,11 @@ This section includes research works that provide in-depth analysis and discussi
392392
* **Agents in the Wild** (2025) [![Website](https://img.shields.io/badge/Website-paper-5B9BD5?logo=googlechrome&logoColor=white)](https://insights.logicstar.ai/){: target="_blank" }
393393
<!-- END PAPERS:methods_analysis -->
394394

395+
### Others
396+
397+
<!-- START PAPERS:others -->
398+
<!-- END PAPERS:others -->
399+
395400
---
396401

397402
## 🚀 Challenges and Opportunities

app/docs/news.md

Lines changed: 3 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -6,16 +6,15 @@
66

77
<!-- START_RECENT_PAPERS -->
88
- **BeyondSWE**: BeyondSWE: Can Current Code Agent Survive Beyond Single-Repo Bug Fixing? [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/abs/2603.03194) [![GitHub](https://img.shields.io/badge/GitHub-code-181717?logo=github&logoColor=white)](https://github.com/AweAI-Team/BeyondSWE) [![HuggingFace](https://img.shields.io/badge/HuggingFace-model-FFD21E?logo=huggingface&logoColor=black)](https://huggingface.co/datasets/AweAI-Team/BeyondSWE) [![Website](https://img.shields.io/badge/Website-link-5B9BD5?logo=googlechrome&logoColor=white)](https://aweai-team.github.io/BeyondSWE/)
9+
- **MobileDev-Bench**: MobileDev-Bench: A Comprehensive Benchmark for Evaluating Language Models on Mobile Application Development [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/abs/2603.24946)
910
- **RepoRepair**: RepoRepair: Leveraging Code Documentation for Repository-Level Automated Program Repair [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/abs/2603.01048) [![GitHub](https://img.shields.io/badge/GitHub-code-181717?logo=github&logoColor=white)](https://github.com/ZhongQiangDev/RepoRepair)
1011
- **SWE-Adept**: SWE-Adept: An LLM-Based Agentic Framework for Deep Codebase Analysis and Structured Issue Resolution [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/abs/2603.01327)
1112
- **SWE-Atlas**: SWE-Atlas [![Website](https://img.shields.io/badge/Website-link-5B9BD5?logo=googlechrome&logoColor=white)](https://labs.scale.com/leaderboard/sweatlas-qna)
1213
- **SWE-CI**: SWE-CI: Evaluating Agent Capabilities in Maintaining Codebases via Continuous Integration [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/abs/2603.03823) [![GitHub](https://img.shields.io/badge/GitHub-code-181717?logo=github&logoColor=white)](https://github.com/SKYLENAGE-AI/SWE-CI) [![HuggingFace](https://img.shields.io/badge/HuggingFace-model-FFD21E?logo=huggingface&logoColor=black)](https://huggingface.co/datasets/skylenage/SWE-CI)
14+
- **SWE-Fuse**: SWE-Fuse: Empowering Software Agents via Issue-free Trajectory Learning and Entropy-aware RLVR Training [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/abs/2603.07927)
15+
- **SWE-Next**: SWE-Next: Scalable Real-World Software Engineering Tasks for Agents [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/abs/2603.20691) [![GitHub](https://img.shields.io/badge/GitHub-code-181717?logo=github&logoColor=white)](https://github.com/TIGER-AI-Lab/SWE-Next)
1316
- **SWE-Skills-Bench**: SWE-Skills-Bench: Do Agent Skills Actually Help in Real-World Software Engineering? [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/abs/2603.15401) [![GitHub](https://img.shields.io/badge/GitHub-code-181717?logo=github&logoColor=white)](https://github.com/GeniusHTX/SWE-Skills-Bench)
1417
- **OpenSWE**: daVinci-Env: Open SWE Environment Synthesis at Scale [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/abs/2603.13023) [![GitHub](https://img.shields.io/badge/GitHub-code-181717?logo=github&logoColor=white)](https://github.com/GAIR-NLP/OpenSWE) [![HuggingFace](https://img.shields.io/badge/HuggingFace-model-FFD21E?logo=huggingface&logoColor=black)](https://huggingface.co/datasets/GAIR/OpenSWE)
15-
- **DockSmith**: DockSmith: Scaling Reliable Coding Environments via an Agentic Docker Builder [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/abs/2602.00592) [![HuggingFace](https://img.shields.io/badge/HuggingFace-model-FFD21E?logo=huggingface&logoColor=black)](https://huggingface.co/collections/8sj7df9k8m5x8/docksmith)
16-
- **SWE Context Bench**: SWE Context Bench: A Benchmark for Context Learning in Coding [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/pdf/2602.08316)
17-
- **SWE-Master**: SWE-Master: Unleashing the Potential of Software Engineering Agents via Post-Training [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/abs/2602.03411) [![GitHub](https://img.shields.io/badge/GitHub-code-181717?logo=github&logoColor=white)](https://github.com/RUCAIBox/SWE-Master)
18-
- **SWE-World**: SWE-World: Building Software Engineering Agents in Docker-Free Environments [![arXiv](https://img.shields.io/badge/arXiv-paper-B31B1B?logo=arxiv&logoColor=white)](https://arxiv.org/abs/2602.03419) [![GitHub](https://img.shields.io/badge/GitHub-code-181717?logo=github&logoColor=white)](https://github.com/RUCAIBox/SWE-World)
1918
<!-- END_RECENT_PAPERS -->
2019

2120
### Recent Updates

app/view/admin/static/js/admin.js

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -9,6 +9,9 @@ let currentlyEditingCell = null;
99

1010
// Multi-select state: Map of paper.id → paper object for all checked papers
1111
const selectedPapers = new Map();
12+
const PAPER_CATEGORIES = ['sft', 'rl', 'data_collection', 'data_analysis', 'data_synthesis',
13+
'evaluation_datasets', 'training_datasets', 'inference_scaling',
14+
'methods_analysis', 'workflow', 'tool', 'memory', 'multi_agent', 'single_agent', 'others'];
1215

1316
// Form field definitions for each entity type
1417
const FORM_FIELDS = {
@@ -19,9 +22,7 @@ const FORM_FIELDS = {
1922
{ name: 'month', label: 'Date (YYYY-MM)', type: 'text', required: true, placeholder: '2026-01' },
2023
{ name: 'venue', label: 'Venue', type: 'text', required: true },
2124
{ name: 'category', label: 'Category', type: 'multiselect', required: true,
22-
options: ['sft', 'rl', 'data_collection', 'data_analysis', 'data_synthesis',
23-
'evaluation_datasets', 'training_datasets', 'inference_scaling',
24-
'methods_analysis', 'workflow', 'tool', 'memory', 'multi_agent', 'single_agent'] },
25+
options: PAPER_CATEGORIES },
2526
{ name: 'abstract', label: 'Abstract', type: 'textarea', required: false },
2627
{ name: 'arxiv_link', label: 'arXiv Link', type: 'url', required: false },
2728
{ name: 'github_link', label: 'GitHub Link', type: 'url', required: false },
@@ -180,8 +181,7 @@ function initializeFilters() {
180181
// Initialize category options
181182
const categorySelect = document.getElementById('filter-category');
182183
if (categorySelect) {
183-
const categories = ['sft', 'rl', 'data_collection', 'data_analysis', 'data_synthesis', 'evaluation_datasets', 'training_datasets', 'inference_scaling', 'methods_analysis', 'workflow', 'tool', 'memory', 'multi_agent', 'single_agent'];
184-
categories.forEach(cat => {
184+
PAPER_CATEGORIES.forEach(cat => {
185185
const option = document.createElement('option');
186186
option.value = cat;
187187
option.textContent = cat;
@@ -428,7 +428,7 @@ function startInlineEdit(cell) {
428428
// Category uses dropdown selection
429429
let categories = [];
430430
if (itemType === 'papers') {
431-
categories = ['sft', 'rl', 'data_collection', 'data_analysis', 'data_synthesis', 'evaluation_datasets', 'training_datasets', 'inference_scaling', 'methods_analysis', 'workflow', 'tool', 'memory', 'multi_agent', 'single_agent'];
431+
categories = PAPER_CATEGORIES;
432432
} else if (itemType === 'datasets') {
433433
categories = ['single-pl', 'multi-pl'];
434434
}

0 commit comments

Comments
 (0)