Add new papers

Zhaoyang-Chu · Zhaoyang-Chu · commit cd84ba00932b · 2025-12-21T13:44:12.000Z
diff --git a/README.md b/README.md
diff --git a/data/ack_repos.yaml b/data/ack_repos.yaml
@@ -10,6 +10,7 @@
 - https://github.com/eltociear/awesome-AI-driven-development
 - https://github.com/YuyaoGe/Awesome-Vibe-Coding
 - https://github.com/codefuse-ai/Awesome-Code-LLM
+- https://github.com/juyongjiang/CodeLLMSurvey
 - https://github.com/xjywhu/Awesome-Multimodal-LLM-for-Code
 - https://github.com/github/awesome-copilot
 - https://github.com/steel-dev/awesome-web-agents
diff --git a/data/papers_3d_object_design.yaml b/data/papers_3d_object_design.yaml
@@ -158,6 +158,14 @@
     github: "https://github.com/LiuHengyu321/IR3D-Bench"
     website: "https://ir3d-bench.github.io/"
 
+- title: "SceneGenAgent: Precise Industrial Scene Generation with Coding Agent"
+  authors: "Xiao Xia, Dan Zhang, Zibo Liao, Zhenyu Hou, Tianrui Sun, Jing Li, Ling Fu, Yuxiao Dong"
+  venue: "ACL 2025"
+  links:
+    paper: "https://aclanthology.org/2025.acl-long.873/"
+    github: ""
+    website: ""
+
 - title: "SceneMotifCoder: Example-driven Visual Program Learning for Generating 3D Object Arrangements"
   authors: "Hou In Ivan Tam, Hou In Derek Pun, Austin T. Wang, Angel X. Chang, Manolis Savva"
   venue: "3DV 2025"
diff --git a/data/papers_code_generation.yaml b/data/papers_code_generation.yaml
@@ -1,3 +1,12 @@
+- title: "Does AI-Assisted Coding Deliver? A Difference-in-Differences Study of Cursor's Impact on Software Projects"
+  authors: "Hao He, Courtney Miller, Shyam Agarwal, Christian Kästner, Bogdan Vasilescu"
+  venue: "arXiv 2025/11"
+  links:
+    paper: "https://arxiv.org/abs/2511.04427"
+    github: ""
+    website: ""
+  tags: "Empirical Study"
+
 - title: "Lost in Code Generation: Reimagining the Role of Software Models in AI-driven Software Engineering"
   authors: "Jürgen Cito, Dominik Bork"
   venue: "arXiv 2025/11"
@@ -138,13 +147,13 @@
     github: "https://github.com/FSoft-AI4Code/HyperAgent"
     website: ""
 
-- title: "Verbal Process Supervision Elicits Better Coding Agents"
-  authors: "Hao-Yuan Chen, Cheng-Pong Huang, Jui-Ming Yao"
-  venue: "arXiv 2025"
-  links:
-    paper: "https://arxiv.org/abs/2503.18494"
-    github: ""
-    website: ""
+# - title: "Verbal Process Supervision Elicits Better Coding Agents"
+#   authors: "Hao-Yuan Chen, Cheng-Pong Huang, Jui-Ming Yao"
+#   venue: "arXiv 2025"
+#   links:
+#     paper: "https://arxiv.org/abs/2503.18494"
+#     github: ""
+#     website: ""
 
 - title: "KernelBench: Can LLMs Write Efficient GPU Kernels?"
   authors: "Anne Ouyang, Simon Guo, Simran Arora, Alex L. Zhang, William Hu, Christopher Ré, Azalia Mirhoseini"
@@ -154,6 +163,14 @@
     github: "https://github.com/ScalingIntelligence/KernelBench"
     website: "https://scalingintelligence.stanford.edu/blogs/kernelbench/"
 
+- title: "EpiCoder: Encompassing Diversity and Complexity in Code Generation"
+  authors: "Yaoxiang Wang, Haoling Li, Xin Zhang, Jie Wu, Xiao Liu, Wenxiang Hu, Zhongxin Guo, Yangyu Huang, Ying Xin, Yujiu Yang, Jinsong Su, Qi Chen, Scarlett Li"
+  venue: "ICML 2025"
+  links:
+    paper: "https://arxiv.org/abs/2501.04694"
+    github: ""
+    website: ""
+
 - title: "On the Impacts of Contexts on Repository-Level Code Generation"
   authors: "Nam Le Hai, Dung Manh Nguyen, Nghi D. Q. Bui"
   venue: "NAACL 2025 Findings"
@@ -258,7 +275,7 @@
     github: ""
     website: ""
 
-- title: "CodeTree: Agent‐guided Tree Search for Code Generation with Large Language Models"
+- title: "CodeTree: Agent-guided Tree Search for Code Generation with Large Language Models"
   authors: "Jierui Li, Hung Le, Yingbo Zhou, Caiming Xiong, Silvio Savarese, Doyen Sahoo"
   venue: "arXiv 2024"
   links:
diff --git a/data/papers_issue_localization.yaml b/data/papers_issue_localization.yaml
@@ -47,6 +47,14 @@
     github: "https://github.com/SalesforceAIResearch/SweRank"
     website: ""
 
+- title: "RANGER: Repository-Level Agent for Graph-Enhanced Retrieval"
+  authors: "Pratik Shah, Rajat Ghosh, Aryan Singhal, Debojyoti Dutta"
+  venue: "arXiv 2025/09"
+  links:
+    paper: "https://arxiv.org/abs/2509.25257"
+    github: ""
+    website: ""
+
 - title: "Benchmarking and Enhancing LLM Agents in Localizing Linux Kernel Bugs"
   authors: "Zhenhao Zhou, Zhuochen Huang, Yike He, Chong Wang, Jiajun Wang, Yijian Wu, Xin Peng, Yiling Lou"
   venue: "arXiv 2025/05"
diff --git a/data/papers_issue_resolution.yaml b/data/papers_issue_resolution.yaml
@@ -6,6 +6,14 @@
     github: "https://github.com/EuniAI/Prometheus"
     website: "https://euni.ai/"
 
+- title: "Unified Software Engineering Agent as AI Software Engineer"
+  authors: "Leonhard Applis, Yuntong Zhang, Shanchao Liang, Nan Jiang, Lin Tan, Abhik Roychoudhury"
+  venue: "ICSE 2026"
+  links:
+    paper: "https://arxiv.org/abs/2506.14683"
+    github: ""
+    website: ""
+
 - title: "Beyond Final Code: A Process-Oriented Error Analysis of Software Development Agents in Real-World GitHub Scenarios"
   authors: "Zhi Chen, Wei Ma, Lingxiao Jiang"
   venue: "ICSE 2026"
@@ -24,6 +32,14 @@
     website: ""
   tags: "Empirical Study"
 
+- title: "Confucius Code Agent: Scalable Agent Scaffolding for Real-World Codebases"
+  authors: "Zhaodong Wang, Zhenting Qi, Sherman Wong, Nathan Hu, Samuel Lin, Jun Ge, Erwin Gao, Wenlin Chen, Yilun Du, Minlan Yu, Ying Zhang"
+  venue: "arXiv 2025/12"
+  links:
+    paper: "https://arxiv.org/abs/2512.10398"
+    github: ""
+    website: ""
+
 - title: "Is Vibe Coding Safe? Benchmarking Vulnerability of Agent-Generated Code in Real-World Tasks"
   authors: "Songwen Zhao, Danqing Wang, Kexun Zhang, Jiaxuan Luo, Zhuo Li, Lei Li"
   venue: "arXiv 2025/12"
@@ -48,6 +64,30 @@
     github: "https://github.com/OpenHands/software-agent-sdk"
     website: ""
 
+- title: "CodeClash: Benchmarking Goal-Oriented Software Engineering"
+  authors: "John Yang, Kilian Lieret, Joyce Yang, Carlos E. Jimenez, Ofir Press, Ludwig Schmidt, Diyi Yang"
+  venue: "arXiv 2025/11"
+  links:
+    paper: "https://arxiv.org/abs/2511.00839"
+    github: ""
+    website: "https://codeclash.ai/"
+
+- title: "InfCode: Adversarial Iterative Refinement of Tests and Patches for Reliable Software Issue Resolution"
+  authors: "KeFan Li, Mengfei Wang, Hengzhi Zhang, Zhichao Li, Yuan Yuan, Mu Li, Xiang Gao, Hailong Sun, Chunming Hu, Weifeng Lv"
+  venue: "arXiv 2025/11"
+  links:
+    paper: "https://arxiv.org/abs/2511.16004"
+    github: ""
+    website: ""
+
+- title: "Agent READMEs: An Empirical Study of Context Files for Agentic Coding"
+  authors: "Worawalan Chatlatanagulchai, Hao Li, Yutaro Kashiwa, Brittany Reid, Kundjanasith Thonglek, Pattara Leelaprute, Arnon Rungsawang, Bundit Manaskasemsak, Bram Adams, Ahmed E. Hassan, Hajimu Iida"
+  venue: "arXiv 2025/11"
+  links:
+    paper: "https://arxiv.org/abs/2511.12884"
+    github: ""
+    website: ""
+
 - title: "Understanding Code Agent Behaviour: An Empirical Study of Success and Failure Trajectories"
   authors: "Oorja Majgaonkar, Zhiwei Fei, Xiang Li, Federica Sarro, He Ye"
   venue: "arXiv 2025/11"
@@ -114,6 +154,14 @@
     github: ""
     website: ""
 
+- title: "Process-Level Trajectory Evaluation for Environment Configuration in Software Engineering Agents"
+  authors: "Jiayi Kuang, Yinghui Li, Xin Zhang, Yangning Li, Di Yin, Xing Sun, Ying Shen, Philip S. Yu"
+  venue: "arXiv 2025/10"
+  links:
+    paper: "https://arxiv.org/abs/2510.25694"
+    github: ""
+    website: ""
+
 - title: "BugPilot: Complex Bug Generation for Efficient Learning of SWE Skills"
   authors: "Atharv Sonwane, Isadora White, Hyunji Lee, Matheus Pereira, Lucas Caccia, Minseon Kim, Zhengyan Shi, Chinmay Singh, Alessandro Sordoni, Marc-Alexandre Côté, Xingdi Yuan"
   venue: "arXiv 2025/10"
@@ -188,6 +236,22 @@
     github: "https://github.com/QuantaAlpha/GitTaskBench"
     website: "https://gittaskbench.github.io/"
 
+- title: "RepoForge: Training a SOTA Fast-thinking SWE Agent with an End-to-End Data Curation Pipeline Synergizing SFT and RL at Scale"
+  authors: "Zhilong Chen, Chengzong Zhao, Boyuan Chen, Dayi Lin, Yihao Chen, Arthur Leung, Gopi Krishnan Rajbahadur, Gustavo A. Oliva, Haoxiang Zhang, Aaditya Bhatia, Chong Chun Yong, Ahmed E. Hassan"
+  venue: "arXiv 2025/08"
+  links:
+    paper: "https://arxiv.org/abs/2508.01550"
+    github: ""
+    website: ""
+
+- title: "Understanding Software Engineering Agents Through the Lens of Traceability: An Empirical Study"
+  authors: "Ira Ceka, Saurabh Pujar, Shyam Ramji, Luca Buratti, Gail Kaiser, Baishakhi Ray"
+  venue: "arXiv 2025/06"
+  links:
+    paper: "https://arxiv.org/abs/2506.08311"
+    github: ""
+    website: ""
+
 - title: "SWE-Bench Pro: Can AI Agents Solve Long-Horizon Software Engineering Tasks?"
   authors: "Xiang Deng, Jeff Da, Edwin Pan, Yannis Yiming He, Charles Ide, Kanak Garg, Niklas Lauffer, Andrew Park, Nitin Pasari, Chetan Rane, Karmini Sampath, Maya Krishnan, Srivatsa Kundurthy, Sean Hendryx, Zifan Wang, Chen Bo Calvin Zhang, Noah Jacobson, Bing Liu, Brad Kenstler"
   venue: "arXiv 2025"
@@ -268,6 +332,14 @@
     github: "https://github.com/yingweima2022/SWE-Reasoner"
     website: ""
 
+- title: "AutoCodeSherpa: Symbolic Explanations in AI Coding Agents"
+  authors: "Sungmin Kang, Haifeng Ruan, Abhik Roychoudhury"
+  venue: "arXiv 2025/07"
+  links:
+    paper: "https://arxiv.org/abs/2507.22414"
+    github: ""
+    website: ""
+
 - title: "Satori-SWE: Evolutionary Test-Time Scaling for Sample-Efficient Software Engineering"
   authors: "Guangtao Zeng, Maohao Shen, Delin Chen, Zhenting Qi, Subhro Das, Dan Gutfreund, David Cox, Gregory Wornell, Wei Lu, Zhang-Wei Hong, Chuang Gan"
   venue: "arXiv 2025/05"
@@ -276,6 +348,14 @@
     github: "https://github.com/satori-reasoning/Satori-SWE"
     website: "https://satori-reasoning.github.io/"
 
+- title: "CrashFixer: A crash resolution agent for the Linux kernel"
+  authors: "Alex Mathai, Chenxi Huang, Suwei Ma, Jihwan Kim, Hailie Mitchell, Aleksandr Nogikh, Petros Maniatis, Franjo Ivančić, Junfeng Yang, Baishakhi Ray"
+  venue: "arXiv 2025/04"
+  links:
+    paper: "https://arxiv.org/abs/2504.20412"
+    github: ""
+    website: ""
+
 - title: "DARS: Dynamic Action Re-Sampling to Enhance Coding Agent Performance by Adaptive Tree Traversal"
   authors: "Vaibhav Aggarwal, Ojasv Kamal, Abhinav Japesh, Zhijing Jin, Bernhard Schölkopf"
   venue: "arXiv 2025/03"
@@ -500,6 +580,14 @@
     github: ""
     website: ""
 
+# - title: "Large Language Model Critics for Execution-Free Evaluation of Code Changes"
+#   authors: "Aashish Yadavally, Hoan Nguyen, Laurent Callot, Gauthier Guinet"
+#   venue: "arXiv 2025/01"
+#   links:
+#     paper: "https://arxiv.org/abs/2501.16655"
+#     github: ""
+#     website: ""
+
 - title: "Can Agents Fix Agent Issues?"
   authors: "Alfin Wijaya Rahardja, Junwei Liu, Weitong Chen, Zhenpeng Chen, Yiling Lou"
   venue: "NeurIPS 2025"
@@ -580,6 +668,14 @@
     github: "https://github.com/Hambaobao/SWE-Flow"
     website: ""
 
+- title: "Nemotron-CORTEXA: Enhancing LLM Agents for Software Engineering Tasks via Improved Localization and Solution Diversity"
+  authors: "Atefeh Sohrabizadeh, Jialin Song, Mingjie Liu, Rajarshi Roy, Chankyu Lee, Jonathan Raiman, Bryan Catanzaro"
+  venue: "ICML 2025"
+  links:
+    paper: "https://openreview.net/forum?id=k6p8UKRdH7"
+    github: ""
+    website: ""
+
 - title: "Guided Search Strategies in Non-Serializable Environments with Applications to Software Engineering Agents"
   authors: "Karina Zainullina, Alexander Golubev, Maria Trofimova, Sergei Polezhaev, Ibragim Badertdinov, Daria Litvintseva, Simon Karasik, Filipp Fisin, Sergei Skvortsov, Maksim Nekrashevich, Anton Shevtsov, Boris Yangel"
   venue: "ICML 2025"
@@ -652,6 +748,14 @@
     github: ""
     website: ""
 
+- title: "Understanding Software Engineering Agents: A Study of Thought-Action-Result Trajectories"
+  authors: "Islem Bouzenia, Michael Pradel"
+  venue: "ASE 2025"
+  links:
+    paper: "https://arxiv.org/abs/2506.18824"
+    github: ""
+    website: ""
+
 - title: "SPICE: An Automated SWE-Bench Labeling Pipeline for Issue Clarity, Test Coverage, and Effort Estimation"
   authors: "Gustavo A. Oliva, Gopi Krishnan Rajbahadur, Aaditya Bhatia, Haoxiang Zhang, Yihao Chen, Zhilong Chen, Arthur Leung, Dayi Lin, Boyuan Chen, Ahmed E. Hassan"
   venue: "ASE 2025"
@@ -692,6 +796,14 @@
     github: "https://github.com/InternLM/SWE-Fixer"
     website: ""
 
+- title: "SynFix: Dependency-Aware Program Repair via RelationGraph Analysis"
+  authors: "Xunzhu Tang, Jiechao Gao, Jin Xu, Tiezhu Sun, Yewei Song, Saad Ezzini, Wendkûuni C. Ouédraogo, Jacques Klein, Tegawendé F. Bissyandé"
+  venue: "ACL 2025 Findings"
+  links:
+    paper: "https://aclanthology.org/2025.findings-acl.252/"
+    github: ""
+    website: ""
+
 - title: "UniDebugger: Hierarchical Multi-Agent Framework for Unified Software Debugging"
   authors: "Cheryl Lee, Chunqiu Steven Xia, Longji Yang, Jen-tse Huang, Zhouruixing Zhu, Lingming Zhang, Michael R. Lyu"
   venue: "EMNLP 2025"
@@ -732,6 +844,14 @@
     github: ""
     website: ""
 
+- title: "Agentic Program Repair from Test Failures at Scale: A Neuro-symbolic approach with static analysis and test execution feedback"
+  authors: "Chandra Maddila, Adam Tait, Claire Chang, Daniel Cheng, Nauman Ahmad, Vijayaraghavan Murali, Marshall Roch, Arnaud Avondet, Aaron Meltzer, Victor Montalvao, Michael Hopko, Chris Waterson, Parth Thakkar, Renuka Fernandez, Kristian Kristensen, Sivan Barzily, Sherry Chen, Rui Abreu, Nachiappan Nagappan, Payam Shodjai, Killian Murphy, James Everingham, Aparna Ramani, Peter C. Rigby"
+  venue: "TSE 2025"
+  links:
+    paper: "https://arxiv.org/abs/2507.18755"
+    github: ""
+    website: ""
+
 - title: "AutoCodeRover: Autonomous Program Improvement"
   authors: "Yuntong Zhang, Haifeng Ruan, Zhiyu Fan, Abhik Roychoudhury"
   venue: "ISSTA 2024"
@@ -772,18 +892,18 @@
     github: "https://github.com/SWE-bench/SWE-bench"
     website: "https://www.swebench.com/"
 
-- title: "CodeR: Issue Resolving with Multi-Agent and Task Graphs"
-  authors: "Dong Chen, Shaoxin Lin, Muhan Zeng, Daoguang Zan, Jian-Gang Wang, Anton Cheshkov, Jun Sun, Hao Yu, Guoliang Dong, Artem Aliev, Jie Wang, Xiao Cheng, Guangtai Liang, Yuchi Ma, Pan Bian, Tao Xie, Qianxiang Wang"
-  venue: "arXiv 2024"
-  links:
-    paper: "https://arxiv.org/abs/2406.01304"
-    github: "https://github.com/NL2Code/CodeR"
-    website: ""
-
-- title: "MarsCode Agent: AI-native Automated Bug Fixing"
-  authors: "Yizhou Liu, Pengfei Gao, Xinchen Wang, Jie Liu, Yexuan Shi, Zhao Zhang, Chao Peng"
-  venue: "arXiv 2025"
-  links:
-    paper: "https://arxiv.org/abs/2409.00899"
-    github: ""
-    website: "https://se-research.bytedance.com/"
+# - title: "CodeR: Issue Resolving with Multi-Agent and Task Graphs"
+#   authors: "Dong Chen, Shaoxin Lin, Muhan Zeng, Daoguang Zan, Jian-Gang Wang, Anton Cheshkov, Jun Sun, Hao Yu, Guoliang Dong, Artem Aliev, Jie Wang, Xiao Cheng, Guangtai Liang, Yuchi Ma, Pan Bian, Tao Xie, Qianxiang Wang"
+#   venue: "arXiv 2024"
+#   links:
+#     paper: "https://arxiv.org/abs/2406.01304"
+#     github: "https://github.com/NL2Code/CodeR"
+#     website: ""
+
+# - title: "MarsCode Agent: AI-native Automated Bug Fixing"
+#   authors: "Yizhou Liu, Pengfei Gao, Xinchen Wang, Jie Liu, Yexuan Shi, Zhao Zhang, Chao Peng"
+#   venue: "arXiv 2025"
+#   links:
+#     paper: "https://arxiv.org/abs/2409.00899"
+#     github: ""
+#     website: "https://se-research.bytedance.com/"
diff --git a/data/papers_machine_learning_engineering.yaml b/data/papers_machine_learning_engineering.yaml
@@ -6,6 +6,14 @@
     github: ""
     website: ""
 
+- title: "ArchPilot: A Proxy-Guided Multi-Agent Approach for Machine Learning Engineering"
+  authors: "Zhuowen Yuan, Tao Liu, Yang Yang, Yang Wang, Feng Qi, Kaushik Rangadurai, Bo Li, Shuang Yang"
+  venue: "arXiv 2025/11"
+  links:
+    paper: "https://arxiv.org/abs/2511.03985"
+    github: ""
+    website: ""
+
 - title: "DeepCode: Open Agentic Coding"
   authors: "Data Intelligence Lab@HKU"
   venue: "2025"
diff --git a/data/papers_sql_engineering.yaml b/data/papers_sql_engineering.yaml
@@ -1,3 +1,11 @@
+# - title: "BAPPA: Benchmarking Agents, Plans, and Pipelines for Automated Text-to-SQL Generation"
+#   authors: "Fahim Ahmed, Md Mubtasim Ahasan, Jahir Sadik Monon, Muntasir Wahed, M Ashraful Amin, A K M Mahbubur Rahman, Amin Ahsan Ali"
+#   venue: "arXiv 2025/11"
+#   links:
+#     paper: "https://arxiv.org/abs/2511.04153"
+#     github: ""
+#     website: ""
+
 - title: "SWE-SQL: Illuminating LLM Pathways to Solve User SQL Issues in Real-World Applications"
   authors: "Jinyang Li, Xiaolong Li, Ge Qu, Per Jacobsson, Bowen Qin, Binyuan Hui, Shuzheng Si, Nan Huo, Xiaohan Xu, Yue Zhang, Ziwei Tang, Yuanshuai Li, Florensia Widjaja, Xintong Zhu, Feige Zhou, Yongfeng Huang, Yannis Papakonstantinou, Fatma Ozcan, Chenhao Ma, Reynold Cheng"
   venue: "arXiv 2025"
diff --git a/docs/static/badges/papers.json b/docs/static/badges/papers.json
@@ -1 +1 @@
-{"schemaVersion": 1, "label": "Papers", "message": "481", "color": "brightgreen"}
+{"schemaVersion": 1, "label": "Papers", "message": "497", "color": "brightgreen"}
diff --git a/docs/static/badges/papers.svg b/docs/static/badges/papers.svg
@@ -1,5 +1,5 @@
-<svg xmlns="http://www.w3.org/2000/svg" width="77" height="20" role="img" aria-label="papers: 481">
-  <title>papers: 481</title>
+<svg xmlns="http://www.w3.org/2000/svg" width="77" height="20" role="img" aria-label="papers: 497">
+  <title>papers: 497</title>
   <linearGradient id="s" x2="0" y2="100%">
     <stop offset="0" stop-color="#bbb" stop-opacity=".1"/>
     <stop offset="1" stop-opacity=".1"/>
@@ -12,6 +12,6 @@
   </g>
   <g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,Arial,sans-serif" font-size="11">
     <text x="23.0" y="14">papers</text>
-    <text x="61.5" y="14">481</text>
+    <text x="61.5" y="14">497</text>
   </g>
 </svg>
diff --git a/scripts/update_papers_badge.py b/scripts/update_papers_badge.py
@@ -118,7 +118,7 @@ def update_readme_summary(total_papers: int) -> None:
     summary = (
         f"🔥 **We are actively tracking the frontier research of code agents.**<br>\n"
         f"🧹 *We periodically curate our collection, retaining only published papers and interesting arXiv preprints from the last six months.*<br>\n"
-        f"📚 *Currently collected:* **`{total_papers}` papers and products** — *(Last update: {today})*"
+        f"📚 *Currently collected:* **`{total_papers}` papers** — *(Last update: {today})*"
     )
 
     pattern = re.compile(

Original file line number	Diff line number	Diff line change
`@@ -1 +1 @@`
`1`		`-{"schemaVersion": 1, "label": "Papers", "message": "481", "color": "brightgreen"}`
	`1`	`+{"schemaVersion": 1, "label": "Papers", "message": "497", "color": "brightgreen"}`