


default search action
BibTeX records: Zhouhao Sun
@article{DBLP:journals/corr/abs-2601-07208,
  author     = {Yang Zhao and
                Hepeng Wang and
                Xiao Ding and
                Yangou Ouyang and
                Bibo Cai and
                Kai Xiong and
                Jinglong Gao and
                Zhouhao Sun and
                Li Du and
                Bing Qin and
                Ting Liu},
  title      = {{MAESTRO:} Meta-learning Adaptive Estimation of Scalarization Trade-offs
                for Reward Optimization},
  journal    = {CoRR},
  volume     = {abs/2601.07208},
  year       = {2026},
  url        = {https://doi.org/10.48550/arXiv.2601.07208},
  doi        = {10.48550/ARXIV.2601.07208},
  eprinttype = {arXiv},
  eprint     = {2601.07208},
  timestamp  = {Wed, 11 Feb 2026 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2601-07208.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2601-07224,
  author     = {Yang Zhao and
                Yangou Ouyang and
                Xiao Ding and
                Hepeng Wang and
                Bibo Cai and
                Kai Xiong and
                Jinglong Gao and
                Zhouhao Sun and
                Li Du and
                Bing Qin and
                Ting Liu},
  title      = {Consolidation or Adaptation? {PRISM:} Disentangling {SFT} and {RL}
                Data via Gradient Concentration},
  journal    = {CoRR},
  volume     = {abs/2601.07224},
  year       = {2026},
  url        = {https://doi.org/10.48550/arXiv.2601.07224},
  doi        = {10.48550/ARXIV.2601.07224},
  eprinttype = {arXiv},
  eprint     = {2601.07224},
  timestamp  = {Tue, 17 Feb 2026 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2601-07224.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ZhaoDDOW0GSXYL025,
  author     = {Yang Zhao and
                Li Du and
                Xiao Ding and
                Yangou Ouyang and
                Hepeng Wang and
                Kai Xiong and
                Jinglong Gao and
                Zhouhao Sun and
                Dongliang Xu and
                Qing Yang and
                Dongchen Li and
                Bing Qin and
                Ting Liu},
  editor     = {Wanxiang Che and
                Joyce Nabende and
                Ekaterina Shutova and
                Mohammad Taher Pilehvar},
  title      = {Beyond Similarity: {A} Gradient-based Graph Method for Instruction
                Tuning Data Selection},
  booktitle  = {Proceedings of the 63rd Annual Meeting of the Association for Computational
                Linguistics (Volume 1: Long Papers), {ACL} 2025, Vienna, Austria,
                July 27 - August 1, 2025},
  pages      = {24391--24404},
  publisher  = {Association for Computational Linguistics},
  year       = {2025},
  url        = {https://aclanthology.org/2025.acl-long.1189/},
  timestamp  = {Sun, 02 Nov 2025 21:27:24 +0100},
  biburl     = {https://dblp.org/rec/conf/acl/ZhaoDDOW0GSXYL025.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2502-11062,
  author     = {Yang Zhao and
                Li Du and
                Xiao Ding and
                Yangou Ouyang and
                Hepeng Wang and
                Kai Xiong and
                Jinglong Gao and
                Zhouhao Sun and
                Dongliang Xu and
                Qing Yang and
                Dongchen Li and
                Bing Qin and
                Ting Liu},
  title      = {Beyond Similarity: {A} Gradient-based Graph Method for Instruction
                Tuning Data Selection},
  journal    = {CoRR},
  volume     = {abs/2502.11062},
  year       = {2025},
  url        = {https://doi.org/10.48550/arXiv.2502.11062},
  doi        = {10.48550/ARXIV.2502.11062},
  eprinttype = {arXiv},
  eprint     = {2502.11062},
  timestamp  = {Tue, 05 Aug 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2502-11062.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2504-12898,
  author     = {Zhouhao Sun and
                Xiao Ding and
                Li Du and
                Yunpeng Xu and
                Yixuan Ma and
                Yang Zhao and
                Bing Qin and
                Ting Liu},
  title      = {Information Gain-Guided Causal Intervention for Autonomous Debiasing
                Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2504.12898},
  year       = {2025},
  url        = {https://doi.org/10.48550/arXiv.2504.12898},
  doi        = {10.48550/ARXIV.2504.12898},
  eprinttype = {arXiv},
  eprint     = {2504.12898},
  timestamp  = {Fri, 04 Jul 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2504-12898.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2505-12457,
  author     = {Yang Zhao and
                Kai Xiong and
                Xiao Ding and
                Li Du and
                Yangou Ouyang and
                Zhouhao Sun and
                Jiannan Guan and
                Wenbin Zhang and
                Bin Liu and
                Dong Hu and
                Bing Qin and
                Ting Liu},
  title      = {{UFO-RL:} Uncertainty-Focused Optimization for Efficient Reinforcement
                Learning Data Selection},
  journal    = {CoRR},
  volume     = {abs/2505.12457},
  year       = {2025},
  url        = {https://doi.org/10.48550/arXiv.2505.12457},
  doi        = {10.48550/ARXIV.2505.12457},
  eprinttype = {arXiv},
  eprint     = {2505.12457},
  timestamp  = {Tue, 05 Aug 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2505-12457.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2505-16522,
  author     = {Zhouhao Sun and
                Zhiyuan Kan and
                Xiao Ding and
                Li Du and
                Yang Zhao and
                Bing Qin and
                Ting Liu},
  title      = {Benchmarking and Pushing the Multi-Bias Elimination Boundary of {LLMs}
                via Causal Effect Estimation-guided Debiasing},
  journal    = {CoRR},
  volume     = {abs/2505.16522},
  year       = {2025},
  url        = {https://doi.org/10.48550/arXiv.2505.16522},
  doi        = {10.48550/ARXIV.2505.16522},
  eprinttype = {arXiv},
  eprint     = {2505.16522},
  timestamp  = {Fri, 04 Jul 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2505-16522.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2505-20664,
  author     = {Yang He and
                Xiao Ding and
                Bibo Cai and
                Yufei Zhang and
                Kai Xiong and
                Zhouhao Sun and
                Bing Qin and
                Ting Liu},
  title      = {Self-Route: Automatic Mode Switching via Capability Estimation for
                Efficient Reasoning},
  journal    = {CoRR},
  volume     = {abs/2505.20664},
  year       = {2025},
  url        = {https://doi.org/10.48550/arXiv.2505.20664},
  doi        = {10.48550/ARXIV.2505.20664},
  eprinttype = {arXiv},
  eprint     = {2505.20664},
  timestamp  = {Tue, 05 Aug 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2505-20664.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ZhaoDD0SJ0024,
  author     = {Yang Zhao and
                Li Du and
                Xiao Ding and
                Kai Xiong and
                Zhouhao Sun and
                Shi Jun and
                Ting Liu and
                Bing Qin},
  editor     = {Lun{-}Wei Ku and
                Andre Martins and
                Vivek Srikumar},
  title      = {Deciphering the Impact of Pretraining Data on Large Language Models
                through Machine Unlearning},
  booktitle  = {Findings of the Association for Computational Linguistics, {ACL} 2024,
                Bangkok, Thailand and virtual meeting, August 11-16, 2024},
  series     = {Findings of {ACL}},
  volume     = {{ACL} 2024},
  pages      = {9386--9406},
  publisher  = {Association for Computational Linguistics},
  year       = {2024},
  url        = {https://doi.org/10.18653/v1/2024.findings-acl.559},
  doi        = {10.18653/V1/2024.FINDINGS-ACL.559},
  timestamp  = {Tue, 27 Jan 2026 20:26:47 +0100},
  biburl     = {https://dblp.org/rec/conf/acl/ZhaoDD0SJ0024.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/SunDDMZQ0024,
  author     = {Zhouhao Sun and
                Li Du and
                Xiao Ding and
                Yixuan Ma and
                Yang Zhao and
                Kaitao Qiu and
                Ting Liu and
                Bing Qin},
  editor     = {Lun{-}Wei Ku and
                Andre Martins and
                Vivek Srikumar},
  title      = {Causal-Guided Active Learning for Debiasing Large Language Models},
  booktitle  = {Proceedings of the 62nd Annual Meeting of the Association for Computational
                Linguistics (Volume 1: Long Papers), {ACL} 2024, Bangkok, Thailand,
                August 11-16, 2024},
  pages      = {14455--14469},
  publisher  = {Association for Computational Linguistics},
  year       = {2024},
  url        = {https://doi.org/10.18653/v1/2024.acl-long.778},
  doi        = {10.18653/V1/2024.ACL-LONG.778},
  timestamp  = {Fri, 04 Jul 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/SunDDMZQ0024.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/coling/SunDDCG0024,
  author     = {Zhouhao Sun and
                Xiao Ding and
                Li Du and
                Bibo Cai and
                Jinglong Gao and
                Ting Liu and
                Bing Qin},
  editor     = {Nicoletta Calzolari and
                Min{-}Yen Kan and
                V{\'{e}}ronique Hoste and
                Alessandro Lenci and
                Sakriani Sakti and
                Nianwen Xue},
  title      = {Towards Generalizable and Faithful Logic Reasoning over Natural Language
                via Resolution Refutation},
  booktitle  = {Proceedings of the 2024 Joint International Conference on Computational
                Linguistics, Language Resources and Evaluation, {LREC/COLING} 2024,
                20-25 May, 2024, Torino, Italy},
  pages      = {16527--16538},
  publisher  = {{ELRA} and {ICCL}},
  year       = {2024},
  url        = {https://aclanthology.org/2024.lrec-main.1436},
  timestamp  = {Thu, 23 May 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/coling/SunDDCG0024.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2402-11537,
  author     = {Yang Zhao and
                Li Du and
                Xiao Ding and
                Kai Xiong and
                Zhouhao Sun and
                Jun Shi and
                Ting Liu and
                Bing Qin},
  title      = {Deciphering the Impact of Pretraining Data on Large Language Models
                through Machine Unlearning},
  journal    = {CoRR},
  volume     = {abs/2402.11537},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.11537},
  doi        = {10.48550/ARXIV.2402.11537},
  eprinttype = {arXiv},
  eprint     = {2402.11537},
  timestamp  = {Tue, 05 Aug 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-11537.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2404-01677,
  author     = {Zhouhao Sun and
                Xiao Ding and
                Li Du and
                Bibo Cai and
                Jinglong Gao and
                Ting Liu and
                Bing Qin},
  title      = {Towards Generalizable and Faithful Logic Reasoning over Natural Language
                via Resolution Refutation},
  journal    = {CoRR},
  volume     = {abs/2404.01677},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2404.01677},
  doi        = {10.48550/ARXIV.2404.01677},
  eprinttype = {arXiv},
  eprint     = {2404.01677},
  timestamp  = {Fri, 10 May 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2404-01677.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2408-12942,
  author     = {Li Du and
                Zhouhao Sun and
                Xiao Ding and
                Yixuan Ma and
                Yang Zhao and
                Kaitao Qiu and
                Ting Liu and
                Bing Qin},
  title      = {Causal-Guided Active Learning for Debiasing Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2408.12942},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2408.12942},
  doi        = {10.48550/ARXIV.2408.12942},
  eprinttype = {arXiv},
  eprint     = {2408.12942},
  timestamp  = {Fri, 04 Jul 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2408-12942.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/CaiDS00WS23,
  author     = {Bibo Cai and
                Xiao Ding and
                Zhouhao Sun and
                Bing Qin and
                Ting Liu and
                Baojun Wang and
                Lifeng Shang},
  editor     = {Brian Williams and
                Yiling Chen and
                Jennifer Neville},
  title      = {Self-Supervised Logic Induction for Explainable Fuzzy Temporal Commonsense
                Reasoning},
  booktitle  = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI}
                2023, Thirty-Fifth Conference on Innovative Applications of Artificial
                Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances
                in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February
                7-14, 2023},
  pages      = {12580--12588},
  publisher  = {{AAAI} Press},
  year       = {2023},
  url        = {https://doi.org/10.1609/aaai.v37i11.26481},
  doi        = {10.1609/AAAI.V37I11.26481},
  timestamp  = {Fri, 04 Jul 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/CaiDS00WS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/DuDS00L23,
  author     = {Li Du and
                Xiao Ding and
                Zhouhao Sun and
                Ting Liu and
                Bing Qin and
                Jingshuo Liu},
  editor     = {Anna Rogers and
                Jordan L. Boyd{-}Graber and
                Naoaki Okazaki},
  title      = {Towards Stable Natural Language Understanding via Information Entropy
                Guided Debiasing},
  booktitle  = {Proceedings of the 61st Annual Meeting of the Association for Computational
                Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                July 9-14, 2023},
  pages      = {2868--2882},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.acl-long.161},
  doi        = {10.18653/V1/2023.ACL-LONG.161},
  timestamp  = {Fri, 04 Jul 2025 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/DuDS00L23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}

manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt-in for them to become active. All settings here will be stored as cookies with your web browser. For more information see our F.A.Q.


Google
Google Scholar
Semantic Scholar
Internet Archive Scholar
CiteSeerX
ORCID













