% BibTeX records: Zhouhao Sun

% Downloaded as a .bib file from the dblp computer science bibliography.

% arXiv preprint 2601.07208 (CoRR, 2026).
% The colon after the acronym sits outside the protective braces so that
% sentence-casing styles still see it and keep "Meta-learning" capitalised.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@article{DBLP:journals/corr/abs-2601-07208,
  author       = {Yang Zhao and
                  Hepeng Wang and
                  Xiao Ding and
                  Yangou Ouyang and
                  Bibo Cai and
                  Kai Xiong and
                  Jinglong Gao and
                  Zhouhao Sun and
                  Li Du and
                  Bing Qin and
                  Ting Liu},
  title        = {{MAESTRO}: Meta-learning Adaptive Estimation of Scalarization Trade-offs
                  for Reward Optimization},
  journal      = {CoRR},
  volume       = {abs/2601.07208},
  year         = {2026},
  url          = {https://doi.org/10.48550/arXiv.2601.07208},
  doi          = {10.48550/ARXIV.2601.07208},
  eprinttype   = {arXiv},
  eprint       = {2601.07208},
  timestamp    = {Wed, 11 Feb 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2601-07208.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2601.07224 (CoRR, 2026).
% The colon after the acronym sits outside the protective braces so that
% sentence-casing styles still see it and keep "Disentangling" capitalised.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@article{DBLP:journals/corr/abs-2601-07224,
  author       = {Yang Zhao and
                  Yangou Ouyang and
                  Xiao Ding and
                  Hepeng Wang and
                  Bibo Cai and
                  Kai Xiong and
                  Jinglong Gao and
                  Zhouhao Sun and
                  Li Du and
                  Bing Qin and
                  Ting Liu},
  title        = {Consolidation or Adaptation? {PRISM}: Disentangling {SFT} and {RL}
                  Data via Gradient Concentration},
  journal      = {CoRR},
  volume       = {abs/2601.07224},
  year         = {2026},
  url          = {https://doi.org/10.48550/arXiv.2601.07224},
  doi          = {10.48550/ARXIV.2601.07224},
  eprinttype   = {arXiv},
  eprint       = {2601.07224},
  timestamp    = {Tue, 17 Feb 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2601-07224.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2025 (Volume 1: Long Papers) conference paper.
% An arXiv record with the same title and author list is stored under the key
% DBLP:journals/corr/abs-2502-11062; cite only one of the two.
% URLs point directly at aclanthology.org / dblp.org rather than through a proxy host.
@inproceedings{DBLP:conf/acl/ZhaoDDOW0GSXYL025,
  author       = {Yang Zhao and
                  Li Du and
                  Xiao Ding and
                  Yangou Ouyang and
                  Hepeng Wang and
                  Kai Xiong and
                  Jinglong Gao and
                  Zhouhao Sun and
                  Dongliang Xu and
                  Qing Yang and
                  Dongchen Li and
                  Bing Qin and
                  Ting Liu},
  editor       = {Wanxiang Che and
                  Joyce Nabende and
                  Ekaterina Shutova and
                  Mohammad Taher Pilehvar},
  title        = {Beyond Similarity: {A} Gradient-based Graph Method for Instruction
                  Tuning Data Selection},
  booktitle    = {Proceedings of the 63rd Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2025, Vienna, Austria,
                  July 27 - August 1, 2025},
  pages        = {24391--24404},
  publisher    = {Association for Computational Linguistics},
  year         = {2025},
  url          = {https://aclanthology.org/2025.acl-long.1189/},
  timestamp    = {Sun, 02 Nov 2025 21:27:24 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/ZhaoDDOW0GSXYL025.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2502.11062 (CoRR, 2025).
% Shares its title and author list with the ACL 2025 record stored under the key
% DBLP:conf/acl/ZhaoDDOW0GSXYL025; cite only one of the two.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@article{DBLP:journals/corr/abs-2502-11062,
  author       = {Yang Zhao and
                  Li Du and
                  Xiao Ding and
                  Yangou Ouyang and
                  Hepeng Wang and
                  Kai Xiong and
                  Jinglong Gao and
                  Zhouhao Sun and
                  Dongliang Xu and
                  Qing Yang and
                  Dongchen Li and
                  Bing Qin and
                  Ting Liu},
  title        = {Beyond Similarity: {A} Gradient-based Graph Method for Instruction
                  Tuning Data Selection},
  journal      = {CoRR},
  volume       = {abs/2502.11062},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2502.11062},
  doi          = {10.48550/ARXIV.2502.11062},
  eprinttype   = {arXiv},
  eprint       = {2502.11062},
  timestamp    = {Tue, 05 Aug 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2502-11062.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2504.12898 (CoRR, 2025).
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@article{DBLP:journals/corr/abs-2504-12898,
  author       = {Zhouhao Sun and
                  Xiao Ding and
                  Li Du and
                  Yunpeng Xu and
                  Yixuan Ma and
                  Yang Zhao and
                  Bing Qin and
                  Ting Liu},
  title        = {Information Gain-Guided Causal Intervention for Autonomous Debiasing
                  Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2504.12898},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2504.12898},
  doi          = {10.48550/ARXIV.2504.12898},
  eprinttype   = {arXiv},
  eprint       = {2504.12898},
  timestamp    = {Fri, 04 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2504-12898.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2505.12457 (CoRR, 2025).
% "Yangou Ouyang" is written as two words, as in the other records of this file;
% run together it would be parsed as a single surname with no given name.
% The colon after the acronym sits outside the protective braces so that
% sentence-casing styles still see it and keep "Uncertainty-Focused" capitalised.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@article{DBLP:journals/corr/abs-2505-12457,
  author       = {Yang Zhao and
                  Kai Xiong and
                  Xiao Ding and
                  Li Du and
                  Yangou Ouyang and
                  Zhouhao Sun and
                  Jiannan Guan and
                  Wenbin Zhang and
                  Bin Liu and
                  Dong Hu and
                  Bing Qin and
                  Ting Liu},
  title        = {{UFO-RL}: Uncertainty-Focused Optimization for Efficient Reinforcement
                  Learning Data Selection},
  journal      = {CoRR},
  volume       = {abs/2505.12457},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2505.12457},
  doi          = {10.48550/ARXIV.2505.12457},
  eprinttype   = {arXiv},
  eprint       = {2505.12457},
  timestamp    = {Tue, 05 Aug 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2505-12457.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2505.16522 (CoRR, 2025).
% The acronym "LLMs" is brace-protected so sentence-casing styles do not
% lowercase it.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@article{DBLP:journals/corr/abs-2505-16522,
  author       = {Zhouhao Sun and
                  Zhiyuan Kan and
                  Xiao Ding and
                  Li Du and
                  Yang Zhao and
                  Bing Qin and
                  Ting Liu},
  title        = {Benchmarking and Pushing the Multi-Bias Elimination Boundary of {LLMs}
                  via Causal Effect Estimation-guided Debiasing},
  journal      = {CoRR},
  volume       = {abs/2505.16522},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2505.16522},
  doi          = {10.48550/ARXIV.2505.16522},
  eprinttype   = {arXiv},
  eprint       = {2505.16522},
  timestamp    = {Fri, 04 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2505-16522.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2505.20664 (CoRR, 2025).
% "Self-Route" is brace-protected as a whole word so sentence-casing styles do
% not turn it into "Self-route"; the colon stays outside the braces so the
% first word of the subtitle keeps its capital.
% NOTE(review): assumes "Self-Route" is the method's proper name - confirm.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@article{DBLP:journals/corr/abs-2505-20664,
  author       = {Yang He and
                  Xiao Ding and
                  Bibo Cai and
                  Yufei Zhang and
                  Kai Xiong and
                  Zhouhao Sun and
                  Bing Qin and
                  Ting Liu},
  title        = {{Self-Route}: Automatic Mode Switching via Capability Estimation for
                  Efficient Reasoning},
  journal      = {CoRR},
  volume       = {abs/2505.20664},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2505.20664},
  doi          = {10.48550/ARXIV.2505.20664},
  eprinttype   = {arXiv},
  eprint       = {2505.20664},
  timestamp    = {Tue, 05 Aug 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2505-20664.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL 2024 paper.
% An arXiv record of the same paper is stored under the key
% DBLP:journals/corr/abs-2402-11537; cite only one of the two.
% NOTE(review): the exported record listed the sixth author as "Shi Jun", while
% the arXiv record of the same paper lists "Jun Shi". Normalised here to
% "Jun Shi" so both records name the same person - confirm against the
% published PDF. The citation key is left unchanged.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@inproceedings{DBLP:conf/acl/ZhaoDD0SJ0024,
  author       = {Yang Zhao and
                  Li Du and
                  Xiao Ding and
                  Kai Xiong and
                  Zhouhao Sun and
                  Jun Shi and
                  Ting Liu and
                  Bing Qin},
  editor       = {Lun{-}Wei Ku and
                  Andre Martins and
                  Vivek Srikumar},
  title        = {Deciphering the Impact of Pretraining Data on Large Language Models
                  through Machine Unlearning},
  booktitle    = {Findings of the Association for Computational Linguistics, {ACL} 2024,
                  Bangkok, Thailand and virtual meeting, August 11-16, 2024},
  series       = {Findings of {ACL}},
  volume       = {{ACL} 2024},
  pages        = {9386--9406},
  publisher    = {Association for Computational Linguistics},
  year         = {2024},
  url          = {https://doi.org/10.18653/v1/2024.findings-acl.559},
  doi          = {10.18653/V1/2024.FINDINGS-ACL.559},
  timestamp    = {Tue, 27 Jan 2026 20:26:47 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/ZhaoDD0SJ0024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2024 (Volume 1: Long Papers) conference paper.
% An arXiv record with the same title is stored under the key
% DBLP:journals/corr/abs-2408-12942; that record lists the first two authors
% in the opposite order. Cite only one of the two.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@inproceedings{DBLP:conf/acl/SunDDMZQ0024,
  author       = {Zhouhao Sun and
                  Li Du and
                  Xiao Ding and
                  Yixuan Ma and
                  Yang Zhao and
                  Kaitao Qiu and
                  Ting Liu and
                  Bing Qin},
  editor       = {Lun{-}Wei Ku and
                  Andre Martins and
                  Vivek Srikumar},
  title        = {Causal-Guided Active Learning for Debiasing Large Language Models},
  booktitle    = {Proceedings of the 62nd Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2024, Bangkok, Thailand,
                  August 11-16, 2024},
  pages        = {14455--14469},
  publisher    = {Association for Computational Linguistics},
  year         = {2024},
  url          = {https://doi.org/10.18653/v1/2024.acl-long.778},
  doi          = {10.18653/V1/2024.ACL-LONG.778},
  timestamp    = {Fri, 04 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SunDDMZQ0024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% LREC/COLING 2024 conference paper.
% An arXiv record with the same title and author list is stored under the key
% DBLP:journals/corr/abs-2404-01677; cite only one of the two.
% URLs point directly at aclanthology.org / dblp.org rather than through a proxy host.
@inproceedings{DBLP:conf/coling/SunDDCG0024,
  author       = {Zhouhao Sun and
                  Xiao Ding and
                  Li Du and
                  Bibo Cai and
                  Jinglong Gao and
                  Ting Liu and
                  Bing Qin},
  editor       = {Nicoletta Calzolari and
                  Min{-}Yen Kan and
                  V{\'{e}}ronique Hoste and
                  Alessandro Lenci and
                  Sakriani Sakti and
                  Nianwen Xue},
  title        = {Towards Generalizable and Faithful Logic Reasoning over Natural Language
                  via Resolution Refutation},
  booktitle    = {Proceedings of the 2024 Joint International Conference on Computational
                  Linguistics, Language Resources and Evaluation, {LREC/COLING} 2024,
                  20-25 May, 2024, Torino, Italy},
  pages        = {16527--16538},
  publisher    = {{ELRA} and {ICCL}},
  year         = {2024},
  url          = {https://aclanthology.org/2024.lrec-main.1436},
  timestamp    = {Thu, 23 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/coling/SunDDCG0024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.11537 (CoRR, 2024).
% A Findings of ACL 2024 record of the same paper is stored under the key
% DBLP:conf/acl/ZhaoDD0SJ0024; cite only one of the two.
% The title word "Impact" is spelled with a capital I; the exported record
% carried a lowercase L in its place.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@article{DBLP:journals/corr/abs-2402-11537,
  author       = {Yang Zhao and
                  Li Du and
                  Xiao Ding and
                  Kai Xiong and
                  Zhouhao Sun and
                  Jun Shi and
                  Ting Liu and
                  Bing Qin},
  title        = {Deciphering the Impact of Pretraining Data on Large Language Models
                  through Machine Unlearning},
  journal      = {CoRR},
  volume       = {abs/2402.11537},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.11537},
  doi          = {10.48550/ARXIV.2402.11537},
  eprinttype   = {arXiv},
  eprint       = {2402.11537},
  timestamp    = {Tue, 05 Aug 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-11537.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2404.01677 (CoRR, 2024).
% Shares its title and author list with the LREC/COLING 2024 record stored
% under the key DBLP:conf/coling/SunDDCG0024; cite only one of the two.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@article{DBLP:journals/corr/abs-2404-01677,
  author       = {Zhouhao Sun and
                  Xiao Ding and
                  Li Du and
                  Bibo Cai and
                  Jinglong Gao and
                  Ting Liu and
                  Bing Qin},
  title        = {Towards Generalizable and Faithful Logic Reasoning over Natural Language
                  via Resolution Refutation},
  journal      = {CoRR},
  volume       = {abs/2404.01677},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.01677},
  doi          = {10.48550/ARXIV.2404.01677},
  eprinttype   = {arXiv},
  eprint       = {2404.01677},
  timestamp    = {Fri, 10 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-01677.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2408.12942 (CoRR, 2024).
% Shares its title with the ACL 2024 record stored under the key
% DBLP:conf/acl/SunDDMZQ0024; that record lists the first two authors in the
% opposite order. Cite only one of the two.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@article{DBLP:journals/corr/abs-2408-12942,
  author       = {Li Du and
                  Zhouhao Sun and
                  Xiao Ding and
                  Yixuan Ma and
                  Yang Zhao and
                  Kaitao Qiu and
                  Ting Liu and
                  Bing Qin},
  title        = {Causal-Guided Active Learning for Debiasing Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2408.12942},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2408.12942},
  doi          = {10.48550/ARXIV.2408.12942},
  eprinttype   = {arXiv},
  eprint       = {2408.12942},
  timestamp    = {Fri, 04 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2408-12942.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2023 conference paper.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@inproceedings{DBLP:conf/aaai/CaiDS00WS23,
  author       = {Bibo Cai and
                  Xiao Ding and
                  Zhouhao Sun and
                  Bing Qin and
                  Ting Liu and
                  Baojun Wang and
                  Lifeng Shang},
  editor       = {Brian Williams and
                  Yiling Chen and
                  Jennifer Neville},
  title        = {Self-Supervised Logic Induction for Explainable Fuzzy Temporal Commonsense
                  Reasoning},
  booktitle    = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2023, Thirty-Fifth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February
                  7-14, 2023},
  pages        = {12580--12588},
  publisher    = {{AAAI} Press},
  year         = {2023},
  url          = {https://doi.org/10.1609/aaai.v37i11.26481},
  doi          = {10.1609/AAAI.V37I11.26481},
  timestamp    = {Fri, 04 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/CaiDS00WS23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2023 (Volume 1: Long Papers) conference paper.
% URLs point directly at doi.org / dblp.org rather than through a proxy host.
@inproceedings{DBLP:conf/acl/DuDS00L23,
  author       = {Li Du and
                  Xiao Ding and
                  Zhouhao Sun and
                  Ting Liu and
                  Bing Qin and
                  Jingshuo Liu},
  editor       = {Anna Rogers and
                  Jordan L. Boyd{-}Graber and
                  Naoaki Okazaki},
  title        = {Towards Stable Natural Language Understanding via Information Entropy
                  Guided Debiasing},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {2868--2882},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.161},
  doi          = {10.18653/V1/2023.ACL-LONG.161},
  timestamp    = {Fri, 04 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/DuDS00L23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}