% BibTeX records: Yitao Hu

% Exported from the dblp computer science bibliography (.bib download).

% Sui et al. -- journal article, IEEE Trans. Parallel Distributed Syst. 37(2), 2026.
@article{DBLP:journals/tpds/SuiYHLW26,
  author       = {Yifan Sui and
                  Hanfei Yu and
                  Yitao Hu and
                  Jianxun Li and
                  Hao Wang},
  title        = {Accelerating {ML} Inference via Opportunistic Pre-Loading on Serverless
                  Clusters},
  journal      = {{IEEE} Trans. Parallel Distributed Syst.},
  volume       = {37},
  number       = {2},
  pages        = {472--488},
  year         = {2026},
  url          = {https://doi.org/10.1109/TPDS.2025.3638428},
  doi          = {10.1109/TPDS.2025.3638428},
  timestamp    = {Wed, 21 Jan 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tpds/SuiYHLW26.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Zheng et al. -- arXiv preprint 2601.06562 (CoRR), 2026.
@article{DBLP:journals/corr/abs-2601-06562,
  author       = {Liang Zheng and
                  Bowen Shi and
                  Yitao Hu and
                  Jiawei Zhang and
                  Ruofan Li and
                  Sheng Chen and
                  Wenxin Li and
                  Keqiu Li},
  title        = {Mosaic: Unlocking Long-Context Inference for Diffusion {LLMs} via Global
                  Memory Planning and Dynamic Peak Taming},
  journal      = {CoRR},
  volume       = {abs/2601.06562},
  year         = {2026},
  url          = {https://doi.org/10.48550/arXiv.2601.06562},
  doi          = {10.48550/ARXIV.2601.06562},
  eprinttype   = {arXiv},
  eprint       = {2601.06562},
  timestamp    = {Thu, 12 Feb 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2601-06562.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Zhao et al. -- journal article, IEEE Trans. Computers 74(4), 2025.
@article{DBLP:journals/tc/ZhaoHYGSZLLQ25,
  author       = {Zhixin Zhao and
                  Yitao Hu and
                  Guotao Yang and
                  Ziqi Gong and
                  Chen Shen and
                  Laiping Zhao and
                  Wenxin Li and
                  Xiulong Liu and
                  Wenyu Qu},
  title        = {{SLOpt}: Serving Real-Time Inference Pipeline With Strict Latency Constraint},
  journal      = {{IEEE} Trans. Computers},
  volume       = {74},
  number       = {4},
  pages        = {1431--1445},
  year         = {2025},
  url          = {https://doi.org/10.1109/TC.2025.3528125},
  doi          = {10.1109/TC.2025.3528125},
  timestamp    = {Fri, 30 Jan 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tc/ZhaoHYGSZLLQ25.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Hu et al. -- journal article, IEEE Trans. Computers 74(7), 2025.
@article{DBLP:journals/tc/HuLYLZZCZLL25,
  author       = {Yitao Hu and
                  Xiulong Liu and
                  Guotao Yang and
                  Linxuan Li and
                  Kai Zeng and
                  Zhixin Zhao and
                  Sheng Chen and
                  Laiping Zhao and
                  Wenxin Li and
                  Keqiu Li},
  title        = {{TightLLM}: Maximizing Throughput for {LLM} Inference via Adaptive Offloading
                  Policy},
  journal      = {{IEEE} Trans. Computers},
  volume       = {74},
  number       = {7},
  pages        = {2195--2209},
  year         = {2025},
  url          = {https://doi.org/10.1109/TC.2025.3558009},
  doi          = {10.1109/TC.2025.3558009},
  timestamp    = {Sat, 31 Jan 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tc/HuLYLZZCZLL25.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Gong et al. -- conference paper, ICPADS 2025 (Hefei, China).
@inproceedings{DBLP:conf/icpads/GongHCLL25,
  author       = {Ziqi Gong and
                  Yitao Hu and
                  Sheng Chen and
                  Wenxin Li and
                  Keqiu Li},
  title        = {{MoEoM}: Joint Compute and Memory-Aware Balancing for Fast {MoE} Inference},
  booktitle    = {31st {IEEE} International Conference on Parallel and Distributed Systems,
                  {ICPADS} 2025, Hefei, China, December 14-18, 2025},
  pages        = {1--10},
  publisher    = {{IEEE}},
  year         = {2025},
  url          = {https://doi.org/10.1109/ICPADS67057.2025.11323175},
  doi          = {10.1109/ICPADS67057.2025.11323175},
  timestamp    = {Wed, 04 Feb 2026 13:08:09 +0100},
  biburl       = {https://dblp.org/rec/conf/icpads/GongHCLL25.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Zhang et al. -- conference paper, IEEE INFOCOM 2025 (London, United Kingdom).
@inproceedings{DBLP:conf/infocom/Zhang0LLS0HZL25,
  author       = {Song Zhang and
                  Wenxin Li and
                  Yulong Li and
                  Yuan Liu and
                  Lide Suo and
                  Sheng Chen and
                  Yitao Hu and
                  Laiping Zhao and
                  Keqiu Li},
  title        = {Lark: {A} Buffer-aware Building Block for Programmable Packet Scheduling
                  in Datacenters},
  booktitle    = {{IEEE} {INFOCOM} 2025 - {IEEE} Conference on Computer Communications,
                  London, United Kingdom, May 19-22, 2025},
  pages        = {1--10},
  publisher    = {{IEEE}},
  year         = {2025},
  url          = {https://doi.org/10.1109/INFOCOM55648.2025.11044448},
  doi          = {10.1109/INFOCOM55648.2025.11044448},
  timestamp    = {Fri, 30 Jan 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/infocom/Zhang0LLS0HZL25.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Zhao et al. -- conference paper, IEEE INFOCOM 2025 (London, United Kingdom).
% A CoRR record with the same title and authors exists as DBLP:journals/corr/abs-2412-06161.
@inproceedings{DBLP:conf/infocom/ZhaoHGY0LLW25,
  author       = {Zhixin Zhao and
                  Yitao Hu and
                  Ziqi Gong and
                  Guotao Yang and
                  Wenxin Li and
                  Xiulong Liu and
                  Keqiu Li and
                  Hao Wang},
  title        = {Harpagon: Minimizing {DNN} Serving Cost via Efficient Dispatching,
                  Scheduling and Splitting},
  booktitle    = {{IEEE} {INFOCOM} 2025 - {IEEE} Conference on Computer Communications,
                  London, United Kingdom, May 19-22, 2025},
  pages        = {1--10},
  publisher    = {{IEEE}},
  year         = {2025},
  url          = {https://doi.org/10.1109/INFOCOM55648.2025.11044536},
  doi          = {10.1109/INFOCOM55648.2025.11044536},
  timestamp    = {Sat, 31 Jan 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/infocom/ZhaoHGY0LLW25.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Sui et al. -- arXiv preprint 2505.14468 (CoRR), 2025.
% NOTE(review): the name Hao Wang appears twice in the author list; presumably two
% distinct co-authors sharing a name -- confirm against the paper before de-duplicating.
@article{DBLP:journals/corr/abs-2505-14468,
  author       = {Yifan Sui and
                  Hao Wang and
                  Hanfei Yu and
                  Yitao Hu and
                  Jianxun Li and
                  Hao Wang},
  title        = {{ServerlessLoRA}: Minimizing Latency and Cost in Serverless Inference
                  for {LoRA}-Based {LLMs}},
  journal      = {CoRR},
  volume       = {abs/2505.14468},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2505.14468},
  doi          = {10.48550/ARXIV.2505.14468},
  eprinttype   = {arXiv},
  eprint       = {2505.14468},
  timestamp    = {Tue, 12 Aug 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2505-14468.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Wang et al. -- arXiv preprint 2511.12979 (CoRR), 2025.
@article{DBLP:journals/corr/abs-2511-12979,
  author       = {Zhengchao Wang and
                  Yitao Hu and
                  Jianing Ye and
                  Zhuxuan Chang and
                  Jiazheng Yu and
                  Youpeng Deng and
                  Keqiu Li},
  title        = {{RAGPulse}: An Open-Source {RAG} Workload Trace to Optimize {RAG} Serving
                  Systems},
  journal      = {CoRR},
  volume       = {abs/2511.12979},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2511.12979},
  doi          = {10.48550/ARXIV.2511.12979},
  eprinttype   = {arXiv},
  eprint       = {2511.12979},
  timestamp    = {Wed, 14 Jan 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2511-12979.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Ran et al. -- arXiv preprint 2511.18868 (CoRR), 2025.
@article{DBLP:journals/corr/abs-2511-18868,
  author       = {Dezhi Ran and
                  Shuxiao Xie and
                  Mingfang Ji and
                  Ziyue Hua and
                  Mengzhou Wu and
                  Yuan Cao and
                  Yuzhe Guo and
                  Hao Yu and
                  Linyi Li and
                  Yitao Hu and
                  Tao Xie},
  title        = {{KernelBand}: Boosting {LLM}-based Kernel Optimization with a Hierarchical
                  and Hardware-aware Multi-armed Bandit},
  journal      = {CoRR},
  volume       = {abs/2511.18868},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2511.18868},
  doi          = {10.48550/ARXIV.2511.18868},
  eprinttype   = {arXiv},
  eprint       = {2511.18868},
  timestamp    = {Wed, 14 Jan 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2511-18868.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Yi et al. -- arXiv preprint 2511.22333 (CoRR), 2025.
@article{DBLP:journals/corr/abs-2511-22333,
  author       = {Jinjun Yi and
                  Zhixin Zhao and
                  Yitao Hu and
                  Ke Yan and
                  Weiwei Sun and
                  Hao Wang and
                  Laiping Zhao and
                  Yuhao Zhang and
                  Wenxin Li and
                  Keqiu Li},
  title        = {{PAT:} Accelerating {LLM} Decoding via Prefix-Aware Attention with
                  Resource Efficient Multi-Tile Kernel},
  journal      = {CoRR},
  volume       = {abs/2511.22333},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2511.22333},
  doi          = {10.48550/ARXIV.2511.22333},
  eprinttype   = {arXiv},
  eprint       = {2511.22333},
  timestamp    = {Thu, 15 Jan 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2511-22333.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Wen et al. -- journal article, Int. J. Cogn. Informatics Nat. Intell. 18(1), 2024.
@article{DBLP:journals/ijcini/WenZHZW24,
  author       = {Wanzhi Wen and
                  Bin Zhang and
                  Yitao Hu and
                  Xingyu Zhu and
                  Zelin Wang},
  title        = {An {API} Recommendation Method for Querying Mobile Computing Problems},
  journal      = {Int. J. Cogn. Informatics Nat. Intell.},
  volume       = {18},
  number       = {1},
  pages        = {1--16},
  year         = {2024},
  url          = {https://doi.org/10.4018/ijcini.344422},
  doi          = {10.4018/IJCINI.344422},
  timestamp    = {Mon, 09 Dec 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ijcini/WenZHZW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Liu et al. -- conference paper, ASPLOS 2024, Volume 3 (La Jolla, CA, USA).
@inproceedings{DBLP:conf/asplos/LiuZLDCHSQ24,
  author       = {Guowei Liu and
                  Laiping Zhao and
                  Yiming Li and
                  Zhaolin Duan and
                  Sheng Chen and
                  Yitao Hu and
                  Zhiyuan Su and
                  Wenyu Qu},
  editor       = {Rajiv Gupta and
                  Nael B. Abu{-}Ghazaleh and
                  Madan Musuvathi and
                  Dan Tsafrir},
  title        = {{FUYAO:} {DPU}-enabled Direct Data Transfer for Serverless Computing},
  booktitle    = {Proceedings of the 29th {ACM} International Conference on Architectural
                  Support for Programming Languages and Operating Systems, Volume 3,
                  {ASPLOS} 2024, La Jolla, CA, USA, 27 April 2024 - 1 May 2024},
  pages        = {431--447},
  publisher    = {{ACM}},
  year         = {2024},
  url          = {https://doi.org/10.1145/3620666.3651327},
  doi          = {10.1145/3620666.3651327},
  timestamp    = {Fri, 30 Jan 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/asplos/LiuZLDCHSQ24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Sui et al. -- conference paper, ACM SoCC 2024 (Redmond, WA, USA).
@inproceedings{DBLP:conf/cloud/SuiYHLW24,
  author       = {Yifan Sui and
                  Hanfei Yu and
                  Yitao Hu and
                  Jianxun Li and
                  Hao Wang},
  title        = {Pre-Warming is Not Enough: Accelerating Serverless Inference With
                  Opportunistic Pre-Loading},
  booktitle    = {Proceedings of the 2024 {ACM} Symposium on Cloud Computing, SoCC 2024,
                  Redmond, WA, USA, November 20-22, 2024},
  pages        = {178--195},
  publisher    = {{ACM}},
  year         = {2024},
  url          = {https://doi.org/10.1145/3698038.3698509},
  doi          = {10.1145/3698038.3698509},
  timestamp    = {Mon, 02 Dec 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cloud/SuiYHLW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Suo et al. -- conference paper, ACM SIGCOMM 2024 (Sydney, NSW, Australia).
@inproceedings{DBLP:conf/sigcomm/SuoP0PLLHHL24,
  author       = {Lide Suo and
                  Yiren Pang and
                  Wenxin Li and
                  Renjie Pei and
                  Keqiu Li and
                  Xiulong Liu and
                  Xin He and
                  Yitao Hu and
                  Guyue Liu},
  title        = {{PPT:} {A} Pragmatic Transport for Datacenters},
  booktitle    = {Proceedings of the {ACM} {SIGCOMM} 2024 Conference, {ACM} {SIGCOMM}
                  2024, Sydney, NSW, Australia, August 4-8, 2024},
  pages        = {954--969},
  publisher    = {{ACM}},
  year         = {2024},
  url          = {https://doi.org/10.1145/3651890.3672235},
  doi          = {10.1145/3651890.3672235},
  timestamp    = {Sat, 31 Jan 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sigcomm/SuoP0PLLHHL24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Wu et al. -- arXiv preprint 2409.13311 (CoRR), 2024.
% NOTE(review): the title spelling Skill-Adpative is kept exactly as recorded;
% confirm against the arXiv record before changing it to Skill-Adaptive.
@article{DBLP:journals/corr/abs-2409-13311,
  author       = {Mengzhou Wu and
                  Hao Wang and
                  Jun Ren and
                  Yuan Cao and
                  Yuetong Li and
                  Alex Jiang and
                  Dezhi Ran and
                  Yitao Hu and
                  Wei Yang and
                  Tao Xie},
  title        = {Skill-Adpative Imitation Learning for {UI} Test Reuse},
  journal      = {CoRR},
  volume       = {abs/2409.13311},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2409.13311},
  doi          = {10.48550/ARXIV.2409.13311},
  eprinttype   = {arXiv},
  eprint       = {2409.13311},
  timestamp    = {Thu, 17 Oct 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2409-13311.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Zhao et al. -- arXiv preprint 2412.06161 (CoRR), 2024.
% Same title and authors as the INFOCOM 2025 record DBLP:conf/infocom/ZhaoHGY0LLW25;
% cite only one of the two to avoid a duplicate reference.
@article{DBLP:journals/corr/abs-2412-06161,
  author       = {Zhixin Zhao and
                  Yitao Hu and
                  Ziqi Gong and
                  Guotao Yang and
                  Wenxin Li and
                  Xiulong Liu and
                  Keqiu Li and
                  Hao Wang},
  title        = {Harpagon: Minimizing {DNN} Serving Cost via Efficient Dispatching,
                  Scheduling and Splitting},
  journal      = {CoRR},
  volume       = {abs/2412.06161},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2412.06161},
  doi          = {10.48550/ARXIV.2412.06161},
  eprinttype   = {arXiv},
  eprint       = {2412.06161},
  timestamp    = {Sat, 31 Jan 2026 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2412-06161.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Liu et al. -- journal article, IEEE Trans. Parallel Distributed Syst. 34(12), 2023.
@article{DBLP:journals/tpds/LiuLPPHLSL23,
  author       = {Hao Liu and
                  Wenxin Li and
                  Yiren Pang and
                  Renjie Pei and
                  Yitao Hu and
                  Yuan Liu and
                  Lide Suo and
                  Keqiu Li},
  title        = {Accelerating Data Delivery of Latency-Sensitive Applications in Container
                  Overlay Network},
  journal      = {{IEEE} Trans. Parallel Distributed Syst.},
  volume       = {34},
  number       = {12},
  pages        = {3046--3058},
  year         = {2023},
  url          = {https://doi.org/10.1109/TPDS.2023.3300745},
  doi          = {10.1109/TPDS.2023.3300745},
  timestamp    = {Wed, 20 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tpds/LiuLPPHLSL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Gao and Hu -- conference paper, ICA3PP 2023 (Tianjin, China), LNCS vol. 14487.
@inproceedings{DBLP:conf/ica3pp/GaoH23,
  author       = {Jiaheng Gao and
                  Yitao Hu},
  editor       = {Zahir Tari and
                  Keqiu Li and
                  Hongyi Wu},
  title        = {{DeepLat}: Achieving Minimum Worst Case Latency for {DNN} Inference
                  with Batch-Aware Dispatching},
  booktitle    = {Algorithms and Architectures for Parallel Processing - 23rd International
                  Conference, {ICA3PP} 2023, Tianjin, China, October 20-22, 2023, Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {14487},
  pages        = {109--129},
  publisher    = {Springer},
  year         = {2023},
  url          = {https://doi.org/10.1007/978-981-97-0834-5\_8},
  doi          = {10.1007/978-981-97-0834-5\_8},
  timestamp    = {Mon, 25 Mar 2024 20:43:51 +0100},
  biburl       = {https://dblp.org/rec/conf/ica3pp/GaoH23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Zhao et al. -- conference paper, IWQoS 2023 (Orlando, FL, USA).
@inproceedings{DBLP:conf/iwqos/ZhaoDZXHQYL23,
  author       = {Laiping Zhao and
                  Xinan Dai and
                  Zhixin Zhao and
                  Yusong Xin and
                  Yitao Hu and
                  Jun Qian and
                  Jun Yao and
                  Keqiu Li},
  title        = {High-throughput Sampling, Communicating and Training for Reinforcement
                  Learning Systems},
  booktitle    = {31st {IEEE/ACM} International Symposium on Quality of Service, IWQoS
                  2023, Orlando, FL, USA, June 19-21, 2023},
  pages        = {1--10},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/IWQoS57198.2023.10188703},
  doi          = {10.1109/IWQOS57198.2023.10188703},
  timestamp    = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iwqos/ZhaoDZXHQYL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Wen et al. -- journal article, Int. J. Cogn. Informatics Nat. Intell. 15(4), 2021.
@article{DBLP:journals/ijcini/WenWYZHLZ21,
  author       = {Wanzhi Wen and
                  Shiqiang Wang and
                  Bingqing Ye and
                  Xingyu Zhu and
                  Yitao Hu and
                  Xiaohong Lu and
                  Bin Zhang},
  title        = {{API} Recommendation Based on {WII-WMD}},
  journal      = {Int. J. Cogn. Informatics Nat. Intell.},
  volume       = {15},
  number       = {4},
  pages        = {1--20},
  year         = {2021},
  url          = {https://doi.org/10.4018/ijcini.20211001.oa16},
  doi          = {10.4018/IJCINI.20211001.OA16},
  timestamp    = {Wed, 24 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijcini/WenWYZHLZ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Hu, Ghosh and Govindan -- conference paper, ACM SoCC 2021 (Seattle, WA, USA).
@inproceedings{DBLP:conf/cloud/HuGG21,
  author       = {Yitao Hu and
                  Rajrup Ghosh and
                  Ramesh Govindan},
  editor       = {Carlo Curino and
                  Georgia Koutrika and
                  Ravi Netravali},
  title        = {Scrooge: {A} Cost-Effective Deep Learning Inference System},
  booktitle    = {SoCC '21: {ACM} Symposium on Cloud Computing, Seattle, WA, USA, November
                  1 - 4, 2021},
  pages        = {624--638},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://doi.org/10.1145/3472883.3486993},
  doi          = {10.1145/3472883.3486993},
  timestamp    = {Thu, 23 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cloud/HuGG21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Hu et al. -- conference paper, IoTDI 2021 (Virtual Event / Charlottesville, VA, USA).
@inproceedings{DBLP:conf/iotdi/HuPLGKLG21,
  author       = {Yitao Hu and
                  Weiwu Pang and
                  Xiaochen Liu and
                  Rajrup Ghosh and
                  Bongjun Ko and
                  Wei{-}Han Lee and
                  Ramesh Govindan},
  title        = {Rim: Offloading Inference to the Edge},
  booktitle    = {IoTDI '21: International Conference on Internet-of-Things Design and
                  Implementation, Virtual Event / Charlottesville, VA, USA, May 18-21,
                  2021},
  pages        = {80--92},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://doi.org/10.1145/3450268.3453521},
  doi          = {10.1145/3450268.3453521},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iotdi/HuPLGKLG21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Xi et al. -- journal article, Electron. Libr. 36(6), 2018.
@article{DBLP:journals/el/XiZHTB18,
  author       = {Qingkui Xi and
                  Heng Zhao and
                  Yitao Hu and
                  Yunjuan Tong and
                  Ping Bao},
  title        = {Case studies and comparison between two models for assessing library
                  service quality},
  journal      = {Electron. Libr.},
  volume       = {36},
  number       = {6},
  pages        = {1099--1113},
  year         = {2018},
  url          = {https://doi.org/10.1108/EL-11-2016-0246},
  doi          = {10.1108/EL-11-2016-0246},
  timestamp    = {Sun, 19 Jan 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/el/XiZHTB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Hu et al. -- conference paper, Middleware 2018 (Rennes, France).
@inproceedings{DBLP:conf/middleware/HuRKG18,
  author       = {Yitao Hu and
                  Swati Rallapalli and
                  Bongjun Ko and
                  Ramesh Govindan},
  editor       = {Paulo Ferreira and
                  Liuba Shrira},
  title        = {Olympian: Scheduling {GPU} Usage in a Deep Neural Network Model Serving
                  System},
  booktitle    = {Proceedings of the 19th International Middleware Conference, Middleware
                  2018, Rennes, France, December 10-14, 2018},
  pages        = {53--65},
  publisher    = {{ACM}},
  year         = {2018},
  url          = {https://doi.org/10.1145/3274808.3274813},
  doi          = {10.1145/3274808.3274813},
  timestamp    = {Wed, 14 Nov 2018 10:08:26 +0100},
  biburl       = {https://dblp.org/rec/conf/middleware/HuRKG18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Hu et al. -- conference paper, UbiComp 2016 (Heidelberg, Germany).
@inproceedings{DBLP:conf/huc/HuLNG16,
  author       = {Yitao Hu and
                  Xiaochen Liu and
                  Suman Nath and
                  Ramesh Govindan},
  editor       = {Paul Lukowicz and
                  Antonio Kr{\"{u}}ger and
                  Andreas Bulling and
                  Youn{-}Kyung Lim and
                  Shwetak N. Patel},
  title        = {{ALPS:} accurate landmark positioning at city scales},
  booktitle    = {Proceedings of the 2016 {ACM} International Joint Conference on Pervasive
                  and Ubiquitous Computing, UbiComp 2016, Heidelberg, Germany, September
                  12-16, 2016},
  pages        = {1147--1158},
  publisher    = {{ACM}},
  year         = {2016},
  url          = {https://doi.org/10.1145/2971648.2971674},
  doi          = {10.1145/2971648.2971674},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/huc/HuLNG16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Shaohan Hu et al. -- conference paper, IEEE RTSS 2015 (San Antonio, Texas, USA).
@inproceedings{DBLP:conf/rtss/HuYJZHLNLKDSBSG15,
  author       = {Shaohan Hu and
                  Shuochao Yao and
                  Haiming Jin and
                  Yiran Zhao and
                  Yitao Hu and
                  Xiaochen Liu and
                  Nooreddin Naghibolhosseini and
                  Shen Li and
                  Akash Kapoor and
                  William Dron and
                  Lu Su and
                  Amotz Bar{-}Noy and
                  Pedro A. Szekely and
                  Ramesh Govindan and
                  Reginald L. Hobbs and
                  Tarek F. Abdelzaher},
  title        = {Data Acquisition for Real-Time Decision-Making under Freshness Constraints},
  booktitle    = {2015 {IEEE} Real-Time Systems Symposium, {RTSS} 2015, San Antonio,
                  Texas, USA, December 1-4, 2015},
  pages        = {185--194},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/RTSS.2015.25},
  doi          = {10.1109/RTSS.2015.25},
  timestamp    = {Tue, 14 Jan 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/rtss/HuYJZHLNLKDSBSG15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Hu, Wang and Gan -- conference paper, IEEE INFOCOM 2014 (Toronto, Canada).
@inproceedings{DBLP:conf/infocom/HuWG14,
  author       = {Yitao Hu and
                  Xinbing Wang and
                  Xiaoying Gan},
  title        = {Critical sensing range for mobile heterogeneous camera sensor networks},
  booktitle    = {2014 {IEEE} Conference on Computer Communications, {INFOCOM} 2014,
                  Toronto, Canada, April 27 - May 2, 2014},
  pages        = {970--978},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/INFOCOM.2014.6848026},
  doi          = {10.1109/INFOCOM.2014.6848026},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/infocom/HuWG14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}