BibTeX records: Xu Yang 0021

download as .bib file

% Journal article (Artif. Intell., vol. 348, 2025).
% The quoted word in the title uses TeX quote ligatures (``...'') because a
% straight double quote typesets as a closing quote on both sides.
@article{DBLP:journals/ai/FengWYG25,
  author       = {Feng, Fu and
                  Wang, Jing and
                  Yang, Xu and
                  Geng, Xin},
  title        = {Learngene: Inheritable ``genes'' in intelligent agents},
  journal      = {Artif. Intell.},
  volume       = {348},
  pages        = {104421},
  year         = {2025},
  url          = {https://doi.org/10.1016/j.artint.2025.104421},
  doi          = {10.1016/J.ARTINT.2025.104421},
  timestamp    = {Thu, 02 Oct 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ai/FengWYG25.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI-25, pp. 8487--8495. Names are in "Last, First" form.
@inproceedings{DBLP:conf/aaai/WuZCLLCQSZW025,
  author       = {Wu, Yongliang and
                  Zhu, Wenbo and
                  Cao, Jiawang and
                  Lu, Yi and
                  Li, Bozheng and
                  Chi, Weiheng and
                  Qiu, Zihan and
                  Su, Lirian and
                  Zheng, Haolin and
                  Wu, Jay and
                  Yang, Xu},
  editor       = {Walsh, Toby and
                  Shah, Julie and
                  Kolter, Zico},
  title        = {Video Repurposing from User Generated Content: {A} Large-scale Dataset
                  and Benchmark},
  booktitle    = {AAAI-25, Sponsored by the Association for the Advancement of Artificial
                  Intelligence, February 25 - March 4, 2025, Philadelphia, PA, {USA}},
  pages        = {8487--8495},
  publisher    = {{AAAI} Press},
  year         = {2025},
  url          = {https://doi.org/10.1609/aaai.v39i8.32916},
  doi          = {10.1609/AAAI.V39I8.32916},
  timestamp    = {Tue, 05 Aug 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/WuZCLLCQSZW025.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI-25, pp. 8496--8504. A CoRR record with the same title
% exists in this file under DBLP:journals/corr/abs-2405-15304.
@inproceedings{DBLP:conf/aaai/WuZYWCZHZ025,
  author       = {Wu, Yongliang and
                  Zhou, Shiji and
                  Yang, Mingzhuo and
                  Wang, Lianzhe and
                  Chang, Heng and
                  Zhu, Wenbo and
                  Hu, Xinting and
                  Zhou, Xiao and
                  Yang, Xu},
  editor       = {Walsh, Toby and
                  Shah, Julie and
                  Kolter, Zico},
  title        = {Unlearning Concepts in Diffusion Model via Concept Domain Correction
                  and Concept Preserving Gradient},
  booktitle    = {AAAI-25, Sponsored by the Association for the Advancement of Artificial
                  Intelligence, February 25 - March 4, 2025, Philadelphia, PA, {USA}},
  pages        = {8496--8504},
  publisher    = {{AAAI} Press},
  year         = {2025},
  url          = {https://doi.org/10.1609/aaai.v39i8.32917},
  doi          = {10.1609/AAAI.V39I8.32917},
  timestamp    = {Thu, 17 Apr 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/WuZYWCZHZ025.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, CVPR 2025, pp. 18444--18454.
% The title restores the angle-bracketed token that the url slug
% (Redefining_Creative_in_Dictionary) shows was dropped from the exported title.
% NOTE(review): confirm the exact bracket form against the published paper.
@inproceedings{DBLP:conf/cvpr/FengXYW025,
  author       = {Feng, Fu and
                  Xie, Yucheng and
                  Yang, Xu and
                  Wang, Jing and
                  Geng, Xin},
  title        = {Redefining {\textless}{Creative}{\textgreater} in Dictionary: Towards
                  an Enhanced Semantic Understanding of Creative Generation},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2025, Nashville, TN, USA, June 11-15, 2025},
  pages        = {18444--18454},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2025},
  url          = {https://openaccess.thecvf.com/content/CVPR2025/html/Feng\_Redefining\_Creative\_in\_Dictionary\_Towards\_an\_Enhanced\_Semantic\_Understanding\_of\_CVPR\_2025\_paper.html},
  doi          = {10.1109/CVPR52734.2025.01719},
  timestamp    = {Wed, 20 Aug 2025 10:18:56 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/FengXYW025.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, IUI 2025, pp. 1048--1063. Names are in "Last, First" form;
% accented letters keep their braced LaTeX escapes.
@inproceedings{DBLP:conf/iui/PengQZZL00R025,
  author       = {Peng, Yingzhe and
                  Qin, Xiaoting and
                  Zhang, Zhiyang and
                  Zhang, Jue and
                  Lin, Qingwei and
                  Yang, Xu and
                  Zhang, Dongmei and
                  Rajmohan, Saravan and
                  Zhang, Qi},
  editor       = {Li, Toby and
                  Patern{\`{o}}, Fabio and
                  V{\"{a}}{\"{a}}n{\"{a}}nen, Kaisa and
                  Leiva, Luis and
                  Spano, Lucio Davide and
                  Verbert, Katrien},
  title        = {Navigating the Unknown: {A} Chat-Based Collaborative Interface for
                  Personalized Exploratory Tasks},
  booktitle    = {Proceedings of the 30th International Conference on Intelligent User
                  Interfaces, {IUI} 2025, Cagliari, Italy, March 24-27, 2025},
  pages        = {1048--1063},
  publisher    = {{ACM}},
  year         = {2025},
  url          = {https://doi.org/10.1145/3708359.3712093},
  doi          = {10.1145/3708359.3712093},
  timestamp    = {Fri, 04 Jul 2025 22:08:42 +0200},
  biburl       = {https://dblp.org/rec/conf/iui/PengQZZL00R025.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2501.05775, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2501-05775,
  author       = {Guo, Shunxin and
                  Wang, Hongsong and
                  Lin, Shuxia and
                  Yang, Xu and
                  Geng, Xin},
  title        = {{STHFL:} Spatio-Temporal Heterogeneous Federated Learning},
  journal      = {CoRR},
  volume       = {abs/2501.05775},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2501.05775},
  doi          = {10.48550/ARXIV.2501.05775},
  eprinttype   = {arXiv},
  eprint       = {2501.05775},
  timestamp    = {Thu, 20 Feb 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2501-05775.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2502.01662, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2502-01662,
  author       = {Fu, Jiale and
                  Jiang, Yuchu and
                  Chen, Junkai and
                  Fan, Jiaming and
                  Geng, Xin and
                  Yang, Xu},
  title        = {Speculative Ensemble: Fast Large Language Model Ensemble via Speculation},
  journal      = {CoRR},
  volume       = {abs/2502.01662},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2502.01662},
  doi          = {10.48550/ARXIV.2502.01662},
  eprinttype   = {arXiv},
  eprint       = {2502.01662},
  timestamp    = {Tue, 11 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2502-01662.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2503.07536, recorded as a CoRR article.
% "3B" and "LMMs" are braced so sentence-casing styles do not lower-case them.
@article{DBLP:journals/corr/abs-2503-07536,
  author       = {Peng, Yingzhe and
                  Zhang, Gongrui and
                  Zhang, Miaosen and
                  You, Zhiyuan and
                  Liu, Jie and
                  Zhu, Qipeng and
                  Yang, Kai and
                  Xu, Xingzhong and
                  Geng, Xin and
                  Yang, Xu},
  title        = {{LMM-R1:} Empowering {3B} {LMMs} with Strong Reasoning Abilities Through
                  Two-Stage Rule-Based {RL}},
  journal      = {CoRR},
  volume       = {abs/2503.07536},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2503.07536},
  doi          = {10.48550/ARXIV.2503.07536},
  eprinttype   = {arXiv},
  eprint       = {2503.07536},
  timestamp    = {Sun, 13 Apr 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2503-07536.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2504.08851, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2504-08851,
  author       = {Jiang, Yuchu and
                  Fu, Jiale and
                  Hao, Chenduo and
                  Hu, Xinting and
                  Peng, Yingzhe and
                  Geng, Xin and
                  Yang, Xu},
  title        = {Mimic In-Context Learning for Multimodal Tasks},
  journal      = {CoRR},
  volume       = {abs/2504.08851},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2504.08851},
  doi          = {10.48550/ARXIV.2504.08851},
  eprinttype   = {arXiv},
  eprint       = {2504.08851},
  timestamp    = {Thu, 22 May 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2504-08851.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2504.14200, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2504-14200,
  author       = {Chen, Huiyi and
                  Peng, Jiawei and
                  Tang, Kaihua and
                  Geng, Xin and
                  Yang, Xu},
  title        = {Enhancing Multimodal In-Context Learning for Image Classification
                  through Coreset Optimization},
  journal      = {CoRR},
  volume       = {abs/2504.14200},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2504.14200},
  doi          = {10.48550/ARXIV.2504.14200},
  eprinttype   = {arXiv},
  eprint       = {2504.14200},
  timestamp    = {Thu, 22 May 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2504-14200.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2505.03667, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2505-03667,
  author       = {Feng, Fu and
                  Xie, Yucheng and
                  Yang, Xu and
                  Wang, Jing and
                  Geng, Xin},
  title        = {Distribution-Conditional Generation: From Class Distribution to Creative
                  Generation},
  journal      = {CoRR},
  volume       = {abs/2505.03667},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2505.03667},
  doi          = {10.48550/ARXIV.2505.03667},
  eprinttype   = {arXiv},
  eprint       = {2505.03667},
  timestamp    = {Mon, 23 Jun 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2505-03667.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2505.12728, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2505-12728,
  author       = {Wang, Zihua and
                  Li, Ruibo and
                  Du, Haozhe and
                  Zhou, Joey Tianyi and
                  Zhang, Yu and
                  Yang, Xu},
  title        = {{FLASH:} Latent-Aware Semi-Autoregressive Speculative Decoding for
                  Multimodal Tasks},
  journal      = {CoRR},
  volume       = {abs/2505.12728},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2505.12728},
  doi          = {10.48550/ARXIV.2505.12728},
  eprinttype   = {arXiv},
  eprint       = {2505.12728},
  timestamp    = {Fri, 27 Jun 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2505-12728.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2506.16673, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2506-16673,
  author       = {Chen, Ruiming and
                  Yang, Junming and
                  Xia, Shiyu and
                  Yang, Xu and
                  Wang, Jing and
                  Geng, Xin},
  title        = {Extracting Multimodal Learngene in {CLIP:} Unveiling the Multimodal
                  Generalizable Knowledge},
  journal      = {CoRR},
  volume       = {abs/2506.16673},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2506.16673},
  doi          = {10.48550/ARXIV.2506.16673},
  eprinttype   = {arXiv},
  eprint       = {2506.16673},
  timestamp    = {Sun, 13 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2506-16673.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2507.08021, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2507-08021,
  author       = {Li, Li and
                  Wu, Yongliang and
                  Zhu, Jingze and
                  Peng, Jiawei and
                  Cai, Jianfei and
                  Yang, Xu},
  title        = {Unveiling Effective In-Context Configurations for Image Captioning:
                  An External {\&} Internal Analysis},
  journal      = {CoRR},
  volume       = {abs/2507.08021},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2507.08021},
  doi          = {10.48550/ARXIV.2507.08021},
  eprinttype   = {arXiv},
  eprint       = {2507.08021},
  timestamp    = {Thu, 14 Aug 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2507-08021.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2507.08710, recorded as a CoRR article.
% The metric name is braced so sentence-casing styles keep its mixed case.
@article{DBLP:journals/corr/abs-2507-08710,
  author       = {Li, Li and
                  Peng, Yingzhe and
                  Yang, Xu and
                  Cheng, Ruoxi and
                  Xu, Haiyang and
                  Yan, Ming and
                  Huang, Fei},
  title        = {{L-CLIPScore:} a Lightweight Embedding-based Captioning Metric for Evaluating
                  and Training},
  journal      = {CoRR},
  volume       = {abs/2507.08710},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2507.08710},
  doi          = {10.48550/ARXIV.2507.08710},
  eprinttype   = {arXiv},
  eprint       = {2507.08710},
  timestamp    = {Thu, 14 Aug 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2507-08710.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (Frontiers Comput. Sci., vol. 18, no. 5, 2024).
@article{DBLP:journals/fcsc/WuY24,
  author       = {Wu, Yongliang and
                  Yang, Xu},
  title        = {A glance at in-context learning},
  journal      = {Frontiers Comput. Sci.},
  volume       = {18},
  number       = {5},
  pages        = {185347},
  year         = {2024},
  url          = {https://doi.org/10.1007/s11704-024-40013-9},
  doi          = {10.1007/S11704-024-40013-9},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/fcsc/WuY24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (Neural Comput. Appl., vol. 36, no. 2, pp. 929--942, 2024).
@article{DBLP:journals/nca/ZhangCXZYG24,
  author       = {Zhang, Boyu and
                  Chen, Jiayuan and
                  Xu, Yinfei and
                  Zhang, Hui and
                  Yang, Xu and
                  Geng, Xin},
  title        = {Auto-encoding score distribution regression for action quality assessment},
  journal      = {Neural Comput. Appl.},
  volume       = {36},
  number       = {2},
  pages        = {929--942},
  year         = {2024},
  url          = {https://doi.org/10.1007/s00521-023-09068-w},
  doi          = {10.1007/S00521-023-09068-W},
  timestamp    = {Mon, 10 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/nca/ZhangCXZYG24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI 2024, pp. 14946--14954.
% The EAAI year in booktitle is 2024, matching the co-located AAAI/IAAI 2024
% events and the February 2024 dates; the exported record said 2014.
@inproceedings{DBLP:conf/aaai/ShiXYCK024,
  author       = {Shi, Boyu and
                  Xia, Shiyu and
                  Yang, Xu and
                  Chen, Haokun and
                  Kou, Zhiqiang and
                  Geng, Xin},
  editor       = {Wooldridge, Michael J. and
                  Dy, Jennifer G. and
                  Natarajan, Sriraam},
  title        = {Building Variable-Sized Models via Learngene Pool},
  booktitle    = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2024, Thirty-Sixth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver,
                  Canada},
  pages        = {14946--14954},
  publisher    = {{AAAI} Press},
  year         = {2024},
  url          = {https://doi.org/10.1609/aaai.v38i13.29415},
  doi          = {10.1609/AAAI.V38I13.29415},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaai/ShiXYCK024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI 2024, pp. 16014--16022.
% The EAAI year in booktitle is 2024, matching the co-located AAAI/IAAI 2024
% events and the February 2024 dates; the exported record said 2014.
@inproceedings{DBLP:conf/aaai/XiaZYCCG24,
  author       = {Xia, Shiyu and
                  Zhang, Miaosen and
                  Yang, Xu and
                  Chen, Ruiming and
                  Chen, Haokun and
                  Geng, Xin},
  editor       = {Wooldridge, Michael J. and
                  Dy, Jennifer G. and
                  Natarajan, Sriraam},
  title        = {Transformer as Linear Expansion of Learngene},
  booktitle    = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2024, Thirty-Sixth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver,
                  Canada},
  pages        = {16014--16022},
  publisher    = {{AAAI} Press},
  year         = {2024},
  url          = {https://doi.org/10.1609/aaai.v38i14.29533},
  doi          = {10.1609/AAAI.V38I14.29533},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaai/XiaZYCCG24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, CVPR 2024, pp. 26700--26710.
@inproceedings{DBLP:conf/cvpr/LiPCGY24,
  author       = {Li, Li and
                  Peng, Jiawei and
                  Chen, Huiyi and
                  Gao, Chongyang and
                  Yang, Xu},
  title        = {How to Configure Good In-Context Sequence for Visual Question Answering},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2024, Seattle, WA, USA, June 16-22, 2024},
  pages        = {26700--26710},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/CVPR52733.2024.02522},
  doi          = {10.1109/CVPR52733.2024.02522},
  timestamp    = {Sun, 19 Jan 2025 13:39:05 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/LiPCGY24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICML 2024 (OpenReview record; no page range in the export).
@inproceedings{DBLP:conf/icml/WangYC024,
  author       = {Wang, Qiufeng and
                  Yang, Xu and
                  Chen, Haokun and
                  Geng, Xin},
  title        = {Vision Transformers as Probabilistic Expansion from Learngene},
  booktitle    = {Forty-first International Conference on Machine Learning, {ICML} 2024,
                  Vienna, Austria, July 21-27, 2024},
  publisher    = {OpenReview.net},
  year         = {2024},
  url          = {https://openreview.net/forum?id=5ExWEazod5},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/WangYC024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, IJCAI 2024, pp. 5254--5262. A CoRR record with the same
% title and authors exists in this file under DBLP:journals/corr/abs-2404-16897.
@inproceedings{DBLP:conf/ijcai/XiaZY024,
  author       = {Xia, Shiyu and
                  Zhu, Wenxuan and
                  Yang, Xu and
                  Geng, Xin},
  title        = {Exploring Learngene via Stage-wise Weight Sharing for Initializing
                  Variable-sized Models},
  booktitle    = {Proceedings of the Thirty-Third International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2024, Jeju, South Korea, August 3-9,
                  2024},
  pages        = {5254--5262},
  publisher    = {ijcai.org},
  year         = {2024},
  url          = {https://www.ijcai.org/proceedings/2024/581},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcai/XiaZY024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, NeurIPS 2024 (no page range in the export).
% NOTE(review): booktitle volume changed from 38 to 37 and the first editor's
% surname from "Globersons" to "Globerson"; confirm both against the official
% NeurIPS 2024 proceedings page.
@inproceedings{DBLP:conf/nips/00020F0024,
  author       = {Wang, Qiufeng and
                  Yang, Xu and
                  Feng, Fu and
                  Wang, Jing and
                  Geng, Xin},
  editor       = {Globerson, Amir and
                  Mackey, Lester and
                  Belgrave, Danielle and
                  Fan, Angela and
                  Paquet, Ulrich and
                  Tomczak, Jakub M. and
                  Zhang, Cheng},
  title        = {Cluster-Learngene: Inheriting Adaptive Clusters for Vision Transformers},
  booktitle    = {Advances in Neural Information Processing Systems 37: Annual Conference
                  on Neural Information Processing Systems 2024, NeurIPS 2024, Vancouver,
                  BC, Canada, December 10 - 15, 2024},
  year         = {2024},
  url          = {http://papers.nips.cc/paper\_files/paper/2024/hash/2e53c02ea028cbf603f4b6b47fef3d97-Abstract-Conference.html},
  timestamp    = {Thu, 13 Feb 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/00020F0024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, NeurIPS 2024 (no page range in the export).
% NOTE(review): booktitle volume changed from 38 to 37 and the first editor's
% surname from "Globersons" to "Globerson"; confirm both against the official
% NeurIPS 2024 proceedings page.
@inproceedings{DBLP:conf/nips/PengHHP0024,
  author       = {Peng, Yingzhe and
                  Hao, Chenduo and
                  Hu, Xinting and
                  Peng, Jiawei and
                  Geng, Xin and
                  Yang, Xu},
  editor       = {Globerson, Amir and
                  Mackey, Lester and
                  Belgrave, Danielle and
                  Fan, Angela and
                  Paquet, Ulrich and
                  Tomczak, Jakub M. and
                  Zhang, Cheng},
  title        = {{LIVE:} Learnable In-Context Vector for Visual Question Answering},
  booktitle    = {Advances in Neural Information Processing Systems 37: Annual Conference
                  on Neural Information Processing Systems 2024, NeurIPS 2024, Vancouver,
                  BC, Canada, December 10 - 15, 2024},
  year         = {2024},
  url          = {http://papers.nips.cc/paper\_files/paper/2024/hash/12d3e63be5574088f7c1bbc9162060bf-Abstract-Conference.html},
  timestamp    = {Thu, 13 Feb 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/PengHHP0024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, NeurIPS 2024 (no page range in the export).
% NOTE(review): booktitle volume changed from 38 to 37 and the first editor's
% surname from "Globersons" to "Globerson"; confirm both against the official
% NeurIPS 2024 proceedings page.
@inproceedings{DBLP:conf/nips/XiaZ0024,
  author       = {Xia, Shiyu and
                  Zu, Yuankun and
                  Yang, Xu and
                  Geng, Xin},
  editor       = {Globerson, Amir and
                  Mackey, Lester and
                  Belgrave, Danielle and
                  Fan, Angela and
                  Paquet, Ulrich and
                  Tomczak, Jakub M. and
                  Zhang, Cheng},
  title        = {Initializing Variable-sized Vision Transformers from Learngene with
                  Learnable Transformation},
  booktitle    = {Advances in Neural Information Processing Systems 37: Annual Conference
                  on Neural Information Processing Systems 2024, NeurIPS 2024, Vancouver,
                  BC, Canada, December 10 - 15, 2024},
  year         = {2024},
  url          = {http://papers.nips.cc/paper\_files/paper/2024/hash/4c5e2bcbf21bdf40d75fddad0bd43dc9-Abstract-Conference.html},
  timestamp    = {Thu, 13 Feb 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/XiaZ0024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, NeurIPS 2024 (no page range in the export).
% NOTE(review): booktitle volume changed from 38 to 37 and the first editor's
% surname from "Globersons" to "Globerson"; confirm both against the official
% NeurIPS 2024 proceedings page.
@inproceedings{DBLP:conf/nips/YangPMXZHZ24,
  author       = {Yang, Xu and
                  Peng, Yingzhe and
                  Ma, Haoxuan and
                  Xu, Shuo and
                  Zhang, Chi and
                  Han, Yucheng and
                  Zhang, Hanwang},
  editor       = {Globerson, Amir and
                  Mackey, Lester and
                  Belgrave, Danielle and
                  Fan, Angela and
                  Paquet, Ulrich and
                  Tomczak, Jakub M. and
                  Zhang, Cheng},
  title        = {Lever {LM:} Configuring In-Context Sequence to Lever Large Vision
                  Language Models},
  booktitle    = {Advances in Neural Information Processing Systems 37: Annual Conference
                  on Neural Information Processing Systems 2024, NeurIPS 2024, Vancouver,
                  BC, Canada, December 10 - 15, 2024},
  year         = {2024},
  url          = {http://papers.nips.cc/paper\_files/paper/2024/hash/b619cd6dcc986856b8a8da2b08d89396-Abstract-Conference.html},
  timestamp    = {Wed, 19 Feb 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/YangPMXZHZ24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2404.16897, recorded as a CoRR article. The IJCAI 2024 record
% with the same title and authors is DBLP:conf/ijcai/XiaZY024.
@article{DBLP:journals/corr/abs-2404-16897,
  author       = {Xia, Shiyu and
                  Zhu, Wenxuan and
                  Yang, Xu and
                  Geng, Xin},
  title        = {Exploring Learngene via Stage-wise Weight Sharing for Initializing
                  Variable-sized Models},
  journal      = {CoRR},
  volume       = {abs/2404.16897},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.16897},
  doi          = {10.48550/ARXIV.2404.16897},
  eprinttype   = {arXiv},
  eprint       = {2404.16897},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-16897.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2404.17534, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2404-17534,
  author       = {Huang, Yuhang and
                  Wu, Zihan and
                  Gao, Chongyang and
                  Peng, Jiawei and
                  Yang, Xu},
  title        = {Exploring the Distinctiveness and Fidelity of the Descriptions Generated
                  by Large Vision-Language Models},
  journal      = {CoRR},
  volume       = {abs/2404.17534},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.17534},
  doi          = {10.48550/ARXIV.2404.17534},
  eprinttype   = {arXiv},
  eprint       = {2404.17534},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-17534.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2405.15304, recorded as a CoRR article. The AAAI-25 record
% with the same title is DBLP:conf/aaai/WuZYWCZHZ025.
@article{DBLP:journals/corr/abs-2405-15304,
  author       = {Wu, Yongliang and
                  Zhou, Shiji and
                  Yang, Mingzhuo and
                  Wang, Lianzhe and
                  Zhu, Wenbo and
                  Chang, Heng and
                  Zhou, Xiao and
                  Yang, Xu},
  title        = {Unlearning Concepts in Diffusion Model via Concept Domain Correction
                  and Concept Preserving Gradient},
  journal      = {CoRR},
  volume       = {abs/2405.15304},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2405.15304},
  doi          = {10.48550/ARXIV.2405.15304},
  eprinttype   = {arXiv},
  eprint       = {2405.15304},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2405-15304.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2406.13185, recorded as a CoRR article.
% NOTE(review): presumably the preprint of DBLP:conf/nips/PengHHP0024, whose
% title differs only by a "LIVE:" prefix; confirm before merging citations.
@article{DBLP:journals/corr/abs-2406-13185,
  author       = {Peng, Yingzhe and
                  Hao, Chenduo and
                  Yang, Xu and
                  Peng, Jiawei and
                  Hu, Xinting and
                  Geng, Xin},
  title        = {Learnable In-Context Vector for Visual Question Answering},
  journal      = {CoRR},
  volume       = {abs/2406.13185},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2406.13185},
  doi          = {10.48550/ARXIV.2406.13185},
  eprinttype   = {arXiv},
  eprint       = {2406.13185},
  timestamp    = {Tue, 01 Apr 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2406-13185.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record exported from dblp.
@article{DBLP:journals/corr/abs-2406-17309,
  author       = {Yongliang Wu and
                  Bozheng Li and
                  Jiawang Cao and
                  Wenbo Zhu and
                  Yi Lu and
                  Weiheng Chi and
                  Chuyun Xie and
                  Haolin Zheng and
                  Ziyue Su and
                  Jay Wu and
                  Xu Yang},
  title        = {Zero-Shot Long-Form Video Understanding through Screenplay},
  journal      = {CoRR},
  volume       = {abs/2406.17309},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2406.17309},
  doi          = {10.48550/ARXIV.2406.17309},
  eprinttype   = {arXiv},
  eprint       = {2406.17309},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2406-17309.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record exported from dblp.
@article{DBLP:journals/corr/abs-2409-13538,
  author       = {Yingzhe Peng and
                  Yixiao Yuan and
                  Zitian Ao and
                  Huapeng Zhou and
                  Kangqi Wang and
                  Qipeng Zhu and
                  Xu Yang},
  title        = {First Place Solution to the Multiple-choice Video {QA} Track of The
                  Second Perception Test Challenge},
  journal      = {CoRR},
  volume       = {abs/2409.13538},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2409.13538},
  doi          = {10.48550/ARXIV.2409.13538},
  eprinttype   = {arXiv},
  eprint       = {2409.13538},
  timestamp    = {Wed, 05 Feb 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2409-13538.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record exported from dblp.
@article{DBLP:journals/corr/abs-2410-24032,
  author       = {Yingzhe Peng and
                  Xiaoting Qin and
                  Zhiyang Zhang and
                  Jue Zhang and
                  Qingwei Lin and
                  Xu Yang and
                  Dongmei Zhang and
                  Saravan Rajmohan and
                  Qi Zhang},
  title        = {Navigating the Unknown: {A} Chat-Based Collaborative Interface for
                  Personalized Exploratory Tasks},
  journal      = {CoRR},
  volume       = {abs/2410.24032},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2410.24032},
  doi          = {10.48550/ARXIV.2410.24032},
  eprinttype   = {arXiv},
  eprint       = {2410.24032},
  timestamp    = {Wed, 05 Feb 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2410-24032.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record. Same title and author list as the AAAI-25 entry
% DBLP:conf/aaai/WuZCLLCQSZW025 in this file; presumably its preprint - cite only one.
@article{DBLP:journals/corr/abs-2412-08879,
  author       = {Yongliang Wu and
                  Wenbo Zhu and
                  Jiawang Cao and
                  Yi Lu and
                  Bozheng Li and
                  Weiheng Chi and
                  Zihan Qiu and
                  Lirian Su and
                  Haolin Zheng and
                  Jay Wu and
                  Xu Yang},
  title        = {Video Repurposing from User Generated Content: {A} Large-scale Dataset
                  and Benchmark},
  journal      = {CoRR},
  volume       = {abs/2412.08879},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2412.08879},
  doi          = {10.48550/ARXIV.2412.08879},
  eprinttype   = {arXiv},
  eprint       = {2412.08879},
  timestamp    = {Mon, 20 Jan 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2412-08879.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (IJCV). The CoRR entry DBLP:journals/corr/abs-2210-01338 in this
% file has the same title and authors; presumably its preprint.
@article{DBLP:journals/ijcv/YangZGC23,
  author       = {Xu Yang and
                  Hanwang Zhang and
                  Chongyang Gao and
                  Jianfei Cai},
  title        = {Learning to Collocate Visual-Linguistic Neural Modules for Image Captioning},
  journal      = {Int. J. Comput. Vis.},
  volume       = {131},
  number       = {1},
  pages        = {82--100},
  year         = {2023},
  url          = {https://doi.org/10.1007/s11263-022-01692-8},
  doi          = {10.1007/S11263-022-01692-8},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ijcv/YangZGC23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (IEEE TPAMI) record exported from dblp.
@article{DBLP:journals/pami/YangZC23,
  author       = {Xu Yang and
                  Hanwang Zhang and
                  Jianfei Cai},
  title        = {Deconfounded Image Captioning: {A} Causal Retrospect},
  journal      = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume       = {45},
  number       = {11},
  pages        = {12996--13010},
  year         = {2023},
  url          = {https://doi.org/10.1109/TPAMI.2021.3121705},
  doi          = {10.1109/TPAMI.2021.3121705},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/pami/YangZC23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper (ACL 2023). The CoRR entry DBLP:journals/corr/abs-2305-02177 in
% this file has the same title but one differing author name; likely its preprint.
@inproceedings{DBLP:conf/acl/YangPWXYLHHLZ23,
  author       = {Xu Yang and
                  Jiawei Peng and
                  Zihua Wang and
                  Haiyang Xu and
                  Qinghao Ye and
                  Chenliang Li and
                  Songfang Huang and
                  Fei Huang and
                  Zhangzikang Li and
                  Yu Zhang},
  editor       = {Anna Rogers and
                  Jordan L. Boyd{-}Graber and
                  Naoaki Okazaki},
  title        = {Transforming Visual Scene Graphs to Image Captions},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {12427--12440},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.694},
  doi          = {10.18653/V1/2023.ACL-LONG.694},
  timestamp    = {Wed, 25 Jun 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/YangPWXYLHHLZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper (ICCV 2023). The CoRR entry DBLP:journals/corr/abs-2301-01953 in
% this file has the same title and authors; presumably its preprint.
@inproceedings{DBLP:conf/iccv/YangLXZYLYZHH23,
  author       = {Xu Yang and
                  Zhangzikang Li and
                  Haiyang Xu and
                  Hanwang Zhang and
                  Qinghao Ye and
                  Chenliang Li and
                  Ming Yan and
                  Yu Zhang and
                  Fei Huang and
                  Songfang Huang},
  title        = {Learning Trajectory-Word Alignments for Video-Language Tasks},
  booktitle    = {{IEEE/CVF} International Conference on Computer Vision, {ICCV} 2023,
                  Paris, France, October 1-6, 2023},
  pages        = {2504--2514},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/ICCV51070.2023.00237},
  doi          = {10.1109/ICCV51070.2023.00237},
  timestamp    = {Wed, 25 Jun 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iccv/YangLXZYLYZHH23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper (NeurIPS 2023); no DOI or pages in the record, only the proceedings URL.
% The CoRR entry DBLP:journals/corr/abs-2305-14800 in this file has the same title and authors.
@inproceedings{DBLP:conf/nips/YangWYC023,
  author       = {Xu Yang and
                  Yongliang Wu and
                  Mingzhuo Yang and
                  Haokun Chen and
                  Xin Geng},
  editor       = {Alice Oh and
                  Tristan Naumann and
                  Amir Globerson and
                  Kate Saenko and
                  Moritz Hardt and
                  Sergey Levine},
  title        = {Exploring Diverse In-Context Configurations for Image Captioning},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/804b5e300c9ed4e3ea3b073f186f4adc-Abstract-Conference.html},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/YangWYC023.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper (NeurIPS 2023); no DOI or pages in the record, only the proceedings URL.
@inproceedings{DBLP:conf/nips/YuanSXYGR23,
  author       = {Hua Yuan and
                  Yu Shi and
                  Ning Xu and
                  Xu Yang and
                  Xin Geng and
                  Yong Rui},
  editor       = {Alice Oh and
                  Tristan Naumann and
                  Amir Globerson and
                  Kate Saenko and
                  Moritz Hardt and
                  Sergey Levine},
  title        = {Learning From Biased Soft Labels},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/bad8ddaed5feb552f9e8f2e37c0531a1-Abstract-Conference.html},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/YuanSXYGR23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record. Same title and author list as the ICCV 2023 entry
% DBLP:conf/iccv/YangLXZYLYZHH23 in this file; presumably its preprint - cite only one.
@article{DBLP:journals/corr/abs-2301-01953,
  author       = {Xu Yang and
                  Zhangzikang Li and
                  Haiyang Xu and
                  Hanwang Zhang and
                  Qinghao Ye and
                  Chenliang Li and
                  Ming Yan and
                  Yu Zhang and
                  Fei Huang and
                  Songfang Huang},
  title        = {Learning Trajectory-Word Alignments for Video-Language Tasks},
  journal      = {CoRR},
  volume       = {abs/2301.01953},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2301.01953},
  doi          = {10.48550/ARXIV.2301.01953},
  eprinttype   = {arXiv},
  eprint       = {2301.01953},
  timestamp    = {Wed, 25 Jun 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2301-01953.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record exported from dblp.
@article{DBLP:journals/corr/abs-2301-01955,
  author       = {Zihua Wang and
                  Xu Yang and
                  Haiyang Xu and
                  Hanwang Zhang and
                  Chenliang Li and
                  Songfang Huang and
                  Fei Huang and
                  Yu Zhang},
  title        = {Adaptively Clustering Neighbor Elements for Image Captioning},
  journal      = {CoRR},
  volume       = {abs/2301.01955},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2301.01955},
  doi          = {10.48550/ARXIV.2301.01955},
  eprinttype   = {arXiv},
  eprint       = {2301.01955},
  timestamp    = {Wed, 25 Jun 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2301-01955.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record. Same title as the ACL 2023 entry
% DBLP:conf/acl/YangPWXYLHHLZ23 in this file (one author name differs); likely its preprint.
@article{DBLP:journals/corr/abs-2305-02177,
  author       = {Xu Yang and
                  Jiawei Peng and
                  Zihua Wang and
                  Haiyang Xu and
                  Qinghao Ye and
                  Chenliang Li and
                  Ming Yan and
                  Fei Huang and
                  Zhangzikang Li and
                  Yu Zhang},
  title        = {Transforming Visual Scene Graphs to Image Captions},
  journal      = {CoRR},
  volume       = {abs/2305.02177},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.02177},
  doi          = {10.48550/ARXIV.2305.02177},
  eprinttype   = {arXiv},
  eprint       = {2305.02177},
  timestamp    = {Wed, 25 Jun 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-02177.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record exported from dblp.
@article{DBLP:journals/corr/abs-2305-02279,
  author       = {Qiufeng Wang and
                  Xu Yang and
                  Shuxia Lin and
                  Xin Geng},
  title        = {Learngene: Inheriting Condensed Knowledge from the Ancestry Model
                  to Descendant Models},
  journal      = {CoRR},
  volume       = {abs/2305.02279},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.02279},
  doi          = {10.48550/ARXIV.2305.02279},
  eprinttype   = {arXiv},
  eprint       = {2305.02279},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-02279.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record. Same title and author list as the NeurIPS 2023 entry
% DBLP:conf/nips/YangWYC023 in this file; presumably its preprint - cite only one.
@article{DBLP:journals/corr/abs-2305-14800,
  author       = {Xu Yang and
                  Yongliang Wu and
                  Mingzhuo Yang and
                  Haokun Chen and
                  Xin Geng},
  title        = {Exploring Diverse In-Context Configurations for Image Captioning},
  journal      = {CoRR},
  volume       = {abs/2305.14800},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.14800},
  doi          = {10.48550/ARXIV.2305.14800},
  eprinttype   = {arXiv},
  eprint       = {2305.14800},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-14800.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record exported from dblp.
@article{DBLP:journals/corr/abs-2306-10225,
  author       = {Fu Feng and
                  Jing Wang and
                  Congzhi Zhang and
                  Wenqian Li and
                  Xu Yang and
                  Xin Geng},
  title        = {Genes in Intelligent Agents},
  journal      = {CoRR},
  volume       = {abs/2306.10225},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.10225},
  doi          = {10.48550/ARXIV.2306.10225},
  eprinttype   = {arXiv},
  eprint       = {2306.10225},
  timestamp    = {Sat, 31 May 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-10225.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record exported from dblp.
% The model name is braced in the title so sentence-casing styles keep its inner capital.
@article{DBLP:journals/corr/abs-2311-16483,
  author       = {Yucheng Han and
                  Chi Zhang and
                  Xin Chen and
                  Xu Yang and
                  Zhibin Wang and
                  Gang Yu and
                  Bin Fu and
                  Hanwang Zhang},
  title        = {{ChartLlama}: {A} Multimodal {LLM} for Chart Understanding and Generation},
  journal      = {CoRR},
  volume       = {abs/2311.16483},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2311.16483},
  doi          = {10.48550/ARXIV.2311.16483},
  eprinttype   = {arXiv},
  eprint       = {2311.16483},
  timestamp    = {Sat, 16 Aug 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2311-16483.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record exported from dblp.
@article{DBLP:journals/corr/abs-2312-00351,
  author       = {Haokun Chen and
                  Xu Yang and
                  Yuhang Huang and
                  Zihan Wu and
                  Jing Wang and
                  Xin Geng},
  title        = {Manipulating the Label Space for In-Context Classification},
  journal      = {CoRR},
  volume       = {abs/2312.00351},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.00351},
  doi          = {10.48550/ARXIV.2312.00351},
  eprinttype   = {arXiv},
  eprint       = {2312.00351},
  timestamp    = {Sat, 31 May 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-00351.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record exported from dblp.
@article{DBLP:journals/corr/abs-2312-01571,
  author       = {Li Li and
                  Jiawei Peng and
                  Huiyi Chen and
                  Chongyang Gao and
                  Xu Yang},
  title        = {How to Configure Good In-Context Sequence for Visual Question Answering},
  journal      = {CoRR},
  volume       = {abs/2312.01571},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.01571},
  doi          = {10.48550/ARXIV.2312.01571},
  eprinttype   = {arXiv},
  eprint       = {2312.01571},
  timestamp    = {Sat, 06 Sep 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-01571.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record exported from dblp.
@article{DBLP:journals/corr/abs-2312-05614,
  author       = {Shiyu Xia and
                  Miaosen Zhang and
                  Xu Yang and
                  Ruiming Chen and
                  Haokun Chen and
                  Xin Geng},
  title        = {Transformer as Linear Expansion of Learngene},
  journal      = {CoRR},
  volume       = {abs/2312.05614},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.05614},
  doi          = {10.48550/ARXIV.2312.05614},
  eprinttype   = {arXiv},
  eprint       = {2312.05614},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-05614.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record exported from dblp.
@article{DBLP:journals/corr/abs-2312-05743,
  author       = {Boyu Shi and
                  Shiyu Xia and
                  Xu Yang and
                  Haokun Chen and
                  Zhiqiang Kou and
                  Xin Geng},
  title        = {Building Variable-sized Models via Learngene Pool},
  journal      = {CoRR},
  volume       = {abs/2312.05743},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.05743},
  doi          = {10.48550/ARXIV.2312.05743},
  eprinttype   = {arXiv},
  eprint       = {2312.05743},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-05743.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record exported from dblp.
@article{DBLP:journals/corr/abs-2312-10104,
  author       = {Yingzhe Peng and
                  Xu Yang and
                  Haoxuan Ma and
                  Shuo Xu and
                  Chi Zhang and
                  Yucheng Han and
                  Hanwang Zhang},
  title        = {{ICD-LM:} Configuring Vision-Language In-Context Demonstrations by
                  Language Modeling},
  journal      = {CoRR},
  volume       = {abs/2312.10104},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.10104},
  doi          = {10.48550/ARXIV.2312.10104},
  eprinttype   = {arXiv},
  eprint       = {2312.10104},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-10104.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (IEEE TPAMI) record exported from dblp.
@article{DBLP:journals/pami/YangZC22,
  author       = {Xu Yang and
                  Hanwang Zhang and
                  Jianfei Cai},
  title        = {Auto-Encoding and Distilling Scene Graphs for Image Captioning},
  journal      = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume       = {44},
  number       = {5},
  pages        = {2313--2327},
  year         = {2022},
  url          = {https://doi.org/10.1109/TPAMI.2020.3042192},
  doi          = {10.1109/TPAMI.2020.3042192},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/pami/YangZC22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper (CVPR 2022) record exported from dblp.
@inproceedings{DBLP:conf/cvpr/LiuWY0YS022,
  author       = {Bing Liu and
                  Dong Wang and
                  Xu Yang and
                  Yong Zhou and
                  Rui Yao and
                  Zhiwen Shao and
                  Jiaqi Zhao},
  title        = {Show, Deconfound and Tell: Image Captioning with Causal Inference},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2022, New Orleans, LA, USA, June 18-24, 2022},
  pages        = {18020--18029},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/CVPR52688.2022.01751},
  doi          = {10.1109/CVPR52688.2022.01751},
  timestamp    = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/LiuWY0YS022.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper (ACM MM '22). The CoRR entry DBLP:journals/corr/abs-2107-12096 in
% this file has the same title and authors; presumably its preprint.
% Editor "Del Bimbo" is written in "Last, First" form so the capitalised particle
% stays part of the surname when BibTeX splits the name.
@inproceedings{DBLP:conf/mm/ChenYC022,
  author       = {Yuedong Chen and
                  Xu Yang and
                  Tat{-}Jen Cham and
                  Jianfei Cai},
  editor       = {Jo{\~{a}}o Magalh{\~{a}}es and
                  Del Bimbo, Alberto and
                  Shin'ichi Satoh and
                  Nicu Sebe and
                  Xavier Alameda{-}Pineda and
                  Qin Jin and
                  Vincent Oria and
                  Laura Toni},
  title        = {Towards Unbiased Visual Emotion Recognition via Causal Intervention},
  booktitle    = {{MM} '22: The 30th {ACM} International Conference on Multimedia, Lisboa,
                  Portugal, October 10 - 14, 2022},
  pages        = {60--69},
  publisher    = {{ACM}},
  year         = {2022},
  url          = {https://doi.org/10.1145/3503161.3547936},
  doi          = {10.1145/3503161.3547936},
  timestamp    = {Mon, 18 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/mm/ChenYC022.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record. Same title and author list as the IJCV entry
% DBLP:journals/ijcv/YangZGC23 in this file; presumably its preprint - cite only one.
@article{DBLP:journals/corr/abs-2210-01338,
  author       = {Xu Yang and
                  Hanwang Zhang and
                  Chongyang Gao and
                  Jianfei Cai},
  title        = {Learning to Collocate Visual-Linguistic Neural Modules for Image Captioning},
  journal      = {CoRR},
  volume       = {abs/2210.01338},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.01338},
  doi          = {10.48550/ARXIV.2210.01338},
  eprinttype   = {arXiv},
  eprint       = {2210.01338},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-01338.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (Pattern Recognition Letters); the record carries no issue number.
@article{DBLP:journals/prl/ZhangSMY21,
  author       = {Yu Zhang and
                  Xinyu Shi and
                  Siya Mi and
                  Xu Yang},
  title        = {Image captioning with transformer and knowledge graph},
  journal      = {Pattern Recognit. Lett.},
  volume       = {143},
  pages        = {43--49},
  year         = {2021},
  url          = {https://doi.org/10.1016/j.patrec.2020.12.020},
  doi          = {10.1016/J.PATREC.2020.12.020},
  timestamp    = {Mon, 06 Oct 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/prl/ZhangSMY21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper (CVPR 2021); url points at the open-access copy, doi at the IEEE version.
% The CoRR entry DBLP:journals/corr/abs-2103-03493 in this file has the same title and authors.
@inproceedings{DBLP:conf/cvpr/YangZQ021,
  author       = {Xu Yang and
                  Hanwang Zhang and
                  Guojun Qi and
                  Jianfei Cai},
  title        = {Causal Attention for Vision-Language Tasks},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2021, virtual, June 19-25, 2021},
  pages        = {9847--9857},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2021},
  url          = {https://openaccess.thecvf.com/content/CVPR2021/html/Yang\_Causal\_Attention\_for\_Vision-Language\_Tasks\_CVPR\_2021\_paper.html},
  doi          = {10.1109/CVPR46437.2021.00972},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/YangZQ021.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper (ICCV 2021). The CoRR entry DBLP:journals/corr/abs-2108-10568 in
% this file has the same title and authors; presumably its preprint.
@inproceedings{DBLP:conf/iccv/YangGZ021,
  author       = {Xu Yang and
                  Chongyang Gao and
                  Hanwang Zhang and
                  Jianfei Cai},
  title        = {Auto-Parsing Network for Image Captioning and Visual Question Answering},
  booktitle    = {2021 {IEEE/CVF} International Conference on Computer Vision, {ICCV}
                  2021, Montreal, QC, Canada, October 10-17, 2021},
  pages        = {2177--2187},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICCV48922.2021.00220},
  doi          = {10.1109/ICCV48922.2021.00220},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccv/YangGZ021.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record; no doi field, url is the arXiv abstract page.
% Same title and author list as the CVPR 2021 entry DBLP:conf/cvpr/YangZQ021 in this file.
@article{DBLP:journals/corr/abs-2103-03493,
  author       = {Xu Yang and
                  Hanwang Zhang and
                  Guojun Qi and
                  Jianfei Cai},
  title        = {Causal Attention for Vision-Language Tasks},
  journal      = {CoRR},
  volume       = {abs/2103.03493},
  year         = {2021},
  url          = {https://arxiv.org/abs/2103.03493},
  eprinttype   = {arXiv},
  eprint       = {2103.03493},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2103-03493.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record; no doi field, url is the arXiv abstract page.
% Same title and author list as the ACM MM '22 entry DBLP:conf/mm/ChenYC022 in this file.
@article{DBLP:journals/corr/abs-2107-12096,
  author       = {Yuedong Chen and
                  Xu Yang and
                  Tat{-}Jen Cham and
                  Jianfei Cai},
  title        = {Towards Unbiased Visual Emotion Recognition via Causal Intervention},
  journal      = {CoRR},
  volume       = {abs/2107.12096},
  year         = {2021},
  url          = {https://arxiv.org/abs/2107.12096},
  eprinttype   = {arXiv},
  eprint       = {2107.12096},
  timestamp    = {Mon, 18 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2107-12096.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record; no doi field, url is the arXiv abstract page.
% Same title and author list as the ICCV 2021 entry DBLP:conf/iccv/YangGZ021 in this file.
@article{DBLP:journals/corr/abs-2108-10568,
  author       = {Xu Yang and
                  Chongyang Gao and
                  Hanwang Zhang and
                  Jianfei Cai},
  title        = {Auto-Parsing Network for Image Captioning and Visual Question Answering},
  journal      = {CoRR},
  volume       = {abs/2108.10568},
  year         = {2021},
  url          = {https://arxiv.org/abs/2108.10568},
  eprinttype   = {arXiv},
  eprint       = {2108.10568},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2108-10568.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR) record; no doi field, url is the arXiv abstract page.
@article{DBLP:journals/corr/abs-2111-11029,
  author       = {Boyu Zhang and
                  Jiayuan Chen and
                  Yinfei Xu and
                  Hui Zhang and
                  Xu Yang and
                  Xin Geng},
  title        = {Auto-Encoding Score Distribution Regression for Action Quality Assessment},
  journal      = {CoRR},
  volume       = {abs/2111.11029},
  year         = {2021},
  url          = {https://arxiv.org/abs/2111.11029},
  eprinttype   = {arXiv},
  eprint       = {2111.11029},
  timestamp    = {Mon, 10 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2111-11029.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2020 proceedings paper (Lecture Notes in Computer Science vol. 12352, Part VII).
@inproceedings{DBLP:conf/eccv/CaiHWC0YLYZSLLM20,
  author       = {Yujun Cai and
                  Lin Huang and
                  Yiwei Wang and
                  Tat{-}Jen Cham and
                  Jianfei Cai and
                  Junsong Yuan and
                  Jun Liu and
                  Xu Yang and
                  Yiheng Zhu and
                  Xiaohui Shen and
                  Ding Liu and
                  Jing Liu and
                  Nadia Magnenat{-}Thalmann},
  editor       = {Andrea Vedaldi and
                  Horst Bischof and
                  Thomas Brox and
                  Jan{-}Michael Frahm},
  title        = {Learning Progressive Joint Propagation for Human Motion Prediction},
  booktitle    = {Computer Vision - {ECCV} 2020 - 16th European Conference, Glasgow,
                  UK, August 23-28, 2020, Proceedings, Part {VII}},
  series       = {Lecture Notes in Computer Science},
  volume       = {12352},
  pages        = {226--242},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-58571-6\_14},
  doi          = {10.1007/978-3-030-58571-6\_14},
  timestamp    = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eccv/CaiHWC0YLYZSLLM20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2020 proceedings paper (Lecture Notes in Computer Science vol. 12359, Part XIV).
% An arXiv record with the same title and authors is keyed DBLP:journals/corr/abs-2009-14352.
@inproceedings{DBLP:conf/eccv/ShiYGJ020,
  author       = {Xiangxi Shi and
                  Xu Yang and
                  Jiuxiang Gu and
                  Shafiq R. Joty and
                  Jianfei Cai},
  editor       = {Andrea Vedaldi and
                  Horst Bischof and
                  Thomas Brox and
                  Jan{-}Michael Frahm},
  title        = {Finding It at Another Side: {A} Viewpoint-Adapted Matching Encoder
                  for Change Captioning},
  booktitle    = {Computer Vision - {ECCV} 2020 - 16th European Conference, Glasgow,
                  UK, August 23-28, 2020, Proceedings, Part {XIV}},
  series       = {Lecture Notes in Computer Science},
  volume       = {12359},
  pages        = {574--590},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-58568-6\_34},
  doi          = {10.1007/978-3-030-58568-6\_34},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eccv/ShiYGJ020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACM Multimedia 2020 (MM '20) proceedings paper.
@inproceedings{DBLP:conf/mm/YangGZ020,
  author       = {Xu Yang and
                  Chongyang Gao and
                  Hanwang Zhang and
                  Jianfei Cai},
  editor       = {Chang Wen Chen and
                  Rita Cucchiara and
                  Xian{-}Sheng Hua and
                  Guo{-}Jun Qi and
                  Elisa Ricci and
                  Zhengyou Zhang and
                  Roger Zimmermann},
  title        = {Hierarchical Scene Graph Encoder-Decoder for Image Paragraph Captioning},
  booktitle    = {{MM} '20: The 28th {ACM} International Conference on Multimedia, Virtual
                  Event / Seattle, WA, USA, October 12-16, 2020},
  pages        = {4181--4189},
  publisher    = {{ACM}},
  year         = {2020},
  url          = {https://doi.org/10.1145/3394171.3413859},
  doi          = {10.1145/3394171.3413859},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/mm/YangGZ020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2003.03923, recorded by dblp under the CoRR journal.
@article{DBLP:journals/corr/abs-2003-03923,
  author       = {Xu Yang and
                  Hanwang Zhang and
                  Jianfei Cai},
  title        = {Deconfounded Image Captioning: {A} Causal Retrospect},
  journal      = {CoRR},
  volume       = {abs/2003.03923},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.03923},
  eprinttype   = {arXiv},
  eprint       = {2003.03923},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-03923.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2009.14352, recorded by dblp under the CoRR journal.
% An ECCV 2020 record with the same title and authors is keyed DBLP:conf/eccv/ShiYGJ020.
@article{DBLP:journals/corr/abs-2009-14352,
  author       = {Xiangxi Shi and
                  Xu Yang and
                  Jiuxiang Gu and
                  Shafiq R. Joty and
                  Jianfei Cai},
  title        = {Finding It at Another Side: {A} Viewpoint-Adapted Matching Encoder
                  for Change Captioning},
  journal      = {CoRR},
  volume       = {abs/2009.14352},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.14352},
  eprinttype   = {arXiv},
  eprint       = {2009.14352},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-14352.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2019 proceedings paper; url points at the CVF open-access page, doi at the IEEE record.
% An arXiv record with the same title and authors is keyed DBLP:journals/corr/abs-1812-02378.
@inproceedings{DBLP:conf/cvpr/YangTZC19,
  author       = {Xu Yang and
                  Kaihua Tang and
                  Hanwang Zhang and
                  Jianfei Cai},
  title        = {Auto-Encoding Scene Graphs for Image Captioning},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2019, Long Beach, CA, USA, June 16-20, 2019},
  pages        = {10685--10694},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2019},
  url          = {http://openaccess.thecvf.com/content\_CVPR\_2019/html/Yang\_Auto-Encoding\_Scene\_Graphs\_for\_Image\_Captioning\_CVPR\_2019\_paper.html},
  doi          = {10.1109/CVPR.2019.01094},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/YangTZC19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2019 proceedings paper.
% An arXiv record with the same title and authors is keyed DBLP:journals/corr/abs-1904-08608.
@inproceedings{DBLP:conf/iccv/YangZC19,
  author       = {Xu Yang and
                  Hanwang Zhang and
                  Jianfei Cai},
  title        = {Learning to Collocate Neural Modules for Image Captioning},
  booktitle    = {2019 {IEEE/CVF} International Conference on Computer Vision, {ICCV}
                  2019, Seoul, Korea (South), October 27 - November 2, 2019},
  pages        = {4249--4259},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICCV.2019.00435},
  doi          = {10.1109/ICCV.2019.00435},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccv/YangZC19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2019 proceedings paper.
% An arXiv record with the same title and authors is keyed DBLP:journals/corr/abs-1903-10658.
@inproceedings{DBLP:conf/iccv/GuJCZYW19,
  author       = {Jiuxiang Gu and
                  Shafiq R. Joty and
                  Jianfei Cai and
                  Handong Zhao and
                  Xu Yang and
                  Gang Wang},
  title        = {Unpaired Image Captioning via Scene Graph Alignments},
  booktitle    = {2019 {IEEE/CVF} International Conference on Computer Vision, {ICCV}
                  2019, Seoul, Korea (South), October 27 - November 2, 2019},
  pages        = {10322--10331},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICCV.2019.01042},
  doi          = {10.1109/ICCV.2019.01042},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccv/GuJCZYW19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1903.10658, recorded by dblp under the CoRR journal.
% An ICCV 2019 record with the same title and authors is keyed DBLP:conf/iccv/GuJCZYW19.
@article{DBLP:journals/corr/abs-1903-10658,
  author       = {Jiuxiang Gu and
                  Shafiq R. Joty and
                  Jianfei Cai and
                  Handong Zhao and
                  Xu Yang and
                  Gang Wang},
  title        = {Unpaired Image Captioning via Scene Graph Alignments},
  journal      = {CoRR},
  volume       = {abs/1903.10658},
  year         = {2019},
  url          = {https://arxiv.org/abs/1903.10658},
  eprinttype   = {arXiv},
  eprint       = {1903.10658},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-10658.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1904.08608, recorded by dblp under the CoRR journal.
% An ICCV 2019 record with the same title and authors is keyed DBLP:conf/iccv/YangZC19.
@article{DBLP:journals/corr/abs-1904-08608,
  author       = {Xu Yang and
                  Hanwang Zhang and
                  Jianfei Cai},
  title        = {Learning to Collocate Neural Modules for Image Captioning},
  journal      = {CoRR},
  volume       = {abs/1904.08608},
  year         = {2019},
  url          = {https://arxiv.org/abs/1904.08608},
  eprinttype   = {arXiv},
  eprint       = {1904.08608},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-08608.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2018 proceedings paper (Lecture Notes in Computer Science vol. 11216, Part XII).
% An arXiv record with the same title and authors is keyed DBLP:journals/corr/abs-1808-00171.
@inproceedings{DBLP:conf/eccv/YangZC18,
  author       = {Xu Yang and
                  Hanwang Zhang and
                  Jianfei Cai},
  editor       = {Vittorio Ferrari and
                  Martial Hebert and
                  Cristian Sminchisescu and
                  Yair Weiss},
  title        = {Shuffle-Then-Assemble: Learning Object-Agnostic Visual Relationship
                  Features},
  booktitle    = {Computer Vision - {ECCV} 2018 - 15th European Conference, Munich,
                  Germany, September 8-14, 2018, Proceedings, Part {XII}},
  series       = {Lecture Notes in Computer Science},
  volume       = {11216},
  pages        = {38--54},
  publisher    = {Springer},
  year         = {2018},
  url          = {https://doi.org/10.1007/978-3-030-01258-8\_3},
  doi          = {10.1007/978-3-030-01258-8\_3},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eccv/YangZC18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1808.00171, recorded by dblp under the CoRR journal.
% An ECCV 2018 record with the same title and authors is keyed DBLP:conf/eccv/YangZC18.
@article{DBLP:journals/corr/abs-1808-00171,
  author       = {Xu Yang and
                  Hanwang Zhang and
                  Jianfei Cai},
  title        = {Shuffle-Then-Assemble: Learning Object-Agnostic Visual Relationship
                  Features},
  journal      = {CoRR},
  volume       = {abs/1808.00171},
  year         = {2018},
  url          = {https://arxiv.org/abs/1808.00171},
  eprinttype   = {arXiv},
  eprint       = {1808.00171},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-00171.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1812.02378, recorded by dblp under the CoRR journal.
% A CVPR 2019 record with the same title and authors is keyed DBLP:conf/cvpr/YangTZC19.
@article{DBLP:journals/corr/abs-1812-02378,
  author       = {Xu Yang and
                  Kaihua Tang and
                  Hanwang Zhang and
                  Jianfei Cai},
  title        = {Auto-Encoding Scene Graphs for Image Captioning},
  journal      = {CoRR},
  volume       = {abs/1812.02378},
  year         = {2018},
  url          = {https://arxiv.org/abs/1812.02378},
  eprinttype   = {arXiv},
  eprint       = {1812.02378},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1812-02378.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR Workshops 2016 proceedings paper.
@inproceedings{DBLP:conf/cvpr/HuoYXZHLG16,
  author       = {Zeng{-}Wei Huo and
                  Xu Yang and
                  Chao Xing and
                  Ying Zhou and
                  Peng Hou and
                  Jiaqi Lv and
                  Xin Geng},
  title        = {Deep Age Distribution Learning for Apparent Age Estimation},
  booktitle    = {2016 {IEEE} Conference on Computer Vision and Pattern Recognition
                  Workshops, {CVPR} Workshops 2016, Las Vegas, NV, USA, June 26 - July
                  1, 2016},
  pages        = {722--729},
  publisher    = {{IEEE} Computer Society},
  year         = {2016},
  url          = {https://doi.org/10.1109/CVPRW.2016.95},
  doi          = {10.1109/CVPRW.2016.95},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/HuoYXZHLG16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IJCAI 2016 proceedings paper; the record carries no doi, only the ijcai.org abstract URL.
@inproceedings{DBLP:conf/ijcai/YangGZ16,
  author       = {Xu Yang and
                  Xin Geng and
                  Deyu Zhou},
  editor       = {Subbarao Kambhampati},
  title        = {Sparsity Conditional Energy Label Distribution Learning for Age Estimation},
  booktitle    = {Proceedings of the Twenty-Fifth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2016, New York, NY, USA, 9-15 July
                  2016},
  pages        = {2259--2265},
  publisher    = {{IJCAI/AAAI} Press},
  year         = {2016},
  url          = {http://www.ijcai.org/Abstract/16/322},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcai/YangGZ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICCV Workshops 2015 proceedings paper.
@inproceedings{DBLP:conf/iccvw/YangGXHWZWG15,
  author       = {Xu Yang and
                  Bin{-}Bin Gao and
                  Chao Xing and
                  Zeng{-}Wei Huo and
                  Xiu{-}Shen Wei and
                  Ying Zhou and
                  Jianxin Wu and
                  Xin Geng},
  title        = {Deep Label Distribution Learning for Apparent Age Estimation},
  booktitle    = {2015 {IEEE} International Conference on Computer Vision Workshop,
                  {ICCV} Workshops 2015, Santiago, Chile, December 7-13, 2015},
  pages        = {344--350},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/ICCVW.2015.53},
  doi          = {10.1109/ICCVW.2015.53},
  timestamp    = {Fri, 15 Nov 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccvw/YangGXHWZWG15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}