About Me

Hang Zhang

I am Hang Zhang (张航), currently Head of the Foundation Model Team at XPeng, where I lead the development of next-generation autonomous driving systems using Vision-Language-Action (VLA) foundation models for L3 and L4 production vehicles. Previously, I was a Senior Staff Applied Research Scientist at Cruise, leading efforts in detection, segmentation, and perception model consolidation. Before Cruise, I was a Research Scientist at Meta, where I led the development of a scalable neural architecture optimization platform that supports AI models on Instagram, Portal, and VR headsets for tasks such as person understanding, AR/VR rendering, and ads ranking. Earlier in my career, I was a Senior Applied Scientist at Amazon AI, working on deep learning, computer vision, and the MXNet framework. During that time, we developed the ResNeSt model, which achieved state-of-the-art results on multiple vision benchmarks. Beyond my work, I am also enthusiastic about contributing to open-source projects, including the D2Go Toolkit, PyTorch Encoding Toolkit, AutoGluon Toolkit, GluonCV Toolkit, and Apache MXNet. My research has been cited more than 10,000 times on Google Scholar, and my open-source contributions have received more than 10,000 stars on GitHub.


Selected Publications

li21

FBNetV5: Neural Architecture Search for Multiple Tasks in One Run
Bichen Wu, Chaojian Li, Hang Zhang, Xiaoliang Dai, Peizhao Zhang, Matthew Yu, Jialiang Wang, Yingyan Lin, Peter Vajda
arXiv, 11/2021

paper abstract bibtex

% FBNetV5 arXiv preprint. The arXiv identifier is stored in the eprint fields
% rather than in a journal field; the citation key is unchanged.
@misc{wu2021fbnetv5,
  author        = {Wu, Bichen and Li, Chaojian and Zhang, Hang and Dai, Xiaoliang and Zhang, Peizhao and Yu, Matthew and Wang, Jialiang and Lin, Yingyan and Vajda, Peter},
  title         = {{FBNetV5}: Neural Architecture Search for Multiple Tasks in One Run},
  year          = {2021},
  eprint        = {2111.10007},
  archiveprefix = {arXiv}
}
    

zhang20

ResNeSt: Split-Attention Networks
Hang Zhang, Chongruo Wu, Zhongyue Zhang, Yi Zhu, Haibin Lin, Zhi Zhang, Yue Sun, Tong He, Jonas Mueller, R. Manmatha, Mu Li, Alex Smola
IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), 2022
arXiv, 04/2020

paper abstract bibtex slides code

% ResNeSt, CVPR 2022 Workshops. Month uses the predefined macro, the page range
% uses an en-dash, and case-sensitive names are brace-protected.
@InProceedings{Zhang_2022_CVPR,
    author    = {Zhang, Hang and Wu, Chongruo and Zhang, Zhongyue and Zhu, Yi and Lin, Haibin and Zhang, Zhi and Sun, Yue and He, Tong and Mueller, Jonas and Manmatha, R. and Li, Mu and Smola, Alexander},
    title     = {{ResNeSt}: Split-Attention Networks},
    booktitle = {Proceedings of the {IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR}) Workshops},
    month     = jun,
    year      = {2022},
    pages     = {2736--2746}
}
    

zhang19

Co-occurrent Features in Semantic Segmentation
Hang Zhang, Han Zhang, Chenguang Wang, Junyuan Xie
IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2019

paper abstract bibtex

% Co-occurrent Features, CVPR 2019. Author names are given in the unambiguous
% "Last, First" form; venue acronyms are brace-protected.
@InProceedings{Zhang_2019_CVPR,
  author    = {Zhang, Hang and Zhang, Han and Wang, Chenguang and Xie, Junyuan},
  title     = {Co-occurrent Features in Semantic Segmentation},
  booktitle = {The {IEEE} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  year      = {2019}
}
    

xie19

Bag of Tricks for Image Classification with Convolutional Neural Networks
Tong He, Zhi Zhang, Hang Zhang, Zhongyue Zhang, Junyuan Xie, Mu Li
IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2019

paper abstract bibtex code

% Bag of Tricks, CVPR 2019. Title and year follow the published CVPR 2019 record
% listed with this entry. The legacy citation key is kept so that existing
% citations continue to resolve.
@InProceedings{Xie2018bags,
  author    = {He, Tong and Zhang, Zhi and Zhang, Hang and Zhang, Zhongyue and Xie, Junyuan and Li, Mu},
  title     = {Bag of Tricks for Image Classification with Convolutional Neural Networks},
  booktitle = {The {IEEE} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  year      = {2019}
}
    

zhang18

Context Encoding for Semantic Segmentation
Hang Zhang, Kristin Dana, Jianping Shi, Zhongyue Zhang, Xiaogang Wang, Ambrish Tyagi, Amit Agrawal
IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2018 Oral (70/3309=2.1%)

paper abstract bibtex code talk slides

% Context Encoding, CVPR 2018. Month uses the predefined macro so styles can
% localise or abbreviate it; venue acronyms are brace-protected.
@InProceedings{Zhang_2018_CVPR,
  author    = {Zhang, Hang and Dana, Kristin and Shi, Jianping and Zhang, Zhongyue and Wang, Xiaogang and Tyagi, Ambrish and Agrawal, Amit},
  title     = {Context Encoding for Semantic Segmentation},
  booktitle = {The {IEEE} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jun,
  year      = {2018}
}
    

zhang17

Multi-style Generative Network for Real-time Transfer
Hang Zhang, Kristin Dana
European Conference on Computer Vision Workshops (ECCVW), 2018
arXiv, 03/2017

paper abstract bibtex code video project poster

% Multi-style Generative Network arXiv preprint. The arXiv identifier is stored
% in the eprint fields rather than in a journal field; the key is unchanged.
@misc{zhang2017multistyle,
  author        = {Zhang, Hang and Dana, Kristin},
  title         = {Multi-style Generative Network for Real-time Transfer},
  year          = {2017},
  eprint        = {1703.06953},
  archiveprefix = {arXiv}
}
    

zhang17

Deep TEN: Texture Encoding Network
Hang Zhang, Jia Xue, Kristin Dana
IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2017

paper abstract bibtex code blog poster slides

% Deep TEN, CVPR 2017. The acronym TEN is brace-protected so sentence-casing
% styles do not lowercase it; month uses the predefined macro.
@InProceedings{Zhang_2017_CVPR,
  author    = {Zhang, Hang and Xue, Jia and Dana, Kristin},
  title     = {Deep {TEN}: Texture Encoding Network},
  booktitle = {The {IEEE} Conference on Computer Vision and Pattern Recognition ({CVPR})},
  month     = jul,
  year      = {2017}
}
    


HTML Counter unique visitors since May 2014
sitemap sitemap