MUGEN: A Playground for Video-Audio-Text Multimodal Understanding and GENeration
Thomas Hayes*, Songyang Zhang*, Xi Yin, Guan Pang, Sasha Sheng, Harry Yang, Songwei Ge, Qiyuan Hu, Devi Parikh
arXiv
[Project Page]
[PDF]
[Code]
[Bibtex]
@article{hayes2022mugen,
  author        = {Hayes, Thomas and Zhang, Songyang and Yin, Xi and Pang, Guan and Sheng, Sasha and Yang, Harry and Ge, Songwei and Hu, Qiyuan and Parikh, Devi},
  title         = {{MUGEN}: A Playground for Video-Audio-Text Multimodal Understanding and {GENeration}},
  journal       = {arXiv preprint arXiv:2204.08058},
  eprint        = {2204.08058},
  archiveprefix = {arXiv},
  year          = {2022},
}
* equal contribution, ordered alphabetically
Instance-wise or Class-wise? A Tale of Neighbor Shapley for Concept-based Explanation
Jiahui Li, Kun Kuan, Lin Li, Long Chen, Songyang Zhang, Jian Shao, Jun Xiao
ACMMM 2021
[PDF]
[Bibtex]
@inproceedings{li2021instance,
  author    = {Li, Jiahui and Kuan, Kun and Li, Lin and Chen, Long and Zhang, Songyang and Shao, Jian and Xiao, Jun},
  title     = {Instance-wise or Class-wise? A Tale of Neighbor {Shapley} for Concept-based Explanation},
  booktitle = {ACMMM},
  year      = {2021},
}
SAT: 2D Semantics Assisted Training for 3D Visual Grounding
Zhengyuan Yang, Songyang Zhang, Liwei Wang, Jiebo Luo
ICCV 2021 [Oral]
[PDF]
[Code]
[Bibtex]
@inproceedings{yang2021sat,
  author    = {Yang, Zhengyuan and Zhang, Songyang and Wang, Liwei and Luo, Jiebo},
  title     = {{SAT}: {2D} Semantics Assisted Training for {3D} Visual Grounding},
  booktitle = {ICCV},
  year      = {2021},
}
Video-aided Unsupervised Grammar Induction
Songyang Zhang, Linfeng Song, Lifeng Jin, Kun Xu, Dong Yu, Jiebo Luo
NAACL 2021 [Best Long Paper]
[PDF]
[Press]
[Code]
[Video (English)]
[Video (Chinese)]
[Bibtex]
@inproceedings{zhang2021video,
  title     = {Video-aided Unsupervised Grammar Induction},
  author    = {Zhang, Songyang and Song, Linfeng and Jin, Lifeng and Xu, Kun and Yu, Dong and Luo, Jiebo},
  year      = {2021},
  booktitle = {NAACL},
}
Boundary Proposal Network for Two-Stage Natural Language Video Localization
Shaoning Xiao, Long Chen, Songyang Zhang, Wei Ji, Jian Shao, Lu Ye, Jun Xiao
AAAI 2021
[PDF]
[Bibtex]
@inproceedings{xiao2021boundary,
  author    = {Xiao, Shaoning and Chen, Long and Zhang, Songyang and Ji, Wei and Shao, Jian and Ye, Lu and Xiao, Jun},
  title     = {Boundary Proposal Network for Two-Stage Natural Language Video Localization},
  year      = {2021},
  booktitle = {AAAI},
}
Content-based Analysis of the Cultural Differences between TikTok and Douyin
Li Sun, Haoqi Zhang, Songyang Zhang, Jiebo Luo
IEEE Big Data 2020
[PDF]
[Video]
[Bibtex]
@inproceedings{sun2020content,
  author    = {Sun, Li and Zhang, Haoqi and Zhang, Songyang and Luo, Jiebo},
  title     = {Content-based Analysis of the Cultural Differences between {TikTok} and {Douyin}},
  booktitle = {IEEE Big Data},
  year      = {2020},
}
Global Image Sentiment Transfer
Jie An, Tianlang Chen, Songyang Zhang, Jiebo Luo
ICPR 2020
[PDF]
[Video]
[Press]
[Bibtex]
@inproceedings{an2020global,
  author    = {An, Jie and Chen, Tianlang and Zhang, Songyang and Luo, Jiebo},
  title     = {Global Image Sentiment Transfer},
  year      = {2020},
  booktitle = {ICPR},
}
Mi YouTube es Su YouTube? Analyzing the Cultures using YouTube Thumbnails of Popular Videos
Songyang Zhang, Tolga Aktas, Jiebo Luo
IEEE Big Data 2021
[PDF]
[Bibtex]
@inproceedings{zhang2021mi,
  author    = {Zhang, Songyang and Aktas, Tolga and Luo, Jiebo},
  title     = {Mi {YouTube} es Su {YouTube}? Analyzing the Cultures using {YouTube} Thumbnails of Popular Videos},
  booktitle = {IEEE Big Data},
  year      = {2021},
}
Learning 2D Temporal Adjacent Networks for Moment Localization with Natural Language
Songyang Zhang, Houwen Peng, Jianlong Fu, Jiebo Luo
AAAI 2020
[PDF]
[Code]
[Press]
[Bibtex]
@inproceedings{2DTAN_2020_AAAI,
  author    = {Zhang, Songyang and Peng, Houwen and Fu, Jianlong and Luo, Jiebo},
  title     = {Learning {2D} Temporal Adjacent Networks for Moment Localization with Natural Language},
  booktitle = {AAAI},
  year      = {2020},
}
Learning Sparse 2D Temporal Adjacent Networks for Temporal Action Localization
Songyang Zhang, Houwen Peng, Le Yang, Jianlong Fu, Jiebo Luo
Technical Report, HACS Temporal Action Localization Challenge at ICCV'19 [Winner]
[PDF]
[Bibtex]
@article{zhang2019learning,
  author        = {Zhang, Songyang and Peng, Houwen and Yang, Le and Fu, Jianlong and Luo, Jiebo},
  title         = {Learning Sparse {2D} Temporal Adjacent Networks for Temporal Action Localization},
  journal       = {arXiv preprint arXiv:1912.03612},
  eprint        = {1912.03612},
  archiveprefix = {arXiv},
  year          = {2019},
}
Multi-Scale 2D Temporal Adjacency Networks for Moment Localization with Natural Language
Songyang Zhang, Houwen Peng, Jianlong Fu, Yijuan Lu, Jiebo Luo
TPAMI 2021
[PDF]
[Code]
[Bibtex]
@article{zhang2020multi,
  author  = {Zhang, Songyang and Peng, Houwen and Fu, Jianlong and Lu, Yijuan and Luo, Jiebo},
  title   = {Multi-Scale {2D} Temporal Adjacency Networks for Moment Localization with Natural Language},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2021},
}
Exploiting Temporal Relationships in Video Moment Localization with Natural Language
Songyang Zhang, Jinsong Su, Jiebo Luo
ACMMM 2019
[PDF]
[Code]
[Bibtex]
@inproceedings{zhang2019exploiting,
  author    = {Zhang, Songyang and Su, Jinsong and Luo, Jiebo},
  title     = {Exploiting Temporal Relationships in Video Moment Localization with Natural Language},
  booktitle = {ACMMM},
  year      = {2019},
}
On Geometric Features for Skeleton-Based Action Recognition Using Multilayer LSTM Networks
Songyang Zhang, Xiaoming Liu, Jun Xiao
WACV 2017
[PDF]
[Code]
[Bibtex]
@inproceedings{Zhang_2017_geometric,
  author    = {Zhang, Songyang and Liu, Xiaoming and Xiao, Jun},
  title     = {On Geometric Features for Skeleton-Based Action Recognition Using Multilayer {LSTM} Networks},
  booktitle = {WACV},
  year      = {2017},
}
Fusing Geometric Features for Skeleton-Based Action Recognition using Multilayer LSTM Networks
Songyang Zhang, Yang Yang, Jun Xiao, Xiaoming Liu, Yi Yang, Di Xie, Yueting Zhuang
TMM 2018
[PDF]
[Bibtex]
@article{zhang2018fusing,
  author    = {Zhang, Songyang and Yang, Yang and Xiao, Jun and Liu, Xiaoming and Yang, Yi and Xie, Di and Zhuang, Yueting},
  title     = {Fusing Geometric Features for Skeleton-Based Action Recognition using Multilayer {LSTM} Networks},
  journal   = {IEEE Transactions on Multimedia},
  volume    = {20},
  number    = {9},
  pages     = {2330--2343},
  year      = {2018},
  publisher = {IEEE},
}
Robocup 3D Simulation
Core member of SEU-Jolly team
Robocup China Open 2014 [Champion]
Robocup 2014 [Quarter-finals]
Facebook AI Research (FAIR), Menlo Park, CA
Jan 2022 - Aug 2022. Mentor: Xi Yin
Project: Multimodal Generation
Tencent AI Lab, Bellevue, WA
Sep 2021 - Dec 2021. Mentors: Linfeng Song, Lifeng Jin, Kun Xu
Project: Unsupervised Grammar Induction
Microsoft, Redmond, WA
May 2021 - Aug 2021. Mentors: Quanzeng You, Jiang Wang
Project: Moment Localization with Natural Language
Tencent AI Lab, Bellevue, WA
May 2020 - Aug 2020. Mentors: Linfeng Song, Lifeng Jin, Kun Xu
Project: Unsupervised Grammar Induction
Microsoft Research Asia (MSRA), Beijing, China
May 2019 - Aug 2019. Mentors: Houwen Peng, Jianlong Fu
Project: Moment Localization with Natural Language
Tencent AI Lab, Shenzhen, China
Mar 2018 - Aug 2018. Mentors: Lin Ma, Linchao Bao
Project: Temporal Action Localization