% Conference paper record; url and doi both point at ACL Anthology item 2024.emnlp-main.668.
% NOTE(review): address looks like the conference venue rather than the publisher's city -- confirm before reusing under a style that prints it next to the publisher.
@inproceedings{zhang-etal-2024-multi-level,
  author    = {Zhang, Liang and Yang, Zhen and Fu, Biao and Lu, Ziyao and Shao, Liangying and Liu, Shiyu and Meng, Fandong and Zhou, Jie and Wang, Xiaoli and Su, Jinsong},
  title     = {Multi-Level Cross-Modal Alignment for Speech Relation Extraction},
  editor    = {Al-Onaizan, Yaser and Bansal, Mohit and Chen, Yun-Nung},
  booktitle = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
  publisher = {Association for Computational Linguistics},
  address   = {Miami, Florida, USA},
  month     = nov,
  year      = {2024},
  pages     = {11975--11986},
  doi       = {10.18653/v1/2024.emnlp-main.668},
  url       = {https://aclanthology.org/2024.emnlp-main.668/},
}