% arXiv preprint; the eprint identifier below is taken from the arXiv-issued DOI.
% The citation key stays "misc" so that existing \cite commands keep resolving.
% NOTE(review): consider a descriptive key (e.g. que2025visualspeech) once all citing documents are updated.
% NOTE(review): given names are stored as initials only, as in the original export; expand them if the full names are confirmed.
% The empty url field from the export was dropped; the DOI is the persistent locator.
@misc{misc,
  author        = {Que, S. and Ragni, A.},
  title         = {{VisualSpeech}: Enhancing Prosody Modeling in {TTS} Using Video},
  year          = {2025},
  month         = aug,
  eprint        = {2501.19258},
  archiveprefix = {arXiv},
  doi           = {10.48550/arxiv.2501.19258},
  note          = {Accessed on 2025/11/01},
}