% arXiv preprint, identified by its DataCite DOI. The citation key `misc` is
% kept unchanged so that existing \cite{misc} commands continue to resolve.
@misc{misc,
  author = {Que, S. and Ragni, A.},
  title  = {{VisualSpeech}: Enhancing Prosody Modeling in {TTS} Using Video},
  year   = {2025},
  month  = aug,
  doi    = {10.48550/arxiv.2501.19258},
  url    = {https://doi.org/10.48550/arxiv.2501.19258},
  note   = {Accessed on 2026/06/28},
}