Bose, Digbalay; Hebbar, Rajat; Feng, Tiantian; Somandepalli, Krishna; Xu, Anfeng; Narayanan, Shrikanth
MM-AU: Towards Multimodal Understanding of Advertisement Videos Conference
ACM Multimedia, 2023.
BibTeX | Tags: advertisements, computational media understanding, content analysis, multimedia understanding, multimodal
% MM-AU conference paper (Bose et al., 2023).
% The citation key looks like an export placeholder; it is kept unchanged so existing citations still resolve.
% The venue name is stored in booktitle (it was previously in the publisher field).
@inproceedings{nokey,
  author    = {Digbalay Bose and Rajat Hebbar and Tiantian Feng and Krishna Somandepalli and Anfeng Xu and Shrikanth Narayanan},
  title     = {{MM-AU}: Towards Multimodal Understanding of Advertisement Videos},
  booktitle = {ACM Multimedia},
  year      = {2023},
  date      = {2023-10-29},
  urldate   = {2023-10-29},
  keywords  = {advertisements, computational media understanding, content analysis, multimedia understanding, multimodal},
  pubstate  = {published},
  tppubtype = {conference}
}
Baruah, Sabyasachee; Narayanan, Shrikanth
Character Coreference Resolution in Movie Screenplays Inproceedings
In: Findings of the Association for Computational Linguistics: ACL 2023, pp. 10300–10313, 2023.
Abstract | BibTeX | Tags: content analysis, coreference resolution, multimedia understanding
% Findings of ACL 2023 paper on character coreference resolution in movie screenplays (Baruah and Narayanan).
% Field values are unchanged; the abstract keeps its original embedded line break.
@inproceedings{baruah2023character,
  author    = {Sabyasachee Baruah and Shrikanth Narayanan},
  title     = {Character Coreference Resolution in Movie Screenplays},
  booktitle = {Findings of the Association for Computational Linguistics: ACL 2023},
  pages     = {10300--10313},
  year      = {2023},
  date      = {2023-01-01},
  urldate   = {2023-01-01},
  abstract  = {Movie screenplays have a distinct narrative structure. It segments the story into scenes containing interleaving descriptions of actions, locations, and character dialogues. A typical screenplay spans several scenes and can include long-range dependencies between characters and events. A holistic document-level understanding of the screenplay requires several natural language processing capabilities, such as parsing, character identification, coreference resolution, action recognition, summarization, and attribute discovery. In this work, we develop scalable and robust methods to extract the structural information and character coreference clusters from full-length movie screenplays. We curate two datasets for screenplay parsing and character coreference— MovieParse and MovieCoref, respectively. We build a robust screenplay parser to handle inconsistencies in screenplay formatting and
leverage the parsed output to link co-referring character mentions. Our coreference models can scale to long screenplay documents without drastically increasing their memory footprints.},
  keywords  = {content analysis, coreference resolution, multimedia understanding},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Guha, Tanaya; Huang, Che-Wei; Kumar, Naveen; Zhu, Yan; Narayanan, Shrikanth S
Gender Representation in Cinematic Content: A Multimodal Approach Inproceedings
In: Proceedings of the 2015 ACM on International Conference on Multimodal Interaction, pp. 31–34, Association for Computing Machinery, Seattle, Washington, USA, 2015, ISBN: 9781450339124.
Abstract | Links | BibTeX | Tags: content analysis, gender representation, movie, multimodal
% ICMI 2015 paper on gender representation in films (Guha et al.).
% The page range uses the BibTeX double-hyphen form instead of a literal Unicode en dash.
@inproceedings{10.1145/2818346.2820778,
title = {Gender Representation in Cinematic Content: A Multimodal Approach},
author = {Tanaya Guha and Che-Wei Huang and Naveen Kumar and Yan Zhu and Shrikanth S Narayanan},
url = {https://doi.org/10.1145/2818346.2820778},
doi = {10.1145/2818346.2820778},
isbn = {9781450339124},
year = {2015},
date = {2015-01-01},
booktitle = {Proceedings of the 2015 ACM on International Conference on Multimodal Interaction},
pages = {31--34},
publisher = {Association for Computing Machinery},
address = {Seattle, Washington, USA},
series = {ICMI '15},
abstract = {The goal of this paper is to enable an objective understanding of gender portrayals
in popular films and media through multimodal content analysis. An automated system
for analyzing gender representation in terms of screen presence and speaking time
is developed. First, we perform independent processing of the video and the audio
content to estimate gender distribution of screen presence at shot level, and of speech
at utterance level. A measure of the movie's excitement or intensity is computed using
audiovisual features for every scene. This measure is used as a weighting function
to combine the gender-based screen/speaking time information at shot/utterance level
to compute gender representation for the entire movie. Detailed results and analyses
are presented on seventeen full length Hollywood movies.},
keywords = {content analysis, gender representation, movie, multimodal},
pubstate = {published},
tppubtype = {inproceedings}
}