-
Notifications
You must be signed in to change notification settings - Fork 1
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
1 parent
e760cfa
commit 107defd
Showing
32 changed files
with
796 additions
and
105 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,33 @@ | ||
+++
# Publication type codes, referenced by `publication_types` below:
# 0 -> 'Forthcoming',
# 1 -> 'Preprint',
# 2 -> 'Journal',
# 3 -> 'Conference Proceedings',
# 4 -> 'Book chapter',
# 5 -> 'Thesis'

title = "Whodunnit? Inferring what happened from multimodal evidence"
date = "2024-05-13"
# `\\*` is a TOML-escaped backslash followed by `*`, so the stored value ends
# in `\*` (presumably so Markdown renders a literal asterisk -- confirm
# against the theme's author template).
authors = ["S. A. Wu\\*","E. Brockbank\\*","H. Cha","J. Fränken","E. Jin","Z. Huang","W. Liu","R. Zhang","J. Wu","T. Gerstenberg"]
# "3" selects 'Conference Proceedings' from the legend at the top.
publication_types = ["3"]
publication_short = "_Proceedings of the 46th Annual Conference of the Cognitive Science Society_"
publication = "Wu*, S. A., Brockbank*, E., Cha, H., Fränken, J., Jin, E., Huang, Z., Liu, W., Zhang, R., Wu, J., Gerstenberg, T. (2024). Whodunnit? Inferring what happened from multimodal evidence. In _Proceedings of the 46th Annual Conference of the Cognitive Science Society_."
abstract = "Humans are remarkably adept at inferring the causes of events in their environment; doing so often requires incorporating information from multiple sensory modalities. For instance, if a car slows down in front of us, inferences about why they did so are rapidly revised if we also hear sirens in the distance. Here, we investigate the ability to reconstruct others' actions and events from the past by integrating multimodal information. Participants were asked to infer which of two agents performed an action in a household setting given either visual evidence, auditory evidence, or both. We develop a computational model that makes inferences by generating multimodal simulations, and also evaluate our task on a large language model (GPT-4) and a large multimodal model (GPT-4V). We find that humans are relatively accurate overall and perform best when given multimodal evidence. GPT-4 and GPT-4V performance comes close overall, but is very weakly correlated with participants across individual trials. Meanwhile, the simulation model captures the pattern of human responses well. Multimodal event reconstruction represents a challenge for current AI systems, and frameworks that draw on the cognitive processes underlying people's ability to reconstruct events offer a promising avenue forward."
image_preview = ""
selected = false
projects = []
# Link fields: only the PDF and the custom GitHub link are populated; the
# remaining `url_*` keys are intentionally left as empty strings.
url_pdf = "papers/wu2024whodunnit.pdf"
url_preprint = ""
url_code = ""
url_dataset = ""
url_slides = ""
url_video = ""
url_poster = ""
url_source = ""
url_custom = [{name = "Github", url = "https://github.com/cicl-stanford/whodunnit_multimodal_inference"}]
math = true
highlight = true

[header]
# Header image is currently disabled; uncomment to enable.
# image = "publications/wu2024whodunnit.png"
caption = ""
+++
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Binary file not shown.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.