This bibliography is extracted from various primary sources using automatic language understanding tools. A good faith effort has been made to eliminate errors and minimize omissions. Please bring any remaining errors or omissions to the attention of CLSP by writing to [email protected].
@inproceedings{274515167,
title = {CA-SSLR: Condition-Aware Self-Supervised Learning Representation for Generalized Speech Processing},
author = {{Yen-Ju Lu} and {Jing Liu} and {Thomas Thebaud} and {L. Moro-Velázquez} and {A. Rastrow} and {N. Dehak} and {J. Villalba}},
year = 2024,
month = {12},
booktitle = {},
url = {https://www.semanticscholar.org/paper/daf0aba5a88ce8461062165249baba14f723c151},
}
@inproceedings{274598076,
title = {Are Clinical T5 Models Better for Clinical Text?},
author = {{Yahan Li} and {Keith Harrigian} and {Ayah Zirikly} and {Mark Dredze}},
year = 2024,
month = {12},
booktitle = {},
url = {https://www.semanticscholar.org/paper/88d0b0189e6d33ce0a4b9315bd8fe82bad326824},
}
@inproceedings{274606149,
title = {Decoding contextual influences on auditory perception from primary auditory cortex},
author = {{B. Englitz} and {S. Akram} and {Mounya Elhilali} and {S. Shamma}},
year = 2024,
month = {12},
booktitle = {eLife},
url = {https://www.semanticscholar.org/paper/67535ffb91c1f43a979f686f66551000013f83de},
}
@inproceedings{274529945,
title = {Sustained EEG responses to rapidly unfolding stochastic sounds reflect Bayesian inferred reliability tracking},
author = {{Sijia Zhao} and {Benjamin Skerritt-Davis} and {Mounya Elhilali} and {Frederic Dick} and {M. Chait}},
year = 2024,
month = {12},
booktitle = {Progress in neurobiology},
url = {https://www.semanticscholar.org/paper/b7f0613a7bbcb22fc658764f2269d91ecdedd542},
}
@inproceedings{273745499,
title = {Multimodal Emotion Recognition Harnessing the Complementarity of Speech, Language, and Vision},
author = {{Thomas Thebaud} and {A. Favaro} and {Yaohan Guan} and {Yuchen Yang} and {Prabhav Singh} and {J. Villalba} and {Laureano Mono-Velazquez} and {N. Dehak}},
year = 2024,
month = {11},
booktitle = {International Conference on Multimodel Interaction},
url = {https://www.semanticscholar.org/paper/acf86833b29d724bf3a2134f60a2cf4497e013e0},
}
@inproceedings{274139049,
title = {Care to Explain? AI Explanation Types Differentially Impact Chest Radiograph Diagnostic Performance and Physician Trust in AI.},
author = {{Drew Prinster} and {Amama Mahmood} and {S. Saria} and {Jean Jeudy} and {Cheng Ting Lin} and {Paul H Yi} and {Chien-Ming Huang}},
year = 2024,
month = {11},
booktitle = {Radiology},
url = {https://www.semanticscholar.org/paper/71e974f5a49bcdfa72aad21b64158a9f5c176b2e},
}
@inproceedings{274178323,
title = {A data-driven framework for identifying patient subgroups on which an AI/machine learning model may underperform},
author = {{Adarsh Subbaswamy} and {B. Sahiner} and {Nicholas Petrick} and {Vinay Pai} and {Roy Adams} and {Matthew C. Diamond} and {S. Saria}},
year = 2024,
month = {11},
booktitle = {npj Digital Medicine},
url = {https://www.semanticscholar.org/paper/54ec15ff209d42b8540da5786b4262f74e869151},
}
@inproceedings{274131239,
title = {Generative World Explorer},
author = {{Taiming Lu} and {Tianmin Shu} and {Alan Yuille} and {Daniel Khashabi} and {Jieneng Chen}},
year = 2024,
month = {11},
booktitle = {},
url = {https://www.semanticscholar.org/paper/13279a99e7a2b6c8aaac9026cef53034e6cfa1de},
}
It is challenging for models to understand complex, multimodal content such as television clips, and this is in part because video-language models often rely on single-modality reasoning and lack interpretability. To combat these issues we propose TV-TREES, the first multimodal entailment tree generator. TV-TREES serves as an approach to video understanding that promotes interpretable joint-modality reasoning by searching for trees of entailment relationships between simple text-video evidence and higher-level conclusions that prove question-answer pairs. We also introduce the task of multimodal entailment tree generation to evaluate reasoning quality. Our method{‘}s performance on the challenging TVQA benchmark demonstrates interpretable, state-of-the-art zero-shot performance on full clips, illustrating that multimodal entailment tree generation can be a best-of-both-worlds alternative to black-box systems.
@inproceedings{sanders-etal-2024-tv,
title = "{TV}-{TREES}: Multimodal Entailment Trees for Neuro-Symbolic Video Reasoning",
author = "Sanders, Kate and
Weir, Nathaniel and
Van Durme, Benjamin",
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.emnlp-main.1059",
doi = "10.18653/v1/2024.emnlp-main.1059",
pages = "19009--19028",
abstract = "It is challenging for models to understand complex, multimodal content such as television clips, and this is in part because video-language models often rely on single-modality reasoning and lack interpretability. To combat these issues we propose TV-TREES, the first multimodal entailment tree generator. TV-TREES serves as an approach to video understanding that promotes interpretable joint-modality reasoning by searching for trees of entailment relationships between simple text-video evidence and higher-level conclusions that prove question-answer pairs. We also introduce the task of multimodal entailment tree generation to evaluate reasoning quality. Our method{'}s performance on the challenging TVQA benchmark demonstrates interpretable, state-of-the-art zero-shot performance on full clips, illustrating that multimodal entailment tree generation can be a best-of-both-worlds alternative to black-box systems.",
}
Humans regularly engage in analogical thinking, relating personal experiences to current situations (X is analogous to Y because of Z). Analogical thinking allows humans to solve problems in creative ways, grasp difficult concepts, and articulate ideas more effectively. Can language models (LMs) do the same? To answer this question, we propose AnaloBench, a benchmark to determine analogical reasoning ability in LMs. Our benchmarking approach focuses on aspects of this ability that are common among humans: (i) recalling related experiences from a large amount of information, and (ii) applying analogical reasoning to complex and lengthy scenarios. We collect a set of 340 high quality, human written analogies for use in our benchmark, which constitutes the largest such collection to date. We then test a broad collection of models consisting of 12 open source and 3 proprietary in various sizes and architectures. As in prior results, scaling up LMs results in some performance boosts. Surprisingly, scale offers minimal gains when, (i) analogies involve lengthy scenarios, or (ii) recalling relevant scenarios from a large pool of information, a process analogous to finding a needle in a haystack. We hope these observations encourage further research in this field.
@inproceedings{ye-etal-2024-analobench,
title = "{A}nalo{B}ench: Benchmarking the Identification of Abstract and Long-context Analogies",
author = "Ye, Xiao and
Wang, Andrew and
Choi, Jacob and
Lu, Yining and
Sharma, Shreya and
Shen, Lingfeng and
Tiyyala, Vijay Murari and
Andrews, Nicholas and
Khashabi, Daniel",
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.emnlp-main.725",
doi = "10.18653/v1/2024.emnlp-main.725",
pages = "13060--13082",
abstract = "Humans regularly engage in analogical thinking, relating personal experiences to current situations (X is analogous to Y because of Z). Analogical thinking allows humans to solve problems in creative ways, grasp difficult concepts, and articulate ideas more effectively. Can language models (LMs) do the same? To answer this question, we propose AnaloBench, a benchmark to determine analogical reasoning ability in LMs. Our benchmarking approach focuses on aspects of this ability that are common among humans: (i) recalling related experiences from a large amount of information, and (ii) applying analogical reasoning to complex and lengthy scenarios. We collect a set of 340 high quality, human written analogies for use in our benchmark, which constitutes the largest such collection to date. We then test a broad collection of models consisting of 12 open source and 3 proprietary in various sizes and architectures. As in prior results, scaling up LMs results in some performance boosts. Surprisingly, scale offers minimal gains when, (i) analogies involve lengthy scenarios, or (ii) recalling relevant scenarios from a large pool of information, a process analogous to finding a needle in a haystack. We hope these observations encourage further research in this field.",
}
To explain social phenomena and identify systematic biases, much research in computational social science focuses on comparative text analyses. These studies often rely on coarse corpus-level statistics or local word-level analyses, mainly in English. We introduce the InfoGap method{–-}an efficient and reliable approach to locating information gaps and inconsistencies in articles at the fact level, across languages. We evaluate InfoGap by analyzing LGBT people{‘}s portrayals, across 2.7K biography pages on English, Russian, and French Wikipedias. We find large discrepancies in factual coverage across the languages. Moreover, our analysis reveals that biographical facts carrying negative connotations are more likely to be highlighted in Russian Wikipedia. Crucially, InfoGap both facilitates large scale analyses, and pinpoints local document- and fact-level information gaps, laying a new foundation for targeted and nuanced comparative language analysis at scale.
@inproceedings{samir-etal-2024-locating,
title = "Locating Information Gaps and Narrative Inconsistencies Across Languages: A Case Study of {LGBT} People Portrayals on {W}ikipedia",
author = "Samir, Farhan and
Park, Chan Young and
Field, Anjalie and
Shwartz, Vered and
Tsvetkov, Yulia",
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.emnlp-main.384",
doi = "10.18653/v1/2024.emnlp-main.384",
pages = "6747--6762",
abstract = "To explain social phenomena and identify systematic biases, much research in computational social science focuses on comparative text analyses. These studies often rely on coarse corpus-level statistics or local word-level analyses, mainly in English. We introduce the InfoGap method{---}an efficient and reliable approach to locating information gaps and inconsistencies in articles at the fact level, across languages. We evaluate InfoGap by analyzing LGBT people{'}s portrayals, across 2.7K biography pages on English, Russian, and French Wikipedias. We find large discrepancies in factual coverage across the languages. Moreover, our analysis reveals that biographical facts carrying negative connotations are more likely to be highlighted in Russian Wikipedia. Crucially, InfoGap both facilitates large scale analyses, and pinpoints local document- and fact-level information gaps, laying a new foundation for targeted and nuanced comparative language analysis at scale.",
}
@inproceedings{274287296,
title = {Taxonomy-based prompt engineering to generate synthetic drug-related patient portal messages.},
author = {{Natalie Wang} and {Sukrit Treewaree} and {Ayah Zirikly} and {Yuzhi L. Lu} and {Michelle H. Nguyen} and {Bhavik Agarwal} and {Jash Shah} and {J. M. Stevenson} and {Casey Overby Taylor}},
year = 2024,
month = {11},
booktitle = {Journal of Biomedical Informatics},
url = {https://www.semanticscholar.org/paper/aceb915df57e8f1708fa54cb7f828da00c76c42f},
}
@inproceedings{274444639,
title = {Deep Stroop: Integrating eye tracking and speech processing to characterize people with neurodegenerative disorders while performing neuropsychological tests.},
author = {{Trevor Meyer} and {A. Favaro} and {Esther S. Oh} and {A. Butala} and {C. Motley} and {Pedro P. Irazoqui} and {N. Dehak} and {L. Moro-Velázquez}},
year = 2024,
month = {11},
booktitle = {Computers in Biology and Medicine},
url = {https://www.semanticscholar.org/paper/528e2a1618feeb267fc7fc4873207266ef5c01a3},
}
Recent language models enable new opportunities for structured reasoning with text, such as the construction of intuitive, proof-like textual entailment trees without relying on brittle formal logic. However, progress in this direction has been hampered by a long-standing lack of a clear protocol for determining what {_}valid decompositional entailment{_} is. This absence causes noisy datasets and limited performance gains by modern neuro-symbolic entailment engines. To address these problems, we formulate a consistent and theoretically grounded approach to annotating decompositional entailment and evaluate its impact on LLM-based textual inference. We find that our new dataset, RDTE (Recognizing Decompositional Textual Entailment), has a substantially higher internal consistency than prior decompositional entailment datasets, suggesting that RDTE is a significant step forward in the long-standing problem of forming a clear protocol for discerning entailment. We also find that training an RDTE-oriented entailment classifier via knowledge distillation and employing it in an entailment tree reasoning engine significantly improves both accuracy and proof quality, illustrating the practical benefit of this advance for textual inference.
@inproceedings{weir-etal-2024-enhancing,
title = "Enhancing Systematic Decompositional Natural Language Inference Using Informal Logic",
author = "Weir, Nathaniel and
Sanders, Kate and
Weller, Orion and
Sharma, Shreya and
Jiang, Dongwei and
Jiang, Zhengping and
Dalvi Mishra, Bhavana and
Tafjord, Oyvind and
Jansen, Peter and
Clark, Peter and
Van Durme, Benjamin",
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.emnlp-main.531",
doi = "10.18653/v1/2024.emnlp-main.531",
pages = "9458--9482",
abstract = "Recent language models enable new opportunities for structured reasoning with text, such as the construction of intuitive, proof-like textual entailment trees without relying on brittle formal logic. However, progress in this direction has been hampered by a long-standing lack of a clear protocol for determining what {\_}valid decompositional entailment{\_} is. This absence causes noisy datasets and limited performance gains by modern neuro-symbolic entailment engines. To address these problems, we formulate a consistent and theoretically grounded approach to annotating decompositional entailment and evaluate its impact on LLM-based textual inference. We find that our new dataset, RDTE (Recognizing Decompositional Textual Entailment), has a substantially higher internal consistency than prior decompositional entailment datasets, suggesting that RDTE is a significant step forward in the long-standing problem of forming a clear protocol for discerning entailment. We also find that training an RDTE-oriented entailment classifier via knowledge distillation and employing it in an entailment tree reasoning engine significantly improves both accuracy and proof quality, illustrating the practical benefit of this advance for textual inference.",
}
We find that the best publicly available LLMs like GPT-4 and Claude currently perform poorly on basic legal text handling. This motivates the creation of a benchmark consisting of examples that lawyers and paralegals would expect LLMs to handle zero-shot, such as looking up the text at a line of a witness deposition or at a subsection of a contract. LLMs{‘} poor performance on this benchmark casts into doubt their reliability as-is for legal practice. However, fine-tuning on our training set brings even a small model to near-perfect performance. This benchmark will be useful for fine-tuning LLMs for downstream legal tasks, as well as for tracking LLMs{‘} reliability as-is for basic legal tasks.
@inproceedings{blair-stanek-etal-2024-blt,
title = "{BLT}: Can Large Language Models Handle Basic Legal Text?",
author = "Blair-Stanek, Andrew and
Holzenberger, Nils and
Van Durme, Benjamin",
editor = "Aletras, Nikolaos and
Chalkidis, Ilias and
Barrett, Leslie and
Goan{\textcommabelow{t}}{\u{a}}, C{\u{a}}t{\u{a}}lina and
Preo{\textcommabelow{t}}iuc-Pietro, Daniel and
Spanakis, Gerasimos",
booktitle = "Proceedings of the Natural Legal Language Processing Workshop 2024",
month = nov,
year = "2024",
address = "Miami, FL, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.nllp-1.18",
doi = "10.18653/v1/2024.nllp-1.18",
pages = "216--232",
abstract = "We find that the best publicly available LLMs like GPT-4 and Claude currently perform poorly on basic legal text handling. This motivates the creation of a benchmark consisting of examples that lawyers and paralegals would expect LLMs to handle zero-shot, such as looking up the text at a line of a witness deposition or at a subsection of a contract. LLMs{'} poor performance on this benchmark casts into doubt their reliability as-is for legal practice. However, fine-tuning on our training set brings even a small model to near-perfect performance. This benchmark will be useful for fine-tuning LLMs for downstream legal tasks, as well as for tracking LLMs{'} reliability as-is for basic legal tasks.",
}
We introduce a language generation dataset grounded in a popular video game. KNUDGE (**KN**owledge Constrained **U**ser-NPC **D**ialogue **GE**neration) requires models to produce trees of dialogue between video game characters that accurately reflect quest and entity specifications stated in natural language. KNUDGE is constructed from side quest dialogues drawn directly from game data of Obsidian Entertainment{‘}s {_}The Outer Worlds{_}, leading to real-world complexities in generation: (1) utterances must remain faithful to the game lore, including character personas and backstories; (2) a dialogue must accurately reveal new quest details to the human player; and (3) dialogues are large trees as opposed to linear chains of utterances. We report results for a set of neural generation models using supervised and in-context learning techniques; we find competent performance but room for future work addressing the challenges of creating realistic, game-quality dialogues.
@inproceedings{weir-etal-2024-ontologically,
title = "Ontologically Faithful Generation of Non-Player Character Dialogues",
author = "Weir, Nathaniel and
Thomas, Ryan and
d{'}Amore, Randolph and
Hill, Kellie and
Van Durme, Benjamin and
Jhamtani, Harsh",
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.emnlp-main.520",
doi = "10.18653/v1/2024.emnlp-main.520",
pages = "9212--9242",
abstract = "We introduce a language generation dataset grounded in a popular video game. KNUDGE (**KN**owledge Constrained **U**ser-NPC **D**ialogue **GE**neration) requires models to produce trees of dialogue between video game characters that accurately reflect quest and entity specifications stated in natural language. KNUDGE is constructed from side quest dialogues drawn directly from game data of Obsidian Entertainment{'}s {\_}The Outer Worlds{\_}, leading to real-world complexities in generation: (1) utterances must remain faithful to the game lore, including character personas and backstories; (2) a dialogue must accurately reveal new quest details to the human player; and (3) dialogues are large trees as opposed to linear chains of utterances. We report results for a set of neural generation models using supervised and in-context learning techniques; we find competent performance but room for future work addressing the challenges of creating realistic, game-quality dialogues.",
}
@InProceedings{chen-et-al-2024,
aclid = "2024.emnlp-main.406",
author = "Yunmo Chen and Tongfei Chen and Harsh Jhamtani and
Patrick Xia and Richard Shin and Jason Eisner and
Benjamin Van Durme",
title = "Learning to Retrieve Iteratively for In-Context
Learning",
booktitle = "Proceedings of the Conference on Empirical Methods in
Natural Language Processing (EMNLP)",
pages = "7156--7168",
year = "2024",
month = nov,
URL = "http://cs.jhu.edu/~jason/papers/#chen-et-al-2024",
}
@InProceedings{bostrom-et-al-2024,
aclid = "2024.emnlp-main.462",
author = "Kaj Bostrom and Harsh Jhamtani and Hao Fang and Sam
Thomson and Richard Shin and Patrick Xia and Benjamin
Van Durme and Jason Eisner and Jacob Andreas",
title = "Language-to-Code Translation with a Single Labeled
Example",
booktitle = "Proceedings of the Conference on Empirical Methods in
Natural Language Processing (EMNLP)",
pages = "8101--8112",
year = "2024",
month = nov,
URL = "http://cs.jhu.edu/~jason/papers/#bostrom-et-al-2024",
}
@inproceedings{273163058,
title = {On Expert Estimation in Hierarchical Mixture of Experts: Beyond Softmax Gating Functions},
author = {{Huy Nguyen} and {Xing Han} and {C. Harris} and {S. Saria} and {Nhat Ho}},
year = 2024,
month = {10},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/8fa041c2762bd3ad22dc673d89059e27daf01881},
}
@inproceedings{273636715,
title = {Temporal coherence shapes cortical responses to speech mixtures in a ferret cocktail party},
author = {{Neha Joshi} and {Wing Yiu Ng} and {Karan Thakkar} and {Daniel Duque} and {Pingbo Yin} and {Jonathan Fritz} and {Mounya Elhilali} and {S. Shamma}},
year = 2024,
month = {10},
booktitle = {Communications Biology},
url = {https://www.semanticscholar.org/paper/8afe9f8e4a9485e20070c362067d3a06f3653311},
}
@inproceedings{273648380,
title = {Unveiling early signs of Parkinson’s disease via a longitudinal analysis of celebrity speech recordings},
author = {{A. Favaro} and {A. Butala} and {Thomas Thebaud} and {J. Villalba} and {N. Dehak} and {L. Moro-Velázquez}},
year = 2024,
month = {10},
booktitle = {npj Parkinson's Disease},
url = {https://www.semanticscholar.org/paper/4daac9614c0979ec790583db1a2c86c07456f32a},
}
@inproceedings{273691413,
title = {Enhancement of a social risk score in the electronic health record to identify social needs among medically underserved patients: using structured data and free-text provider notes},
author = {{E. Hatef} and {C. Kitchen} and {Geoffrey M Gray} and {Ayah Zirikly} and {Thomas M Richards} and {Luis M Ahumada} and {Jonathan P. Weiner}},
year = 2024,
month = {10},
booktitle = {JAMIA Open},
url = {https://www.semanticscholar.org/paper/d5013b3593f9a1e25a3b0bb84150158911d752f0},
}
@inproceedings{273323322,
title = {Evaluating Differentially Private Synthetic Data Generation in High-Stakes Domains},
author = {{Krithika Ramesh} and {Nupoor Gandhi} and {Pulkit Madaan} and {Lisa Bauer} and {Charith Peris} and {Anjalie Field}},
year = 2024,
month = {10},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/d1bc6e53f2cc088406ab8bb4d8b63d26944c15c8},
}
@InProceedings{hashemi-et-al-2024,
aclid = "2024.acl-long.745",
author = "Helia Hashemi and Corby Rosset and Benjamin Van Durme
and Jason Eisner and Chris Kedzie",
title = "\textsc{LLM-Rubric}: {A} Multidimensional, Calibrated
Approach to Automated Evaluation of Natural Language
Texts",
booktitle = "Proceedings of the 62nd Annual Meeting of the
Association for Computational Linguistics (ACL)",
pages = "13806--13834",
year = "2024",
month = aug,
URL = "http://cs.jhu.edu/~jason/papers/#hashemi-et-al-2024",
}
@InProceedings{wang-et-al-2024-tools,
aclid = "2024.acl-long.570",
author = "Boshi Wang and Hao Fang and Jason Eisner and Benjamin
Van Durme and Yu Su",
title = "{LLMs} in the {I}maginarium: Tool Learning through
Simulated Trial and Error",
booktitle = "Proceedings of the 62nd Annual Meeting of the
Association for Computational Linguistics (ACL)",
pages = "10583--10604",
year = "2024",
month = aug,
URL = "http://cs.jhu.edu/~jason/papers/#wang-et-al-2024-tools",
}
@InProceedings{wang-et-al-2024-hallucination,
aclid = "2024.findings-acl.260",
author = "Sky CH-Wang and Benjamin Van Durme and Jason Eisner
and Chris Kedzie",
title = "Do Androids Know They’re Only Dreaming of Electric
Sheep?",
booktitle = "Findings of the 62nd Annual Meeting of the Association
for Computational Linguistics (ACL)",
pages = "4401--4420",
year = "2024",
month = aug,
URL = "http://cs.jhu.edu/~jason/papers/#wang-et-al-2024-hallucination",
}
@InProceedings{monea-et-al-2024,
aclid = "2024.acl-long.369",
author = "Giovanni Monea and Maxime Peyrard and Martin Josifoski
and Vishrav Chaudhary and Jason Eisner and Emre
K{\i}c{\i}man and Hamid Palangi and Barun Patra and
Robert West",
title = "A Glitch in the {M}atrix? {L}ocating and Detecting
Language Model Grounding with {F}akepedia",
booktitle = "Proceedings of the 62nd Annual Meeting of the
Association for Computational Linguistics (ACL)",
pages = "6828--6844",
year = "2024",
month = aug,
URL = "http://cs.jhu.edu/~jason/papers/#monea-et-al-2024",
}
@InProceedings{du-et-al-2024-tight,
aclid = "2024.findings-acl.659",
author = "Li Du and Jason Eisner and Holden Lee and Ryan
Cotterell",
title = "When is a Language Process a Language Model?",
booktitle = "Findings of the 62nd Annual Meeting of the Association
for Computational Linguistics (ACL)",
pages = "11083--11094",
year = "2024",
month = aug,
URL = "http://cs.jhu.edu/~jason/papers/#du-et-al-2024-tight",
}
@InProceedings{du-et-al-2024-mcmc,
author = "Li Du and Afra Amini and Lucas Torroba Hennigen and
Xinyan Velocity Yu and Holden Lee and Jason Eisner and
Ryan Cotterell",
title = "Principled Gradient-Based {MCMC} for Conditional
Sampling of Text",
booktitle = "Proceedings of the 41st International Conference on
Machine Learning (ICML)",
year = "2024",
month = jul,
URL = "http://cs.jhu.edu/~jason/papers/#du-et-al-2024-mcmc",
}
Existing watermarked generation algorithms employ token-level designs and therefore, are vulnerable to paraphrase attacks. To address this issue, we introduce watermarking on the semantic representation of sentences. We propose SemStamp, a robust sentence-level semantic watermarking algorithm that uses locality-sensitive hashing (LSH) to partition the semantic space of sentences. The algorithm encodes and LSH-hashes a candidate sentence generated by a language model, and conducts rejection sampling until the sampled sentence falls in watermarked partitions in the semantic embedding space. To test the paraphrastic robustness of watermarking algorithms, we propose a {“}bigram paraphrase{”} attack that produces paraphrases with small bigram overlap with the original sentence. This attack is shown to be effective against existing token-level watermark algorithms, while posing only minor degradations to SemStamp. Experimental results show that our novel semantic watermark algorithm is not only more robust than the previous state-of-the-art method on various paraphrasers and domains, but also better at preserving the quality of generation.
@inproceedings{hou-etal-2024-semstamp,
title = "{S}em{S}tamp: A Semantic Watermark with Paraphrastic Robustness for Text Generation",
author = "Hou, Abe and
Zhang, Jingyu and
He, Tianxing and
Wang, Yichen and
Chuang, Yung-Sung and
Wang, Hongwei and
Shen, Lingfeng and
Van Durme, Benjamin and
Khashabi, Daniel and
Tsvetkov, Yulia",
editor = "Duh, Kevin and
Gomez, Helena and
Bethard, Steven",
booktitle = "Proceedings of the 2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers)",
month = jun,
year = "2024",
address = "Mexico City, Mexico",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.naacl-long.226",
doi = "10.18653/v1/2024.naacl-long.226",
pages = "4067--4082",
abstract = "Existing watermarked generation algorithms employ token-level designs and therefore, are vulnerable to paraphrase attacks. To address this issue, we introduce watermarking on the semantic representation of sentences. We propose SemStamp, a robust sentence-level semantic watermarking algorithm that uses locality-sensitive hashing (LSH) to partition the semantic space of sentences. The algorithm encodes and LSH-hashes a candidate sentence generated by a language model, and conducts rejection sampling until the sampled sentence falls in watermarked partitions in the semantic embedding space. To test the paraphrastic robustness of watermarking algorithms, we propose a {``}bigram paraphrase{''} attack that produces paraphrases with small bigram overlap with the original sentence. This attack is shown to be effective against existing token-level watermark algorithms, while posing only minor degradations to SemStamp. Experimental results show that our novel semantic watermark algorithm is not only more robust than the previous state-of-the-art method on various paraphrasers and domains, but also better at preserving the quality of generation.",
}
Large Language Models (LLMs) have shown promising in-context learning abilities. However, conventional In-Context Learning (ICL) approaches are often impeded by length limitations of transformer architecture, which pose challenges when attempting to effectively integrate supervision from a substantial number of demonstration examples. In this paper, we introduce a novel framework, called Naive Bayes-based Context Extension (NBCE), to enable existing LLMs to perform ICL with an increased number of demonstrations by significantly expanding their context size. Importantly, this expansion does not require fine-tuning or dependence on particular model architectures, all the while preserving linear efficiency. NBCE initially splits the context into equal-sized windows fitting the target LLM{‘}s maximum length. Then, it introduces a voting mechanism to select the most relevant window, regarded as the posterior context. Finally, it employs Bayes{‘} theorem to generate the test task. Our experimental results demonstrate that NBCE substantially enhances performance, particularly as the number of demonstration examples increases, consistently outperforming alternative methods. The NBCE code will be made publicly accessible. The code NBCE is available at: https://github.com/amurtadha/NBCE-master
@inproceedings{su-etal-2024-naive,
title = "Naive {B}ayes-based Context Extension for Large Language Models",
author = "Su, Jianlin and
Ahmed, Murtadha and
Wen, Bo and
Ao, Luo and
Zhu, Mingren and
Liu, Yunfeng",
editor = "Duh, Kevin and
Gomez, Helena and
Bethard, Steven",
booktitle = "Proceedings of the 2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers)",
month = jun,
year = "2024",
address = "Mexico City, Mexico",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.naacl-long.431",
doi = "10.18653/v1/2024.naacl-long.431",
pages = "7791--7807",
abstract = "Large Language Models (LLMs) have shown promising in-context learning abilities. However, conventional In-Context Learning (ICL) approaches are often impeded by length limitations of transformer architecture, which pose challenges when attempting to effectively integrate supervision from a substantial number of demonstration examples. In this paper, we introduce a novel framework, called Naive Bayes-based Context Extension (NBCE), to enable existing LLMs to perform ICL with an increased number of demonstrations by significantly expanding their context size. Importantly, this expansion does not require fine-tuning or dependence on particular model architectures, all the while preserving linear efficiency. NBCE initially splits the context into equal-sized windows fitting the target LLM{'}s maximum length. Then, it introduces a voting mechanism to select the most relevant window, regarded as the posterior context. Finally, it employs Bayes{'} theorem to generate the test task. Our experimental results demonstrate that NBCE substantially enhances performance, particularly as the number of demonstration examples increases, consistently outperforming alternative methods. The NBCE code will be made publicly accessible. The code NBCE is available at: https://github.com/amurtadha/NBCE-master",
}
While Transformer-based neural machine translation (NMT) is very effective in high-resource settings, many languages lack the necessary large parallel corpora to benefit from it. In the context of low-resource (LR) MT between two closely-related languages, a natural intuition is to seek benefits from structural {“}shortcuts{”}, such as copying subwords from the source to the target, given that such language pairs often share a considerable number of identical words, cognates, and borrowings. We test Pointer-Generator Networks for this purpose for six language pairs over a variety of resource ranges, and find weak improvements for most settings. However, analysis shows that the model does not show greater improvements for closely-related vs. more distant language pairs, or for lower resource ranges, and that the models do not exhibit the expected usage of the mechanism for shared subwords. Our discussion of the reasons for this behaviour highlights several general challenges for LR NMT, such as modern tokenization strategies, noisy real-world conditions, and linguistic complexities. We call for better scrutiny of linguistically motivated improvements to NMT given the blackbox nature of Transformer models, as well as for a focus on the above problems in the field.
@inproceedings{bafna-etal-2024-pointer,
title = "Pointer-Generator Networks for Low-Resource Machine Translation: Don{'}t Copy That!",
author = "Bafna, Niyati and
Koehn, Philipp and
Yarowsky, David",
editor = "Tafreshi, Shabnam and
Akula, Arjun and
Sedoc, Jo{\~a}o and
Drozd, Aleksandr and
Rogers, Anna and
Rumshisky, Anna",
booktitle = "Proceedings of the Fifth Workshop on Insights from Negative Results in NLP",
month = jun,
year = "2024",
address = "Mexico City, Mexico",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.insights-1.9",
doi = "10.18653/v1/2024.insights-1.9",
pages = "60--72",
abstract = "While Transformer-based neural machine translation (NMT) is very effective in high-resource settings, many languages lack the necessary large parallel corpora to benefit from it. In the context of low-resource (LR) MT between two closely-related languages, a natural intuition is to seek benefits from structural {``}shortcuts{''}, such as copying subwords from the source to the target, given that such language pairs often share a considerable number of identical words, cognates, and borrowings. We test Pointer-Generator Networks for this purpose for six language pairs over a variety of resource ranges, and find weak improvements for most settings. However, analysis shows that the model does not show greater improvements for closely-related vs. more distant language pairs, or for lower resource ranges, and that the models do not exhibit the expected usage of the mechanism for shared subwords. Our discussion of the reasons for this behaviour highlights several general challenges for LR NMT, such as modern tokenization strategies, noisy real-world conditions, and linguistic complexities. We call for better scrutiny of linguistically motivated improvements to NMT given the blackbox nature of Transformer models, as well as for a focus on the above problems in the field.",
}
Understanding event descriptions is a central aspect of language processing, but current approaches focus overwhelmingly on single sentences or documents. Aggregating information about an event across documents can offer a much richer understanding. To this end, we present FAMuS, a new corpus of Wikipedia passages that report on some event, paired with underlying, genre-diverse (non-Wikipedia) source articles for the same event. Events and (cross-sentence) arguments in both report and source are annotated against FrameNet, providing broad coverage of different event types. We present results on two key event understanding tasks enabled by FAMuS: source validation{–-}determining whether a document is a valid source for a target report event{–-}and cross-document argument extraction{–-}full-document argument extraction for a target event from both its report and the correct source article.
@inproceedings{vashishtha-etal-2024-famus,
title = "{FAM}u{S}: Frames Across Multiple Sources",
author = "Vashishtha, Siddharth and
Martin, Alexander and
Gantt, William and
Van Durme, Benjamin and
White, Aaron",
editor = "Duh, Kevin and
Gomez, Helena and
Bethard, Steven",
booktitle = "Proceedings of the 2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers)",
month = jun,
year = "2024",
address = "Mexico City, Mexico",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.naacl-long.457",
doi = "10.18653/v1/2024.naacl-long.457",
pages = "8250--8273",
abstract = "Understanding event descriptions is a central aspect of language processing, but current approaches focus overwhelmingly on single sentences or documents. Aggregating information about an event across documents can offer a much richer understanding. To this end, we present FAMuS, a new corpus of Wikipedia passages that report on some event, paired with underlying, genre-diverse (non-Wikipedia) source articles for the same event. Events and (cross-sentence) arguments in both report and source are annotated against FrameNet, providing broad coverage of different event types. We present results on two key event understanding tasks enabled by FAMuS: source validation{---}determining whether a document is a valid source for a target report event{---}and cross-document argument extraction{---}full-document argument extraction for a target event from both its report and the correct source article.",
}
Reference-based metrics that operate at the sentence-level typically outperform quality estimation metrics, which have access only to the source and system output.This is unsurprising, since references resolve ambiguities that may be present in the source.In this paper, we investigate whether additional source context can effectively substitute for a reference.We present a metric named SLIDE (SLIding Document Evaluator), which operates on blocks of sentences. SLIDE leverages a moving window that slides over each document in the test set, feeding each chunk of sentences into an unmodified, off-the-shelf quality estimation model.We find that SLIDE obtains significantly higher pairwise system accuracy than its sentence-level baseline, in some cases even eliminating the gap with reference-base metrics.This suggests that source context may provide the same information as a human reference in disambiguating source ambiguities. This finding is especially pertinent for reference-free document-level evaluation, wherein SLIDE could provide higher-quality pairwise system assessments while only requiring document boundary annotations.
@inproceedings{raunak-etal-2024-slide,
title = "{SLIDE}: Reference-free Evaluation for Machine Translation using a Sliding Document Window",
author = "Raunak, Vikas and
Kocmi, Tom and
Post, Matt",
editor = "Duh, Kevin and
Gomez, Helena and
Bethard, Steven",
booktitle = "Proceedings of the 2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 2: Short Papers)",
month = jun,
year = "2024",
address = "Mexico City, Mexico",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.naacl-short.18",
doi = "10.18653/v1/2024.naacl-short.18",
pages = "205--211",
abstract = "Reference-based metrics that operate at the sentence-level typically outperform quality estimation metrics, which have access only to the source and system output.This is unsurprising, since references resolve ambiguities that may be present in the source.In this paper, we investigate whether additional source context can effectively substitute for a reference.We present a metric named SLIDE (SLIding Document Evaluator), which operates on blocks of sentences. SLIDE leverages a moving window that slides over each document in the test set, feeding each chunk of sentences into an unmodified, off-the-shelf quality estimation model.We find that SLIDE obtains significantly higher pairwise system accuracy than its sentence-level baseline, in some cases even eliminating the gap with reference-base metrics.This suggests that source context may provide the same information as a human reference in disambiguating source ambiguities. This finding is especially pertinent for reference-free document-level evaluation, wherein SLIDE could provide higher-quality pairwise system assessments while only requiring document boundary annotations.",
}
@InProceedings{moghe-et-al-2024,
aclid = "2024.findings-naacl.255",
author = "Nikita Moghe and Patrick Xia and Jacob Andreas and
Jason Eisner and Benjamin Van Durme and Harsh
Jhamtani",
title = "Interpreting User Requests in the Context of Natural
Language Standing Instructions",
booktitle = "Findings of the North American Conference on
Cmputational Linguistics (NAACL)",
volume = "arXiv:2311.09796",
pages = "4043--4060",
year = "2024",
month = jun,
URL = "http://cs.jhu.edu/~jason/papers/#moghe-et-al-2024",
}
The growing emphasis on fairness in speech-processing tasks requires datasets with speakers from diverse subgroups that allow training and evaluating fair speech technology systems. However, creating such datasets through manual annotation can be costly. To address this challenge, we present a semi-automated dataset creation pipeline that leverages large language models. We use this pipeline to generate a dataset of speakers identifying themself or another speaker as belonging to a particular race, ethnicity, or national origin group. We use OpenaAI{‘}s GPT-4 to perform two complex annotation tasks- separating files relevant to our intended dataset from the irrelevant ones (filtering) and finding and extracting information on identifications within a transcript (tagging). By evaluating GPT-4{‘}s performance using human annotations as ground truths, we show that it can reduce resources required by dataset annotation while barely losing any important information. For the filtering task, GPT-4 had a very low miss rate of 6.93{\%}. GPT-4{‘}s tagging performance showed a trade-off between precision and recall, where the latter got as high as 97{\%}, but precision never exceeded 45{\%}. Our approach reduces the time required for the filtering and tagging tasks by 95{\%} and 80{\%}, respectively. We also present an in-depth error analysis of GPT-4{‘}s performance.
@inproceedings{jahan-etal-2024-finding,
title = "Finding Spoken Identifications: Using {GPT}-4 Annotation for an Efficient and Fast Dataset Creation Pipeline",
author = "Jahan, Maliha and
Wang, Helin and
Thebaud, Thomas and
Sun, Yinglun and
Le, Giang Ha and
Fagyal, Zsuzsanna and
Scharenborg, Odette and
Hasegawa-Johnson, Mark and
Moro Velazquez, Laureano and
Dehak, Najim",
editor = "Calzolari, Nicoletta and
Kan, Min-Yen and
Hoste, Veronique and
Lenci, Alessandro and
Sakti, Sakriani and
Xue, Nianwen",
booktitle = "Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)",
month = may,
year = "2024",
address = "Torino, Italia",
publisher = "ELRA and ICCL",
url = "https://aclanthology.org/2024.lrec-main.641",
pages = "7296--7306",
abstract = "The growing emphasis on fairness in speech-processing tasks requires datasets with speakers from diverse subgroups that allow training and evaluating fair speech technology systems. However, creating such datasets through manual annotation can be costly. To address this challenge, we present a semi-automated dataset creation pipeline that leverages large language models. We use this pipeline to generate a dataset of speakers identifying themself or another speaker as belonging to a particular race, ethnicity, or national origin group. We use OpenaAI{'}s GPT-4 to perform two complex annotation tasks- separating files relevant to our intended dataset from the irrelevant ones (filtering) and finding and extracting information on identifications within a transcript (tagging). By evaluating GPT-4{'}s performance using human annotations as ground truths, we show that it can reduce resources required by dataset annotation while barely losing any important information. For the filtering task, GPT-4 had a very low miss rate of 6.93{\%}. GPT-4{'}s tagging performance showed a trade-off between precision and recall, where the latter got as high as 97{\%}, but precision never exceeded 45{\%}. Our approach reduces the time required for the filtering and tagging tasks by 95{\%} and 80{\%}, respectively. We also present an in-depth error analysis of GPT-4{'}s performance.",
}
Multilingual machine translation has proven immensely useful for both parameter efficiency and overall performance across many language pairs via complete multilingual parameter sharing. However, some language pairs in multilingual models can see worse performance than in bilingual models, especially in the one-to-many translation setting. Motivated by their empirical differences, we examine the geometric differences in representations from bilingual models versus those from one-to-many multilingual models. Specifically, we compute the isotropy of these representations using intrinsic dimensionality and IsoScore, in order to measure how the representations utilize the dimensions in their underlying vector space. Using the same evaluation data in both models, we find that for a given language pair, its multilingual model decoder representations are consistently less isotropic and occupy fewer dimensions than comparable bilingual model decoder representations. Additionally, we show that much of the anisotropy in multilingual decoder representations can be attributed to modeling language-specific information, therefore limiting remaining representational capacity.
@inproceedings{verma-etal-2024-exploring,
title = "Exploring Geometric Representational Disparities between Multilingual and Bilingual Translation Models",
author = "Verma, Neha and
Murray, Kenton and
Duh, Kevin",
editor = "Calzolari, Nicoletta and
Kan, Min-Yen and
Hoste, Veronique and
Lenci, Alessandro and
Sakti, Sakriani and
Xue, Nianwen",
booktitle = "Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)",
month = may,
year = "2024",
address = "Torino, Italia",
publisher = "ELRA and ICCL",
url = "https://aclanthology.org/2024.lrec-main.604",
pages = "6909--6921",
abstract = "Multilingual machine translation has proven immensely useful for both parameter efficiency and overall performance across many language pairs via complete multilingual parameter sharing. However, some language pairs in multilingual models can see worse performance than in bilingual models, especially in the one-to-many translation setting. Motivated by their empirical differences, we examine the geometric differences in representations from bilingual models versus those from one-to-many multilingual models. Specifically, we compute the isotropy of these representations using intrinsic dimensionality and IsoScore, in order to measure how the representations utilize the dimensions in their underlying vector space. Using the same evaluation data in both models, we find that for a given language pair, its multilingual model decoder representations are consistently less isotropic and occupy fewer dimensions than comparable bilingual model decoder representations. Additionally, we show that much of the anisotropy in multilingual decoder representations can be attributed to modeling language-specific information, therefore limiting remaining representational capacity.",
}
In this study, we present a generalizable workflow to identify documents in a historic language with a nonstandard language and script combination, Armeno-Turkish. We introduce the task of detecting distinct patterns of multilinguality based on the frequency of structured language alternations within a document.
@inproceedings{sirin-etal-2024-detecting,
title = "Detecting Structured Language Alternations in Historical Documents by Combining Language Identification with {F}ourier Analysis",
author = "Sirin, Hale and
Li, Sabrina and
Lippincott, Thomas",
editor = "Bizzoni, Yuri and
Degaetano-Ortlieb, Stefania and
Kazantseva, Anna and
Szpakowicz, Stan",
booktitle = "Proceedings of the 8th Joint SIGHUM Workshop on Computational Linguistics for Cultural Heritage, Social Sciences, Humanities and Literature (LaTeCH-CLfL 2024)",
month = mar,
year = "2024",
address = "St. Julians, Malta",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.latechclfl-1.6",
pages = "46--50",
abstract = "In this study, we present a generalizable workflow to identify documents in a historic language with a nonstandard language and script combination, Armeno-Turkish. We introduce the task of detecting distinct patterns of multilinguality based on the frequency of structured language alternations within a document.",
}
We present a novel combination of dynamic embedded topic models and change-point detection to explore diachronic change of lexical semantic modality in classical and early Christian Latin. We demonstrate several methods for finding and characterizing patterns in the output, and relating them to traditional scholarship in Comparative Literature and Classics. This simple approach to unsupervised models of semantic change can be applied to any suitable corpus, and we conclude with future directions and refinements aiming to allow noisier, less-curated materials to meet that threshold.
@inproceedings{sirin-lippincott-2024-dynamic,
title = "Dynamic embedded topic models and change-point detection for exploring literary-historical hypotheses",
author = "Sirin, Hale and
Lippincott, Thomas",
editor = "Bizzoni, Yuri and
Degaetano-Ortlieb, Stefania and
Kazantseva, Anna and
Szpakowicz, Stan",
booktitle = "Proceedings of the 8th Joint SIGHUM Workshop on Computational Linguistics for Cultural Heritage, Social Sciences, Humanities and Literature (LaTeCH-CLfL 2024)",
month = mar,
year = "2024",
address = "St. Julians, Malta",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.latechclfl-1.22",
pages = "231--236",
abstract = "We present a novel combination of dynamic embedded topic models and change-point detection to explore diachronic change of lexical semantic modality in classical and early Christian Latin. We demonstrate several methods for finding and characterizing patterns in the output, and relating them to traditional scholarship in Comparative Literature and Classics. This simple approach to unsupervised models of semantic change can be applied to any suitable corpus, and we conclude with future directions and refinements aiming to allow noisier, less-curated materials to meet that threshold.",
}
We present the overview of the CLPsych 2024 Shared Task, focusing on leveraging open source Large Language Models (LLMs) for identifying textual evidence that supports the suicidal risk level of individuals on Reddit. In particular, given a Reddit user, their pre- determined suicide risk level ({`}Low{‘}, {`}Mod- erate{‘} or {`}High{‘}) and all of their posts in the r/SuicideWatch subreddit, we frame the task of identifying relevant pieces of text in their posts supporting their suicidal classification in two ways: (a) on the basis of evidence highlighting (extracting sub-phrases of the posts) and (b) on the basis of generating a summary of such evidence. We annotate a sample of 125 users and introduce evaluation metrics based on (a) BERTScore and (b) natural language inference for the two sub-tasks, respectively. Finally, we provide an overview of the system submissions and summarise the key findings.
@inproceedings{chim-etal-2024-overview,
title = "Overview of the {CLP}sych 2024 Shared Task: Leveraging Large Language Models to Identify Evidence of Suicidality Risk in Online Posts",
author = "Chim, Jenny and
Tsakalidis, Adam and
Gkoumas, Dimitris and
Atzil-Slonim, Dana and
Ophir, Yaakov and
Zirikly, Ayah and
Resnik, Philip and
Liakata, Maria",
editor = "Yates, Andrew and
Desmet, Bart and
Prud{'}hommeaux, Emily and
Zirikly, Ayah and
Bedrick, Steven and
MacAvaney, Sean and
Bar, Kfir and
Ireland, Molly and
Ophir, Yaakov",
booktitle = "Proceedings of the 9th Workshop on Computational Linguistics and Clinical Psychology (CLPsych 2024)",
month = mar,
year = "2024",
address = "St. Julians, Malta",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.clpsych-1.15",
pages = "177--190",
abstract = "We present the overview of the CLPsych 2024 Shared Task, focusing on leveraging open source Large Language Models (LLMs) for identifying textual evidence that supports the suicidal risk level of individuals on Reddit. In particular, given a Reddit user, their pre- determined suicide risk level ({`}Low{'}, {`}Mod- erate{'} or {`}High{'}) and all of their posts in the r/SuicideWatch subreddit, we frame the task of identifying relevant pieces of text in their posts supporting their suicidal classification in two ways: (a) on the basis of evidence highlighting (extracting sub-phrases of the posts) and (b) on the basis of generating a summary of such evidence. We annotate a sample of 125 users and introduce evaluation metrics based on (a) BERTScore and (b) natural language inference for the two sub-tasks, respectively. Finally, we provide an overview of the system submissions and summarise the key findings.",
}
Large Language Models (LLMs) may hallucinate and generate fake information, despite pre-training on factual data. Inspired by the journalistic device of {“}according to sources{”}, we propose according-to prompting: directing LLMs to ground responses against previously observed text. To quantify this grounding, we propose a novel evaluation metric (QUIP-Score) that measures the extent to which model-produced answers are directly found in underlying text corpora. We illustrate with experiments on three corpora (Wikipedia, PubMed, and the U.S. legal tax code) that these prompts improve grounding under our metrics, with the additional benefit of often improving end-task performance. Furthermore, prompts that ask the model to decrease grounding (or to ground to other corpora) indeed decrease QUIP-Score, indicating the ability of LLMs to increase or decrease grounded generations on request.
@inproceedings{weller-etal-2024-according,
title = "{``}According to . . . {''}: Prompting Language Models Improves Quoting from Pre-Training Data",
author = "Weller, Orion and
Marone, Marc and
Weir, Nathaniel and
Lawrie, Dawn and
Khashabi, Daniel and
Van Durme, Benjamin",
editor = "Graham, Yvette and
Purver, Matthew",
booktitle = "Proceedings of the 18th Conference of the European Chapter of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = mar,
year = "2024",
address = "St. Julian{'}s, Malta",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.eacl-long.140",
pages = "2288--2301",
abstract = "Large Language Models (LLMs) may hallucinate and generate fake information, despite pre-training on factual data. Inspired by the journalistic device of {``}according to sources{''}, we propose according-to prompting: directing LLMs to ground responses against previously observed text. To quantify this grounding, we propose a novel evaluation metric (QUIP-Score) that measures the extent to which model-produced answers are directly found in underlying text corpora. We illustrate with experiments on three corpora (Wikipedia, PubMed, and the U.S. legal tax code) that these prompts improve grounding under our metrics, with the additional benefit of often improving end-task performance. Furthermore, prompts that ask the model to decrease grounding (or to ground to other corpora) indeed decrease QUIP-Score, indicating the ability of LLMs to increase or decrease grounded generations on request.",
}
Using large language models (LMs) for query or document expansion can improve generalization in information retrieval. However, it is unknown whether these techniques are universally beneficial or only effective in specific settings, such as for particular retrieval models, dataset domains, or query types. To answer this, we conduct the first comprehensive analysis of LM-based expansion. We find that there exists a strong negative correlation between retriever performance and gains from expansion: expansion improves scores for weaker models, but generally harms stronger models. We show this trend holds across a set of eleven expansion techniques, twelve datasets with diverse distribution shifts, and twenty-four retrieval models. Through qualitative error analysis, we hypothesize that although expansions provide extra information (potentially improving recall), they add additional noise that makes it difficult to discern between the top relevant documents (thus introducing false positives). Our results suggest the following recipe: use expansions for weaker models or when the target dataset significantly differs from training corpus in format; otherwise, avoid expansions to keep the relevance signal clear.
@inproceedings{weller-etal-2024-generative,
title = "When do Generative Query and Document Expansions Fail? A Comprehensive Study Across Methods, Retrievers, and Datasets",
author = "Weller, Orion and
Lo, Kyle and
Wadden, David and
Lawrie, Dawn and
Van Durme, Benjamin and
Cohan, Arman and
Soldaini, Luca",
editor = "Graham, Yvette and
Purver, Matthew",
booktitle = "Findings of the Association for Computational Linguistics: EACL 2024",
month = mar,
year = "2024",
address = "St. Julian{'}s, Malta",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.findings-eacl.134",
pages = "1987--2003",
abstract = "Using large language models (LMs) for query or document expansion can improve generalization in information retrieval. However, it is unknown whether these techniques are universally beneficial or only effective in specific settings, such as for particular retrieval models, dataset domains, or query types. To answer this, we conduct the first comprehensive analysis of LM-based expansion. We find that there exists a strong negative correlation between retriever performance and gains from expansion: expansion improves scores for weaker models, but generally harms stronger models. We show this trend holds across a set of eleven expansion techniques, twelve datasets with diverse distribution shifts, and twenty-four retrieval models. Through qualitative error analysis, we hypothesize that although expansions provide extra information (potentially improving recall), they add additional noise that makes it difficult to discern between the top relevant documents (thus introducing false positives). Our results suggest the following recipe: use expansions for weaker models or when the target dataset significantly differs from training corpus in format; otherwise, avoid expansions to keep the relevance signal clear.",
}
Augmenting large language models (LLM) to use external tools enhances their performance across a variety of tasks. However, prior works over-rely on task-specific demonstration of tool use that limits their generalizability and computational cost due to making many calls to large-scale LLMs. We introduce GEAR, a computationally efficient query-tool grounding algorithm that is generalizable to various tasks that require tool use while not relying on task-specific demonstrations. GEAR achieves better efficiency by delegating tool grounding and execution to small language models (SLM) and LLM, respectively; while leveraging semantic and pattern-based evaluation at both question and answer levels for generalizable tool grounding. We evaluate GEAR on 14 datasets across 6 downstream tasks, demonstrating its strong generalizability to novel tasks, tools and different SLMs. Despite offering more efficiency, GEAR achieves higher precision in tool grounding compared to prior strategies using LLM prompting, thus improving downstream accuracy at a reduced computational cost. For example, we demonstrate that GEAR-augmented GPT-J and GPT-3 outperform counterpart tool-augmented baselines because of better tool use.
@inproceedings{lu-etal-2024-gear,
title = "{GEAR}: Augmenting Language Models with Generalizable and Efficient Tool Resolution",
author = "Lu, Yining and
Yu, Haoping and
Khashabi, Daniel",
editor = "Graham, Yvette and
Purver, Matthew",
booktitle = "Proceedings of the 18th Conference of the European Chapter of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = mar,
year = "2024",
address = "St. Julian{'}s, Malta",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.eacl-long.7",
pages = "112--138",
abstract = "Augmenting large language models (LLM) to use external tools enhances their performance across a variety of tasks. However, prior works over-rely on task-specific demonstration of tool use that limits their generalizability and computational cost due to making many calls to large-scale LLMs. We introduce GEAR, a computationally efficient query-tool grounding algorithm that is generalizable to various tasks that require tool use while not relying on task-specific demonstrations. GEAR achieves better efficiency by delegating tool grounding and execution to small language models (SLM) and LLM, respectively; while leveraging semantic and pattern-based evaluation at both question and answer levels for generalizable tool grounding. We evaluate GEAR on 14 datasets across 6 downstream tasks, demonstrating its strong generalizability to novel tasks, tools and different SLMs. Despite offering more efficiency, GEAR achieves higher precision in tool grounding compared to prior strategies using LLM prompting, thus improving downstream accuracy at a reduced computational cost. For example, we demonstrate that GEAR-augmented GPT-J and GPT-3 outperform counterpart tool-augmented baselines because of better tool use.",
}
Negation is a common everyday phenomena and has been a consistent area of weakness for language models (LMs). Although the Information Retrieval (IR) community has adopted LMs as the backbone of modern IR architectures, there has been little to no research in understanding how negation impacts neural IR. We therefore construct a straightforward benchmark on this theme: asking IR models to rank two documents that differ only by negation. We show that the results vary widely according to the type of IR architecture: cross-encoders perform best, followed by late-interaction models, and in last place are bi-encoder and sparse neural architectures. We find that most current information retrieval models do not consider negation, performing similarly or worse than randomly ranking. We show that although the obvious approach of continued fine-tuning on a dataset of contrastive documents containing negations increases performance (as does model size), there is still a large gap between machine and human performance.
@inproceedings{weller-etal-2024-nevir,
title = "{N}ev{IR}: Negation in Neural Information Retrieval",
author = "Weller, Orion and
Lawrie, Dawn and
Van Durme, Benjamin",
editor = "Graham, Yvette and
Purver, Matthew",
booktitle = "Proceedings of the 18th Conference of the European Chapter of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = mar,
year = "2024",
address = "St. Julian{'}s, Malta",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.eacl-long.139",
pages = "2274--2287",
abstract = "Negation is a common everyday phenomena and has been a consistent area of weakness for language models (LMs). Although the Information Retrieval (IR) community has adopted LMs as the backbone of modern IR architectures, there has been little to no research in understanding how negation impacts neural IR. We therefore construct a straightforward benchmark on this theme: asking IR models to rank two documents that differ only by negation. We show that the results vary widely according to the type of IR architecture: cross-encoders perform best, followed by late-interaction models, and in last place are bi-encoder and sparse neural architectures. We find that most current information retrieval models do not consider negation, performing similarly or worse than randomly ranking. We show that although the obvious approach of continued fine-tuning on a dataset of contrastive documents containing negations increases performance (as does model size), there is still a large gap between machine and human performance.",
}
Despite the impressive advancements achieved through vision-and-language pretraining, it remains unclear whether multi-modal learning can help understand each individual modality. In this work, we conduct a comparative analysis of the visual representations in existing vision-and-language models and vision-only models by probing on a broad range of tasks. Five probing tasks are evaluated in order to assess the quality of the learned representations in a nuanced manner. Our results on five probing tasks suggest vision-and-language models are better at label prediction tasks like object and attribute prediction, while vision-only models are stronger at dense prediction tasks that require more localized information. We hope our study sheds light on the role of language in visual learning, and serves as an empirical guide for various pretrained models.
@inproceedings{li-etal-2024-localization,
title = "Localization vs. Semantics: Visual Representations in Unimodal and Multimodal Models",
author = "Li, Zhuowan and
Xie, Cihang and
Van Durme, Benjamin and
Yuille, Alan",
editor = "Graham, Yvette and
Purver, Matthew",
booktitle = "Proceedings of the 18th Conference of the European Chapter of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = mar,
year = "2024",
address = "St. Julian{'}s, Malta",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.eacl-long.146",
pages = "2378--2390",
abstract = "Despite the impressive advancements achieved through vision-and-language pretraining, it remains unclear whether multi-modal learning can help understand each individual modality. In this work, we conduct a comparative analysis of the visual representations in existing vision-and-language models and vision-only models by probing on a broad range of tasks. Five probing tasks are evaluated in order to assess the quality of the learned representations in a nuanced manner. Our results on five probing tasks suggest vision-and-language models are better at label prediction tasks like object and attribute prediction, while vision-only models are stronger at dense prediction tasks that require more localized information. We hope our study sheds light on the role of language in visual learning, and serves as an empirical guide for various pretrained models.",
}
Recent work in open-domain question answering (ODQA) has shown that adversarial poisoning of the search collection can cause large drops in accuracy for production systems. However, little to no work has proposed methods to defend against these attacks. To do so, we rely on the intuition that redundant information often exists in large corpora. To find it, we introduce a method that uses query augmentation to search for a diverse set of passages that could answer the original question but are less likely to have been poisoned. We integrate these new passages into the model through the design of a novel confidence method, comparing the predicted answer to its appearance in the retrieved contexts (what we call Confidence from Answer Redundancy, i.e. CAR). Together these methods allow for a simple but effective way to defend against poisoning attacks that provides gains of nearly 20{\%} exact match across varying levels of data poisoning/knowledge conflicts.
@inproceedings{weller-etal-2024-defending,
title = "Defending Against Disinformation Attacks in Open-Domain Question Answering",
author = "Weller, Orion and
Khan, Aleem and
Weir, Nathaniel and
Lawrie, Dawn and
Van Durme, Benjamin",
editor = "Graham, Yvette and
Purver, Matthew",
booktitle = "Proceedings of the 18th Conference of the European Chapter of the Association for Computational Linguistics (Volume 2: Short Papers)",
month = mar,
year = "2024",
address = "St. Julian{'}s, Malta",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.eacl-short.35",
pages = "402--417",
abstract = "Recent work in open-domain question answering (ODQA) has shown that adversarial poisoning of the search collection can cause large drops in accuracy for production systems. However, little to no work has proposed methods to defend against these attacks. To do so, we rely on the intuition that redundant information often exists in large corpora. To find it, we introduce a method that uses query augmentation to search for a diverse set of passages that could answer the original question but are less likely to have been poisoned. We integrate these new passages into the model through the design of a novel confidence method, comparing the predicted answer to its appearance in the retrieved contexts (what we call Confidence from Answer Redundancy, i.e. CAR). Together these methods allow for a simple but effective way to defend against poisoning attacks that provides gains of nearly 20{\%} exact match across varying levels of data poisoning/knowledge conflicts.",
}
@inproceedings{268987627,
title = {Verifiable by Design: Aligning Language Models to Quote from Pre-Training Data},
author = {{Jingyu (Jack) Zhang} and {Marc Marone} and {Tianjian Li} and {Benjamin Van Durme} and {Daniel Khashabi}},
year = 2024,
month = {4},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/9689b5fdb0d3a1bad802d03d348bd32aa5a4c2df},
}
We introduce MultiMUC, the first multilingual parallel corpus for template filling, comprising translations of the classic MUC-4 template filling benchmark into five languages: Arabic, Chinese, Farsi, Korean, and Russian. We obtain automatic translations from a strong multilingual machine translation system and manually project the original English annotations into each target language. For all languages, we also provide human translations for key portions of the dev and test splits. Finally, we present baselines on MultiMUC both with state-of-the-art template filling models for MUC-4 and with ChatGPT. We release MUC-4 and the supervised baselines to facilitate further work on document-level information extraction in multilingual settings.
@inproceedings{gantt-etal-2024-multimuc,
title = "{M}ulti{MUC}: Multilingual Template Filling on {MUC}-4",
author = "Gantt, William and
Behzad, Shabnam and
An, Hannah and
Chen, Yunmo and
White, Aaron and
Van Durme, Benjamin and
Yarmohammadi, Mahsa",
editor = "Graham, Yvette and
Purver, Matthew",
booktitle = "Proceedings of the 18th Conference of the European Chapter of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = mar,
year = "2024",
address = "St. Julian{'}s, Malta",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.eacl-long.21",
pages = "349--368",
abstract = "We introduce MultiMUC, the first multilingual parallel corpus for template filling, comprising translations of the classic MUC-4 template filling benchmark into five languages: Arabic, Chinese, Farsi, Korean, and Russian. We obtain automatic translations from a strong multilingual machine translation system and manually project the original English annotations into each target language. For all languages, we also provide human translations for key portions of the dev and test splits. Finally, we present baselines on MultiMUC both with state-of-the-art template filling models for MUC-4 and with ChatGPT. We release MUC-4 and the supervised baselines to facilitate further work on document-level information extraction in multilingual settings.",
}
@inproceedings{272654115,
title = {Explainable Metrics for the Assessment of Neurodegenerative Diseases through Handwriting Analysis},
author = {{Thomas Thebaud} and {A. Favaro} and {Casey Chen} and {Gabrielle Chavez} and {L. Moro-Velázquez} and {A. Butala} and {N. Dehak}},
year = 2024,
month = {9},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/c8851ccf781b66eb487ca7a77784baf168d9ef23},
}
@inproceedings{273770555,
title = {The SHADOW team submission to the ASVSpoof 2024 Challenge},
author = {{J. Villalba} and {Tiantian Feng} and {Thomas Thebaud} and {Jihwan Lee} and {Shrikanth S. Narayanan} and {N. Dehak}},
year = 2024,
month = {8},
booktitle = {The Automatic Speaker Verification Spoofing Countermeasures Workshop (ASVspoof 2024)},
url = {https://www.semanticscholar.org/paper/20ab192366ccf71e3d1feda7c8b040030d58266f},
}
@inproceedings{272236956,
title = {Trends in Glucagon-Like Peptide-1 Receptor Agonist Social Media Posts Using Artificial Intelligence},
author = {{Aamir Javaid} and {Sruthika Baviriseaty} and {Rehan Javaid} and {Ayah Zirikly} and {Harshita Kukreja} and {Chang H. Kim} and {Michael J. Blaha} and {Roger S. Blumenthal} and {Seth S. Martin} and {F. Marvel}},
year = 2024,
month = {8},
booktitle = {JACC: Advances},
url = {https://www.semanticscholar.org/paper/fa5702a10f5b9b5d53cd7e82e06658bfde95c77f},
}
@inproceedings{272694526,
title = {EzAudio: Enhancing Text-to-Audio Generation with Efficient Diffusion Transformer},
author = {{Jiarui Hai} and {Yong Xu} and {Hao Zhang} and {Chenxing Li} and {Helin Wang} and {Mounya Elhilali} and {Dong Yu}},
year = 2024,
month = {9},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/8e146956594a7580148dad5ccdb2c0c791abd386},
}
@inproceedings{269005582,
title = {SELF-[IN]CORRECT: LLMs Struggle with Refining Self-Generated Responses},
author = {{Dongwei Jiang} and {Jingyu (Jack) Zhang} and {Orion Weller} and {Nathaniel Weir} and {Benjamin Van Durme} and {Daniel Khashabi}},
year = 2024,
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/9e3d14e4697a325fcabc6d952232a3ad7e9fa809},
}
@inproceedings{268063486,
title = {RORA: Robust Free-Text Rationale Evaluation},
author = {{Zhengping Jiang} and {Yining Lu} and {Hanjie Chen} and {Daniel Khashabi} and {Benjamin Van Durme} and {Anqi Liu}},
year = 2024,
month = {2},
booktitle = {Annual Meeting of the Association for Computational Linguistics},
url = {https://www.semanticscholar.org/paper/17ba73a2a332a44bb1a00622beab96f33d4b1ba7},
}
@inproceedings{268527006,
title = {Biomimetic Mappings for Active Sonar Object Recognition in Clutter},
author = {{Sangwook Park} and {Angeles Salles} and {Kathryne Allen} and {Cynthia Moss} and {Mounya Elhilali}},
year = 2024,
month = {4},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/aba6e97d493b8b593eac929b49ee8d1c7bf9c953},
}
@inproceedings{272087268,
title = {Time Scale Network: An Efficient Shallow Neural Network For Time Series Data in Biomedical Applications},
author = {{Trevor Meyer} and {Camden Shultz} and {N. Dehak} and {L. Moro-Velázquez} and {Pedro P. Irazoqui}},
year = 2024,
booktitle = {IEEE Journal on Selected Topics in Signal Processing},
url = {https://www.semanticscholar.org/paper/4e2f72bf6970fdbafb922f26d80b1d5626fa6939},
}
@inproceedings{267028540,
title = {Contrastive Preference Optimization: Pushing the Boundaries of LLM Performance in Machine Translation},
author = {{Haoran Xu} and {Amr Sharaf} and {Yunmo Chen} and {Weiting Tan} and {Lingfeng Shen} and {Benjamin Van Durme} and {Kenton Murray} and {Young Jin Kim}},
year = 2024,
month = {1},
booktitle = {International Conference on Machine Learning},
url = {https://www.semanticscholar.org/paper/ebd1c04c61f73f46def3305ca11d038c46665b65},
}
@inproceedings{271093594,
title = {Rel-A.I.: An Interaction-Centered Approach To Measuring Human-LM Reliance},
author = {{Kaitlyn Zhou} and {Jena D. Hwang} and {Xiang Ren} and {Nouha Dziri} and {Dan Jurafsky} and {Maarten Sap} and {Epistemic Marker} and {Sebastian Schuster} and {Judith Degen. 2019} and {Aarohi Srivastava} and {Abhinav Rastogi} and {Abhishek Rao} and {Abu Awal} and {Md. Shoeb} and {Abubakar Abid} and {Adam Fisch} and {Adam R. Brown} and {Adam Santoro} and {Aditya Gupta} and {Adrià Garriga-Alonso} and {Agnieszka Kluska} and {Aitor Lewkowycz} and {Akshat Agarwal} and {Alethea Power} and {Alex Ray} and {Alex Warstadt} and {Alexander W. Kocurek} and {Ali Safaya} and {Ali Tazarv} and {Alice Xiang} and {Alicia Parrish} and {Allen Nie} and {Aman Hussain} and {Amanda Askell} and {Amanda Dsouza} and {Ameet Ambrose Slone} and {Annasaheb Rahane} and {Anantharaman S. Iyer} and {Anders Andreassen} and {Andrea Madotto} and {A. Santilli} and {Andreas Stuhlmuller} and {Andrew M. Dai} and {Andrew La} and {Andrew K. Lampinen} and {Andy Zou} and {Angela Jiang} and {Angelica Chen} and {Anh Vuong} and {Animesh Gupta} and {Anna Gottardi} and {Antonio Norelli} and {Anu Venkatesh} and {Arash Gholamidavoodi} and {A. Tabassum} and {Arul Menezes} and {Arun Kirubarajan} and {A. Mullokandov} and {Ashish Sabharwal} and {Austin Herrick} and {Avia Efrat} and {Aykut Erdem} and {Ayla Karakacs} and {Ryan Roberts} and {B. S. Loe} and {Barret Zoph} and {Bartlomiej Bojanowski} and {Batuhan Ozyurt} and {Behnam Hedayatnia} and {Behnam Neyshabur} and {Benjamin Inden} and {Benno Stein} and {Berk Ekmekci} and {Bill Yuchen} and {B. Lin} and {Bryan Howald} and {Orinion Cameron} and {Cameron Diao} and {Catherine Dour} and {Stinson Cedrick} and {Argueta} and {C’esar Ferri} and {C. Ram’irez} and {Charles Singh} and {Chenlin Rathkopf} and {Chitta Meng} and {Chiyu Baral} and {Chris Wu} and {Christopher Callison-Burch} and {Christian Waites} and {Christian Voigt} and {Manning Christopher} and {Cindy Potts} and {Clara Ramirez} and {Rivera Clemencia} and {Colin Siro} and {Courtney Raffel} and {Ashcraft Cristina} and {Damien Garbacea} and {Dan Sileo} and {Daniel H Garrette} and {Dan Hendrycks} and {D. Kilman} and {Roth Daniel} and {Daniel Freeman} and {Daniel Khashabi} and {Levy Daniel} and {Danielle R Mosegu’i Gonz’alez} and {Perszyk Danny} and {Danqi Hernandez} and {Daphne Chen} and {Ippolito Dar} and {D. Gilboa} and {David Dohan} and {D. Drakard} and {Debajyoti Jurgens} and {Deep Datta} and {Denis Ganguli} and {Denis Emelin} and {D. Kleyko} and {Derek Yuret} and {Chen Derek} and {Dieuwke Tam} and {Diganta Hupkes} and {Dilyar Misra} and {Dimitri Coelho Buzan} and {Diyi Mollo} and {Dong-Ho Yang} and {Dylan Lee} and {Ekaterina Schrader} and {Ekin Dogus Shutova} and {Elad Cubuk} and {Eleanor Segal} and {Elizabeth Hagerman} and {Elizabeth Barnes} and {E. Donoway} and {Pavlick Emanuele} and {E. Rodolà} and {Eric Lam} and {Eric Chu} and {Tang Erkut} and {Ernie Erdem} and {Ethan A Chang} and {Ethan A. Chi} and {J. DyerEthan} and {E. Jerzak} and {Eunice Engefu Kim} and {Manyasi Evgenii} and {Fanyue Zheltonozhskii} and {Fatemeh Xia} and {Siar Fernando} and {Francesca Mart’inez-Plumed} and {Happ’e François} and {Frieda Chollet} and {Gaurav Rong} and {Mishra} and {Genta Indra} and {Gerard Winata} and {Germán de Melo} and {Giambattista Kruszewski} and {Giorgio Parascandolo} and {Gloria Mariani} and {Gonzalo Wang} and {Jaimovitch-L’opez Gregor} and {Guy Betz} and {Hana Gur-Ari} and {Galijasevic Hannah} and {Hannah Kim} and {Hannaneh Rashkin} and {Hajishirzi Harsh} and {Hayden Mehta} and {Henry Bogar} and {Shevlin Hinrich} and {Hiromu Schutze} and {Hongming Yakura} and {Zhang Hugh Mee} and {Ian Wong} and {Isaac Ng} and {Jaap Noble} and {Jumelet Jack} and {Jack Geissinger} and {Jacob Kernion} and {Jaehoon Hilton} and {Jaime Fernández Lee} and {James B Fisac} and {James B. Simon} and {James Koppel} and {James Zheng} and {Jan Zou} and {Koco’n Jana} and {Janelle Thompson} and {Jared Wingfield} and {Kaplan Jarema} and {Radom} and {Jascha Narain} and {Jason Sohl-Dickstein} and {Jason Phang} and {Jason Wei} and {Jekaterina Yosinski} and {Jelle Novikova} and {Jennifer Bosscher} and {Jeremy Marsh} and {Jeroen Kim} and {Jesse Taal} and {Jesujoba Engel} and {Oluwadara} and {K. Kanclerz} and {Karl Livescu} and {Karthik Krauth} and {Katerina Gopalakrishnan} and {Katja Ignatyeva} and {D. MarkertKaustubh} and {Kevin Dhole} and {Kevin Gimpel} and {Omondi Kory Wallace} and {Kristen Mathewson} and {Ksenia Chiafullo} and {Kumar Shkaruta} and {Kyle Shridhar} and {Kyle McDonell} and {Laria Richardson} and {Leo Reynolds} and {Li Gao} and {Zhang Liam} and {Lianhui Dugan} and {Lidia Qin} and {Contreras-Ochando} and {Luke Metz} and {Lutfi Kerem} and {Maarten Sap Maartje ter Hoeve Maarten Bosma} and {Maheen Farooqi} and {Manaal Faruqui} and {Mantas Mazeika} and {Marco Baturan} and {Marco Marelli} and {Marco Maru} and {Maria Jose Ram’irez Quintana} and {M. Tolkiehn} and {Mario Giulianelli} and {Martha Lewis} and {Martin Potthast} and {Matthew L. Leavitt} and {Matthias Hagen} and {Medina M’aty’as Schubert} and {Melody Baitemirova} and {Melvin Andrew Arnaud} and {Michael A McElrath} and {Yee Michael} and {Michael Cohen} and {Michael Gu} and {Michael Ivanitskiy} and {Michael Starritt} and {M. Strube} and {Michele Swkedrowski} and {Michihiro Bevilacqua} and {Mihir Yasunaga} and {Mike Kale} and {Mimee Cain} and {Xu Mirac} and {Mitch Suzgun} and {Monica Walker} and {Mohit Tiwari} and {Moin Bansal} and {Mor Aminnaseri} and {Mozhdeh Geva} and {T. Gheini} and {Nanyun MukundVarma} and {Nathan A Peng} and {Nayeon Chi} and {Neta Lee} and {Gur-Ari} and {Nicholas Krakover} and {Nicholas Cameron} and {Nicholas Roberts} and {Nicole Doiron} and {Nikita Martinez} and {Niklas Nangia} and {Niklas Deckers} and {Muennighoff} and {Nitish Shirish} and {Niveditha Keskar} and {Iyer Noah} and {Noah Constant} and {Nuan Fiedel} and {Oliver Wen} and {Omar Zhang} and {Omar Agha} and {Omer Elbaghdadi} and {Levy Owain} and {Pablo Evans} and {Antonio Moreno} and {Parth Casares} and {Pascale Doshi} and {Paul Pu Fung} and {P. Liang} and {Vicol Pegah} and {Peiyuan Alipoormolabashi} and {Percy Liao} and {Liang Peter} and {Peter Chang} and {Phu Mon Eckersley} and {Pi-Bei Htut} and {P. Hwang} and {Piyush S Milkowski} and {Pouya Patil} and {Priti Pezeshkpour} and {Qiaozhu Oli} and {Qing Mei} and {Lyu Qinlang} and {Rabin Chen} and {Rachel Etta Banjade} and {Rudolph Raefer} and {Rahel Gabriel} and {Ramon Habacker} and {Risco Raphael} and {Rhythm Milliere} and {Richard Garg} and {A. BarnesRif} and {Riku Saurous} and {Robbe Arakawa} and {Raymaekers Robert} and {Rohan Frank} and {Roman Sikand} and {Roman Novak} and {Ronan Sitelew} and {Rosanne Lebras} and {Rowan Liu} and {Jacobs Rui} and {Ruslan Zhang} and {Ryan Salakhutdinov} and {Ryan Chi} and {Ryan Lee} and {Ryan Stovall} and {Rylan Teehan} and {Sahib Yang} and {Saif M Singh} and {Sajant Mohammad} and {Sam Anand} and {Sam Dillavou} and {Sam Shleifer} and {Samuel Wiseman} and {Samuel Gruetter} and {Sam Bowman} and {Schoenholz Sanghyun} and {Sanjeev Han} and {Sarah A Kwatra} and {Rous Sarik} and {Sayan Ghazarian} and {Sean Ghosh} and {Casey Sebastian} and {Sebastian Bischoff} and {Sebastian Gehrmann} and {Sepideh Schuster} and {Shadi S Sadeghi} and {Hamdan}},
year = 2024,
month = {7},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/1d370b8b475603a44b4babcee622362aa4579f87},
}
Johns Hopkins University (JHU) submitted systems for all eight language pairs in the 2024 Low-Resource Language Track. The main effort of this work revolves around fine-tuning large and publicly available models in three proposed systems: i) end-to-end speech translation (ST) fine-tuning of Seamless4MT v2; ii) ST fine-tuning of Whisper; iii) a cascaded system involving automatic speech recognition with fine-tuned Whisper and machine translation with NLLB. On top of systems above, we conduct a comparative analysis on different training paradigms, such as intra-distillation for NLLB as well as joint training and curriculum learning for SeamlessM4T v2. Our results show that the best-performing approach differs by language pairs, but that i) fine-tuned SeamlessM4T v2 tends to perform best for source languages on which it was pre-trained, ii) multi-task training helps Whisper fine-tuning, iii) cascaded systems with Whisper and NLLB tend to outperform Whisper alone, and iv) intra-distillation helps NLLB fine-tuning.
@inproceedings{romney-robinson-etal-2024-jhu,
title = "{JHU} {IWSLT} 2024 Dialectal and Low-resource System Description",
author = "Romney Robinson, Nathaniel and
Sun, Kaiser and
Xiao, Cihan and
Bafna, Niyati and
Tan, Weiting and
Xu, Haoran and
Li Xinyuan, Henry and
Kejriwal, Ankur and
Khudanpur, Sanjeev and
Murray, Kenton and
McNamee, Paul",
editor = "Salesky, Elizabeth and
Federico, Marcello and
Carpuat, Marine",
booktitle = "Proceedings of the 21st International Conference on Spoken Language Translation (IWSLT 2024)",
month = aug,
year = "2024",
address = "Bangkok, Thailand (in-person and online)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.iwslt-1.19",
doi = "10.18653/v1/2024.iwslt-1.19",
pages = "140--153",
abstract = "Johns Hopkins University (JHU) submitted systems for all eight language pairs in the 2024 Low-Resource Language Track. The main effort of this work revolves around fine-tuning large and publicly available models in three proposed systems: i) end-to-end speech translation (ST) fine-tuning of Seamless4MT v2; ii) ST fine-tuning of Whisper; iii) a cascaded system involving automatic speech recognition with fine-tuned Whisper and machine translation with NLLB. On top of systems above, we conduct a comparative analysis on different training paradigms, such as intra-distillation for NLLB as well as joint training and curriculum learning for SeamlessM4T v2. Our results show that the best-performing approach differs by language pairs, but that i) fine-tuned SeamlessM4T v2 tends to perform best for source languages on which it was pre-trained, ii) multi-task training helps Whisper fine-tuning, iii) cascaded systems with Whisper and NLLB tend to outperform Whisper alone, and iv) intra-distillation helps NLLB fine-tuning.",
}
@inproceedings{269031228,
title = {Predicting pressure injury risk in hospitalised patients using machine learning with electronic health records: a US multilevel cohort study},
author = {{William V Padula} and {David G. Armstrong} and {Peter J Pronovost} and {S. Saria}},
year = 2024,
month = {4},
booktitle = {BMJ Open},
url = {https://www.semanticscholar.org/paper/d44b54dab53950fcd81592d3b9181c1aa8c4d73b},
}
@inproceedings{272345914,
title = {Exploring the Complementary Nature of Speech and Eye Movements for Profiling Neurological Disorders},
author = {{Yuzhe Wang} and {A. Favaro} and {Thomas Thebaud} and {J. Villalba} and {N. Dehak} and {L. Moro-Velázquez}},
year = 2024,
month = {9},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/06c6bbd302ec67def5ccd2df13d8563e2d4a5e31},
}
@inproceedings{267781862,
title = {Large language models for science and medicine},
author = {{Amalio Telenti} and {Michael Auli} and {B. Hie} and {Cyrus Maher} and {S. Saria} and {J. P. Ioannidis}},
year = 2024,
month = {2},
booktitle = {European Journal of Clinical Investigation},
url = {https://www.semanticscholar.org/paper/6dcb9cb40c948aa6033c0ae2228542c14acf0ff7},
}
@inproceedings{271211023,
title = {A Phonetic Analysis of Speaker Verification Systems through Phoneme selection and Integrated Gradients},
author = {{Thomas Thebaud} and {Gabriel Hernández} and {Sarah Flora Samson Juan} and {Marie Tahon}},
year = 2024,
month = {6},
booktitle = {The Speaker and Language Recognition Workshop},
url = {https://www.semanticscholar.org/paper/098e0d7c2f273bc052a74f1bd91db8cf2b57cd1f},
}
A majority of language technologies are tailored for a small number of high-resource languages, while relatively many low-resource languages are neglected. One such group, Creole languages, have long been marginalized in academic study, though their speakers could benefit from machine translation (MT). These languages are predominantly used in much of Latin America, Africa and the Caribbean. We present the largest cumulative dataset to date for Creole language MT, including 14.5M unique Creole sentences with parallel translations{–-}11.6M of which we release publicly, and the largest bitexts gathered to date for 41 languages{–-}the first ever for 21. In addition, we provide MT models supporting all 41 Creole languages in 172 translation directions. Given our diverse dataset, we produce a model for Creole language MT exposed to more genre diversity then ever before, which outperforms a genre-specific Creole MT model on its own benchmark for 23 of 34 translation directions.
@inproceedings{robinson-etal-2024-kreyol,
title = "Krey{\`o}l-{MT}: Building {MT} for {L}atin {A}merican, {C}aribbean and Colonial {A}frican Creole Languages",
author = {Robinson, Nathaniel and
Dabre, Raj and
Shurtz, Ammon and
Dent, Rasul and
Onesi, Onenamiyi and
Monroc, Claire and
Grobol, Lo{\"\i}c and
Muhammad, Hasan and
Garg, Ashi and
Etori, Naome and
Tiyyala, Vijay Murari and
Samuel, Olanrewaju and
Stutzman, Matthew and
Odoom, Bismarck and
Khudanpur, Sanjeev and
Richardson, Stephen and
Murray, Kenton},
editor = "Duh, Kevin and
Gomez, Helena and
Bethard, Steven",
booktitle = "Proceedings of the 2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers)",
month = jun,
year = "2024",
address = "Mexico City, Mexico",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.naacl-long.170",
doi = "10.18653/v1/2024.naacl-long.170",
pages = "3083--3110",
abstract = "A majority of language technologies are tailored for a small number of high-resource languages, while relatively many low-resource languages are neglected. One such group, Creole languages, have long been marginalized in academic study, though their speakers could benefit from machine translation (MT). These languages are predominantly used in much of Latin America, Africa and the Caribbean. We present the largest cumulative dataset to date for Creole language MT, including 14.5M unique Creole sentences with parallel translations{---}11.6M of which we release publicly, and the largest bitexts gathered to date for 41 languages{---}the first ever for 21. In addition, we provide MT models supporting all 41 Creole languages in 172 translation directions. Given our diverse dataset, we produce a model for Creole language MT exposed to more genre diversity then ever before, which outperforms a genre-specific Creole MT model on its own benchmark for 23 of 34 translation directions.",
}
@inproceedings{267144330,
title = {Slowness Regularized Contrastive Predictive Coding for Acoustic Unit Discovery},
author = {{Saurabhchand Bhati} and {J. Villalba} and {Piotr Żelasko} and {L. Moro-Velázquez} and {N. Dehak}},
year = 2024,
booktitle = {IEEE/ACM Transactions on Audio Speech and Language Processing},
url = {https://www.semanticscholar.org/paper/1748de2018438a1015f557ed72424602b144f5ba},
}
@inproceedings{268264353,
title = {LLMs in the Imaginarium: Tool Learning through Simulated Trial and Error},
author = {{Boshi Wang} and {Hao Fang} and {Jason Eisner} and {Benjamin Van Durme} and {Yu Su}},
year = 2024,
month = {3},
booktitle = {Annual Meeting of the Association for Computational Linguistics},
url = {https://www.semanticscholar.org/paper/ae4635297ad87fcb3ec4105a51b5cbcb4075e5e2},
}
@inproceedings{271745819,
title = {The Trickle-down Impact of Reward Inconsistency on RLHF},
author = {{Lingfeng Shen} and {Sihao Chen} and {Linfeng Song} and {Lifeng Jin} and {Baolin Peng} and {Haitao Mi} and {Daniel Khashabi} and {Dong Yu}},
year = 2024,
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/1eecfd21543286d45ca44e424a2e351d1ee6ab12},
}
@inproceedings{268531479,
title = {Dated Data: Tracing Knowledge Cutoffs in Large Language Models},
author = {{Jeffrey Cheng} and {Marc Marone} and {Orion Weller} and {Dawn Lawrie} and {Daniel Khashabi} and {Benjamin Van Durme}},
year = 2024,
month = {3},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/5ee0c8975b965a413b27332b5cbfb2745251dc52},
}
@inproceedings{268532373,
title = {FaceXFormer: A Unified Transformer for Facial Analysis},
author = {{Kartik Narayan} and {VS Vibashan} and {R. Chellappa} and {Vishal M. Patel}},
year = 2024,
month = {3},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/cf9ea0a2ae56bce6d2fdbc9f81633ef8ce9df59c},
}
@inproceedings{267200158,
title = {The Language Barrier: Dissecting Safety Challenges of LLMs in Multilingual Contexts},
author = {{Lingfeng Shen} and {Weiting Tan} and {Sihao Chen} and {Yunmo Chen} and {Jingyu (Jack) Zhang} and {Haoran Xu} and {Boyuan Zheng} and {Philipp Koehn} and {Daniel Khashabi}},
year = 2024,
month = {1},
booktitle = {Annual Meeting of the Association for Computational Linguistics},
url = {https://www.semanticscholar.org/paper/3cd81b0123b5f8477f6b5777681030ef6b05dd46},
}
@inproceedings{272653876,
title = {Clean Label Attacks against SLU Systems},
author = {{Henry Li Xinyuan} and {Sonal Joshi} and {Thomas Thebaud} and {J. Villalba} and {N. Dehak} and {S. Khudanpur}},
year = 2024,
month = {9},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/4196ee966cae649605415e0069dd9e830545f9fe},
}
@inproceedings{272332095,
title = {Evaluating the Santa Barbara Corpus: Challenges of the Breadth of Conversational Spoken Language},
author = {{Matthew Maciejewski} and {Dominik Klement} and {Ruizhe Huang} and {Matthew Wiesner} and {S. Khudanpur}},
year = 2024,
month = {9},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/01da401eabaca52dccc642ec6d25fb5170e0538b},
}
@inproceedings{272357972,
title = {Enhancing Neural Transducer for Multilingual ASR with Synchronized Language Diarization},
author = {{Amir Hussein} and {Desh Raj} and {Matthew Wiesner} and {Dan Povey} and {Paola Garcia} and {S. Khudanpur}},
year = 2024,
month = {9},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/8f6b595c7e09a7bec11726e8e1520c3eb693fec4},
}
@inproceedings{271162279,
title = {Benchmarking Language Model Creativity: A Case Study on Code Generation},
author = {{Yining Lu} and {Dixuan Wang} and {Tianjian Li} and {Dongwei Jiang} and {Daniel Khashabi}},
year = 2024,
month = {7},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/20be3ba3f361d9630cc0c17442a0d0132873e63d},
}
While large language models exhibit certain cross-lingual generalization capabilities, they suffer from performance degradation (PD) on unseen closely-related languages (CRLs) and dialects relative to their high-resource language neighbour (HRLN). However, we currently lack a fundamental understanding of what kinds of linguistic distances contribute to PD, and to what extent. Furthermore, studies of cross-lingual generalization are confounded by unknown quantities of CRL language traces in the training data, and by the frequent lack of availability of evaluation data in lower-resource related languages and dialects. To address these issues, we model phonological, morphological, and lexical distance as Bayesian noise processes to synthesize artificial languages that are controllably distant from the HRLN. We analyse PD as a function of underlying noise parameters, offering insights on model robustness to isolated and composed linguistic phenomena, and the impact of task and HRL characteristics on PD. We calculate parameter posteriors on real CRL-HRLN pair data and show that they follow computed trends of artificial languages, demonstrating the viability of our noisers. Our framework offers a cheap solution for estimating task performance on an unseen CRL given HRLN performance using its posteriors, as well as for diagnosing observed PD on a CRL in terms of its linguistic distances from its HRLN, and opens doors to principled methods of mitigating performance degradation.
@inproceedings{bafna-etal-2024-evaluating,
title = "Evaluating Large Language Models along Dimensions of Language Variation: A Systematik Invesdigatiom uv Cross-lingual Generalization",
author = "Bafna, Niyati and
Murray, Kenton and
Yarowsky, David",
editor = "Al-Onaizan, Yaser and
Bansal, Mohit and
Chen, Yun-Nung",
booktitle = "Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing",
month = nov,
year = "2024",
address = "Miami, Florida, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2024.emnlp-main.1044",
doi = "10.18653/v1/2024.emnlp-main.1044",
pages = "18742--18762",
abstract = "While large language models exhibit certain cross-lingual generalization capabilities, they suffer from performance degradation (PD) on unseen closely-related languages (CRLs) and dialects relative to their high-resource language neighbour (HRLN). However, we currently lack a fundamental understanding of what kinds of linguistic distances contribute to PD, and to what extent. Furthermore, studies of cross-lingual generalization are confounded by unknown quantities of CRL language traces in the training data, and by the frequent lack of availability of evaluation data in lower-resource related languages and dialects. To address these issues, we model phonological, morphological, and lexical distance as Bayesian noise processes to synthesize artificial languages that are controllably distant from the HRLN. We analyse PD as a function of underlying noise parameters, offering insights on model robustness to isolated and composed linguistic phenomena, and the impact of task and HRL characteristics on PD. We calculate parameter posteriors on real CRL-HRLN pair data and show that they follow computed trends of artificial languages, demonstrating the viability of our noisers. Our framework offers a cheap solution for estimating task performance on an unseen CRL given HRLN performance using its posteriors, as well as for diagnosing observed PD on a CRL in terms of its linguistic distances from its HRLN, and opens doors to principled methods of mitigating performance degradation.",
}
@inproceedings{270845380,
title = {Efficient Large Multi-modal Models via Visual Context Compression},
author = {{Jieneng Chen} and {Luoxin Ye} and {Ju He} and {Zhao-Yang Wang} and {Daniel Khashabi} and {Alan L. Yuille}},
year = 2024,
month = {6},
booktitle = {},
url = {https://www.semanticscholar.org/paper/227c2f542f7848c16af712ea417ea2177a6450b9},
}
@inproceedings{267413013,
title = {FuseMoE: Mixture-of-Experts Transformers for Fleximodal Fusion},
author = {{Xing Han} and {Huy Nguyen} and {C. Harris} and {Nhat Ho} and {S. Saria}},
year = 2024,
month = {2},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/f71ea9673be9c7a76d0fa6695a5713f150b64304},
}
@inproceedings{270688653,
title = {Insights into LLM Long-Context Failures: When Transformers Know but Don't Tell},
author = {{Taiming Lu} and {Muhan Gao} and {Kuai Yu} and {Adam Byerly} and {Daniel Khashabi}},
year = 2024,
month = {6},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/2138841e6e5ecf59d881a0108e0d9551484cfe32},
}
@inproceedings{270702574,
title = {DreamVoice: Text-Guided Voice Conversion},
author = {{Jiarui Hai} and {Karan Thakkar} and {Helin Wang} and {Zengyi Qin} and {Mounya Elhilali}},
year = 2024,
month = {6},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/fe5cccd11f8cdcfa6584b25b3762d06253bdd813},
}
@inproceedings{267522236,
title = {Artificial Intelligence and Technology Collaboratories: Innovating aging research and Alzheimer's care},
author = {{Peter M Abadir} and {Esther S Oh} and {Rama Chellappa} and {N. Choudhry} and {George Demiris} and {Deepak Ganesan} and {Jason Karlawish} and {Benjamin M. Marlin} and {Rose M Li} and {N. Dehak} and {Alicia Arbaje} and {Mathias Unberath} and {Thomas K. M. Cudjoe} and {Christopher Chute} and {Jason H Moore} and {Phillip Phan} and {Quincy M. Samus} and {Nancy L. Schoenborn} and {Alexis Battle} and {Jeremy D Walston}},
year = 2024,
month = {2},
booktitle = {Alzheimer's & Dementia},
url = {https://www.semanticscholar.org/paper/893d9dc2d86b71e3ba67490decd96f91954e47ce},
}
@inproceedings{272600353,
title = {SSR-Speech: Towards Stable, Safe and Robust Zero-shot Text-based Speech Editing and Synthesis},
author = {{Helin Wang} and {Meng Yu} and {Jiarui Hai} and {Chen Chen} and {Yuchen Hu} and {Rilin Chen} and {N. Dehak} and {Dong Yu}},
year = 2024,
month = {9},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/a96b6a7d9d8146cb28643672a5013fec19ad4cbb},
}
@inproceedings{271894946,
title = {Ask Again, Then Fail: Large Language Models’ Vacillations in Judgment},
author = {{Qiming Xie} and {Zengzhi Wang} and {Yihao Feng} and {Rui Xia} and {Neel Guha} and {Tatsunori Hashimoto} and {Peter Henderson} and {John Hewitt} and {Daniel E. Ho} and {Jenny Hong} and {Kyle Hsu} and {Jing Huang} and {Thomas Icard} and {Saahil Jain} and {Dan Juraf-sky} and {Pratyusha Kalluri} and {Siddharth Karamcheti} and {Geoff Keeling} and {Fereshte Khani} and {Pang Omar Khattab} and {Wei Koh} and {M. Krass} and {Ranjay Krishna} and {Tom Brown} and {Benjamin Mann} and {Nick Ryder} and {Melanie Subbiah} and {Jared Kaplan} and {Prafulla Dhariwal} and {Arvind Neelakantan} and {Pranav Shyam} and {Girish Sastry} and {Amanda Askell} and {Sandhini Agarwal} and {Ariel Herbert-Voss} and {Gretchen Krueger} and {T. Henighan} and {R. Child} and {Aditya Ramesh} and {Daniel M. Ziegler} and {Jeffrey Wu} and {Clemens Winter} and {Chris Hesse} and {Mark Chen} and {Eric Sigler} and {Ma-teusz Litwin} and {Scott Gray} and {B. Chess} and {J. Clark} and {Christopher Berner} and {Sam McCandlish} and {Wei-Lin Chiang} and {Zhuohan Li} and {Zi Lin} and {Ying Sheng} and {Zhanghao Wu} and {Hao Zhang} and {Lianmin Zheng} and {Siyuan Zhuang} and {Yonghao Zhuang} and {Joseph E. Gonzalez} and {Aakanksha Chowdhery} and {Sharan Narang} and {Jacob Devlin} and {Maarten Bosma} and {Gaurav Mishra} and {Adam Roberts} and {Hyung Paul Barham} and {Won Chung} and {Charles Sutton} and {Sebastian Gehrmann} and {Parker Schuh} and {Kensen Shi} and {Sasha Tsvyashchenko} and {Joshua Maynez} and {Abhishek Rao} and {Parker Barnes} and {Yi Tay} and {Noam M. Shazeer} and {Vinodkumar Prabhakaran} and {Emily Reif} and {Nan Du} and {Ben Hutchinson} and {Reiner Pope} and {James Bradbury} and {Jacob Austin} and {M. Isard} and {Guy Gur-Ari} and {Pengcheng Yin} and {Toju Duke} and {Anselm Levskaya} and {Sanjay Ghe-mawat} and {Sunipa Dev} and {H. Michalewski} and {Xavier Garcia} and {Vedant Misra} and {Kevin Robinson} and {Liam Fe-dus} and {Denny Zhou} and {Daphne Ippolito} and {D. Luan} and {Hyeontaek Lim} and {Barret Zoph} and {A. Spiridonov} and {Ryan Sepassi} and {David Dohan} and {Shivani Agrawal} and {Mark Omernick} and {Andrew M. Dai} and {Thanumalayan Sankaranarayana Pillai} and {Marie Pellat} and {Aitor Lewkowycz} and {Erica Moreira} and {Oleksandr Polozov} and {Katherine Lee} and {Zongwei Zhou} and {Xuezhi Wang} and {Brennan Saeta} and {Mark Díaz} and {Orhan Firat} and {M. Catasta} and {Jason Wei} and {K. Meier-Hellstern} and {K. Cobbe} and {Vineet Kosaraju} and {Mo Bavarian} and {Heewoo Jun} and {Lukasz Kaiser} and {Matthias Plappert} and {Jerry Tworek} and {Jacob Hilton} and {Reiichiro Nakano} and {L. D. Angelis} and {F. Baglivo} and {G. Arzilli} and {Gaetano Pierpaolo} and {P. Privitera} and {Alberto Eugenio Ferrag-ina} and {Tozzi Caterina} and {Rizzo} and {ChatGPT} and {Deep Ganguli} and {Liane Lovitt} and {John Kernion} and {Yuntao Bai} and {Saurav Kadavath} and {Ethan Perez} and {Nicholas Schiefer} and {Kamal Ndousse} and {Andy Jones} and {Sam Bowman} and {Anna Chen} and {Tom Con-erly} and {Nova Dassarma} and {Dawn Drain} and {Sheer Nelson El-hage} and {El Showk} and {Stanislav Fort} and {Zac Hatfield-Dodds} and {Danny Hernandez} and {Tristan Hume} and {J. Jacobson} and {Scott Johnston} and {Shauna Kravec} and {Catherine Olsson} and {Sam Ringer} and {Eli Tran-Johnson} and {Dario Amodei} and {Nicholas Joseph} and {C. Olah} and {Mor Geva} and {Daniel Khashabi} and {Elad Segal} and {Tushar Khot} and {Dan Roth} and {Jonathan Berant. 2021} and {Did Aristo-tle} and {Kai Greshake} and {Sahar Abdelnabi} and {Shailesh Mishra} and {Christoph Endres} and {Thorsten Holz} and {Dan Hendrycks} and {Collin Burns} and {Steven Basart} and {Andy Zou} and {Mantas Mazeika} and {Mohammad Hosseini} and {Catherine A Gao} and {David M. Liebovitz} and {Faraz Alexandre M Carvalho} and {S. Ahmad} and {Yuan Luo} and {N. MacDonald} and {Kristi L. Holmes} and {Abel Kho. 2023} and {An} and {Edward J. Hu} and {Yelong Shen} and {Zeyuan Phillip Wallis} and {Kevin B. Johnson} and {Wei-Qi Wei} and {D. Weeraratne} and {M. Frisse} and {K. Misulis} and {Kyu Rhee} and {Juan Zhao} and {Tom Conerly} and {Nelson Elhage} and {Tristan Hume} and {Kamal Ndousse} and {Stephanie Lin} and {Owain Evans. 2022} and {Yao Lu} and {Max Bartolo} and {Alastair Moore} and {Sewon Min} and {Xinxi Lyu} and {Ari Holtzman} and {Mikel Artetxe} and {Ouyang Long} and {Xu Jiang} and {Diogo Almeida} and {Carroll L. Wainwright} and {Pamela Mishkin} and {Chong Zhang} and {Katarina Slama} and {Alex Ray} and {John Schulman} and {Fraser Kelton} and {Luke Miller} and {Maddie Simens} and {P. Welinder} and {Paul F. Christiano} and {Jan Leike} and {Ryan Lowe. 2022} and {Kamilė Lukošiūtė} and {Karina Nguyen} and {Edwin Chen} and {Scott Heiner} and {Craig Pettit} and {Sandipan Kundu} and {Saurav Kada-vath} and {Brian Israel} and {Bryan Seethor} and {C. McKinnon} and {Da Yan} and {D. Amodei} and {Dustin Li} and {Guro Khundadze} and {James Landis} and {Jamie Kerr} and {J. Mueller} and {Jeeyoon Hyun} and {Joshua Landau} and {Landon Goldberg} and {Martin Lucas} and {M. Sellitto} and {Miranda Zhang} and {Neerav Kingsland} and {Noem'i Mercado} and {Oliver Rausch} and {Robin Larson} and {Tamera Lanham} and {Timothy Telleen-Lawton} and {Roger Grosse} and {Evan Hubinger} and {Ansh Radhakrishnan} and {Carol Chen} and {Carson E. Denison} and {Esin Durmus} and {Newton Cheng} and {Sheer Sam McCan-dlish} and {Tamera Lanham} and {Tim Maxwell} and {Venkatesa Chandrasekaran}},
year = 2024,
booktitle = {Volume 1},
url = {https://www.semanticscholar.org/paper/7925f16e76cf274c257570ed3aa0ab97638be7d1},
}
@inproceedings{269459473,
title = {Odyssey 2024 - Speech Emotion Recognition Challenge: Dataset, Baseline Framework, and Results},
author = {{Lucas Goncalves} and {Ali N. Salman} and {Abinay Reddy Naini} and {Laureano Moro Velázquez} and {Thomas Thebaud} and {Leibny Paola} and {Najim Garcia} and {Berrak Dehak} and {Carlos Sisman} and {Busso}},
year = 2024,
month = {6},
booktitle = {The Speaker and Language Recognition Workshop},
url = {https://www.semanticscholar.org/paper/44a30157f437065fd0672b1327edaa32a9239ce5},
}
@inproceedings{266873790,
title = {Sustained EEG responses to rapidly unfolding stochastic sounds reflect precision tracking},
author = {{Sijia Zhao} and {Benjamin Skirritt-Davis} and {Mounya Elhilali} and {Fred Dick} and {M. Chait}},
year = 2024,
month = {1},
booktitle = {bioRxiv},
url = {https://www.semanticscholar.org/paper/e69427d53f37698a57706e91a275d57e582baba4},
}
@inproceedings{270521572,
title = {Multi-Channel Multi-Speaker ASR Using Target Speaker’s Solo Segment},
author = {{Yiwen Shao} and {Shizhong Zhang} and {Yong Xu} and {Meng Yu} and {Dong Yu} and {Dan Povey} and {S. Khudanpur}},
year = 2024,
month = {6},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/18eadf3b7cf2ceb7b3c4e034b948af90ceec7219},
}
@inproceedings{272653828,
title = {SoloAudio: Target Sound Extraction with Language-oriented Audio Diffusion Transformer},
author = {{Helin Wang} and {Jiarui Hai} and {Yen-Ju Lu} and {Karan Thakkar} and {Mounya Elhilali} and {N. Dehak}},
year = 2024,
month = {9},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/7f38e38bcdf7312cad3534211d40f4a86431ff7d},
}
@inproceedings{271776874,
title = {End-to-End Neural Speaker Diarization With Non-Autoregressive Attractors},
author = {{Magdalena Rybicka} and {J. Villalba} and {Thomas Thebaud} and {N. Dehak} and {Konrad Kowalczyk}},
year = 2024,
booktitle = {IEEE/ACM Transactions on Audio Speech and Language Processing},
url = {https://www.semanticscholar.org/paper/3eb78f245370801e1ed5a80972c8d88d275b0852},
}
@inproceedings{272653901,
title = {HLTCOE JHU Submission to the Voice Privacy Challenge 2024},
author = {{Henry Li Xinyuan} and {Zexin Cai} and {Ashi Garg} and {Kevin Duh} and {Leibny Paola Garc'ia-Perera} and {S. Khudanpur} and {Nicholas Andrews} and {Matthew Wiesner}},
year = 2024,
month = {9},
booktitle = {4th Symposium on Security and Privacy in Speech Communication},
url = {https://www.semanticscholar.org/paper/d20a9b6e43042214017716d06e7cd7f21da9371c},
}
@inproceedings{269408252,
title = {Online speech synthesis using a chronically implanted brain–computer interface in an individual with ALS},
author = {{Miguel Angrick} and {Shiyu Luo} and {Qinwan Rabbani} and {Daniel N Candrea} and {Samyak Shah} and {Griffin W. Milsap} and {William S Anderson} and {Chad R Gordon} and {Kathryn R Rosenblatt} and {Lora Clawson} and {Donna C. Tippett} and {Nicholas J Maragakis} and {F. Tenore} and {M. Fifer} and {H. Hermansky} and {Nick F Ramsey} and {N. Crone}},
year = 2024,
month = {4},
booktitle = {Scientific Reports},
url = {https://www.semanticscholar.org/paper/fa58f21ecda2053d2c1c9360e682b1140b6ff4c1},
}
@inproceedings{269987122,
title = {Temporal-Coherence Induces Binding of Responses to Sound Sequences in Ferret Auditory Cortex},
author = {{Kai Lu} and {Kelsey Dutta} and {Mounya Elhilali} and {S. Shamma}},
year = 2024,
month = {5},
booktitle = {bioRxiv},
url = {https://www.semanticscholar.org/paper/ad2b79189ddfee6af017d1569bfebde37e587aea},
}
@inproceedings{271967099,
title = {Iterative alignment discovery of speech-associated neural activity},
author = {{Qinwan Rabbani} and {Samyak Shah} and {Griffin W. Milsap} and {M. Fifer} and {H. Hermansky} and {N. Crone}},
year = 2024,
month = {8},
booktitle = {Journal of Neural Engineering},
url = {https://www.semanticscholar.org/paper/d182dc65e550bb6cf2eb956e5c2278a45c983572},
}
@inproceedings{271088562,
title = {WorldAPIs: The World Is Worth How Many APIs? A Thought Experiment},
author = {{Jiefu Ou} and {Arda Uzunouglu} and {Benjamin Van Durme} and {Daniel Khashabi}},
year = 2024,
month = {7},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/143ff789f500307bab6725c466da97492cb5c771},
}
@inproceedings{268531391,
title = {Tur[k]ingBench: A Challenge Benchmark for Web Agents},
author = {{Kevin Xu} and {Yeganeh Kordi} and {Kate Sanders} and {Yizhong Wang} and {Adam Byerly} and {Jingyu (Jack) Zhang} and {Benjamin Van Durme} and {Daniel Khashabi}},
year = 2024,
month = {3},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/341da3f8af6edd31edd8f5a3d9452957aeaaa744},
}
@inproceedings{272689050,
title = {Target Speaker ASR with Whisper},
author = {{Alexander Polok} and {Dominik Klement} and {Matthew Wiesner} and {S. Khudanpur} and {J. Černocký} and {L. Burget}},
year = 2024,
month = {9},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/9ff8924b37f827d695db1354ab15374e2076abc3},
}
@inproceedings{270380183,
title = {Noise-robust Speech Separation with Fast Generative Correction},
author = {{Helin Wang} and {J. Villalba} and {L. Moro-Velázquez} and {Jiarui Hai} and {Thomas Thebaud} and {N. Dehak}},
year = 2024,
month = {6},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/6983f5ef3a136df52cbaf0b623c16a7983e99d59},
}
@inproceedings{270746357,
title = {Assessing racial bias in healthcare predictive models: Practical lessons from an empirical evaluation of 30-day hospital readmission models},
author = {{H. E. Wang} and {Jonathan P. Weiner} and {S. Saria} and {Harold P. Lehmann} and {Hadi Kharrazi}},
year = 2024,
month = {6},
booktitle = {Journal of Biomedical Informatics},
url = {https://www.semanticscholar.org/paper/205acb6a954600dacbcb877a625605a16ca261f2},
}
Knowing the particular context associated with a conversation can help improving the performance of an automatic speech recognition (ASR) system. For example, if we are provided with a list of in-context words or phrases {–-} such as the speaker{‘}s contacts or recent song playlists {–-} during inference, we can bias the recognition process towards this list. There are many works addressing contextual ASR; however, there is few publicly available real benchmark for evaluation, making it difficult to compare different solutions. To this end, we provide a corpus ({“}ConEC{”}) and baselines to evaluate contextual ASR approaches, grounded on real-world applications. The ConEC corpus is based on public-domain earnings calls (ECs) and associated supplementary materials, such as presentation slides, earnings news release as well as a list of meeting participants{‘} names and affiliations. We demonstrate that such real contexts are noisier than artificially synthesized contexts that contain the ground truth, yet they still make great room for future improvement of contextual ASR technology
@inproceedings{huang-etal-2024-conec,
title = "{C}on{EC}: Earnings Call Dataset with Real-world Contexts for Benchmarking Contextual Speech Recognition",
author = "Huang, Ruizhe and
Yarmohammadi, Mahsa and
Trmal, Jan and
Liu, Jing and
Raj, Desh and
Garcia, Leibny Paola and
Ivanov, Alexei V. and
Ehlen, Patrick and
Yu, Mingzhi and
Povey, Dan and
Khudanpur, Sanjeev",
editor = "Calzolari, Nicoletta and
Kan, Min-Yen and
Hoste, Veronique and
Lenci, Alessandro and
Sakti, Sakriani and
Xue, Nianwen",
booktitle = "Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)",
month = may,
year = "2024",
address = "Torino, Italia",
publisher = "ELRA and ICCL",
url = "https://aclanthology.org/2024.lrec-main.328",
pages = "3700--3706",
abstract = "Knowing the particular context associated with a conversation can help improving the performance of an automatic speech recognition (ASR) system. For example, if we are provided with a list of in-context words or phrases {---} such as the speaker{'}s contacts or recent song playlists {---} during inference, we can bias the recognition process towards this list. There are many works addressing contextual ASR; however, there is few publicly available real benchmark for evaluation, making it difficult to compare different solutions. To this end, we provide a corpus ({``}ConEC{''}) and baselines to evaluate contextual ASR approaches, grounded on real-world applications. The ConEC corpus is based on public-domain earnings calls (ECs) and associated supplementary materials, such as presentation slides, earnings news release as well as a list of meeting participants{'} names and affiliations. We demonstrate that such real contexts are noisier than artificially synthesized contexts that contain the ground truth, yet they still make great room for future improvement of contextual ASR technology",
}
@inproceedings{266977175,
title = {Reframing Tax Law Entailment as Analogical Reasoning},
author = {{Xinrui Zou} and {Ming Zhang} and {Nathaniel Weir} and {Benjamin Van Durme} and {Nils Holzenberger}},
year = 2024,
month = {1},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/e993e7971fa8b96514fd63699c12bec68e83b6d1},
}
@inproceedings{271207138,
title = {Discovering Invariant Patterns of Cognitive Decline Via an Automated Analysis of the Cookie Thief Picture Description Task},
author = {{A. Favaro} and {N. Dehak} and {Thomas Thebaud} and {J. Villalba} and {Esther S Oh} and {L. Moro-Velázquez}},
year = 2024,
month = {6},
booktitle = {The Speaker and Language Recognition Workshop},
url = {https://www.semanticscholar.org/paper/99dec8ab1d7aa47117062e1daf36dcbcce4aece2},
}
@inproceedings{271212774,
title = {Improving Neural Biasing for Contextual Speech Recognition by Early Context Injection and Text Perturbation},
author = {{Ruizhe Huang} and {M. Yarmohammadi} and {S. Khudanpur} and {Dan Povey}},
year = 2024,
month = {7},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/6ebfef1daea743456536d620e894eee8992aa124},
}
@inproceedings{267406764,
title = {Streaming Sequence Transduction through Dynamic Compression},
author = {{Weiting Tan} and {Yunmo Chen} and {Tongfei Chen} and {Guanghui Qin} and {Haoran Xu} and {Heidi C. Zhang} and {Benjamin Van Durme} and {Philipp Koehn}},
year = 2024,
month = {2},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/50b2a8c4c8a0d4b26621e84e3e0b5b300775e030},
}
@inproceedings{268091248,
title = {Unraveling Adversarial Examples against Speaker Identification - Techniques for Attack Detection and Victim Model Classification},
author = {{Sonal Joshi} and {Thomas Thebaud} and {J. Villalba} and {N. Dehak}},
year = 2024,
month = {2},
booktitle = {The Speaker and Language Recognition Workshop},
url = {https://www.semanticscholar.org/paper/af87c6786c1e7f8345f3c5768668617df6cc2771},
}
@inproceedings{272330336,
title = {Position: Do pretrained Transformers Learn In-Context by Gradient Descent?},
author = {{Lingfeng Shen} and {Aayush Mishra} and {Daniel Khashabi}},
year = 2024,
booktitle = {International Conference on Machine Learning},
url = {https://www.semanticscholar.org/paper/703ead78cdfa8e77b7800d29a9163d22891d4adc},
}
@inproceedings{267750325,
title = {k-SemStamp: A Clustering-Based Semantic Watermark for Detection of Machine-Generated Text},
author = {{A. Hou} and {Jingyu (Jack) Zhang} and {Yichen Wang} and {Daniel Khashabi} and {Tianxing He}},
year = 2024,
month = {2},
booktitle = {Annual Meeting of the Association for Computational Linguistics},
url = {https://www.semanticscholar.org/paper/94c28609614719c68469081ed99315f54cb1fb6a},
}
@inproceedings{269983348,
title = {DiffNorm: Self-Supervised Normalization for Non-autoregressive Speech-to-speech Translation},
author = {{Weiting Tan} and {Jingyu (Jack) Zhang} and {Lingfeng Shen} and {Daniel Khashabi} and {Philipp Koehn}},
year = 2024,
month = {5},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/f2b48782b86f4f8bc0b537d1d91bae6cf642c8c4},
}
@inproceedings{272340732,
title = {Leveraging Universal Speech Representations for Detecting and Assessing the Severity of Mild Cognitive Impairment Across Languages},
author = {{A. Favaro} and {Tianyu Cao} and {N. Dehak} and {L. Moro-Velázquez}},
year = 2024,
month = {9},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/a01c088d9cd7523e36c21353cc972690f0de307d},
}
@inproceedings{269987070,
title = {Temporal Coherence Shapes Cortical Responses to Speech Mixtures in a Ferret Cocktail Party},
author = {{Neha Joshi} and {Yu Ng} and {Karan Thakkkar} and {Daniel Duque} and {Pingbo Yin} and {Jonathan Fritz} and {Mounya Elhilali} and {S. Shamma}},
year = 2024,
month = {6},
booktitle = {bioRxiv},
url = {https://www.semanticscholar.org/paper/ba6ad577da0d2144dbd3313404ea580fc155ad03},
}
@inproceedings{269741223,
title = {Conformal Validity Guarantees Exist for Any Data Distribution (and How to Find Them)},
author = {{Drew Prinster} and {Samuel Stanton} and {Anqi Liu} and {S. Saria}},
year = 2024,
month = {5},
booktitle = {International Conference on Machine Learning},
url = {https://www.semanticscholar.org/paper/bb86b50363e9d100606a534c6a877dacbf8b0e25},
}
@inproceedings{272593614,
title = {WearGait-PD: An Open-Access Wearables Dataset for Gait in Parkinson's Disease and Age-Matched Controls},
author = {{Anthony J. Anderson} and {David Eguren} and {Michael A. Gonzalez} and {Naima Khan} and {Sophia Watkinson} and {Michael Caiola} and {Siegfried S Hirczy} and {Cyrus P. Zabetian} and {Kelly Mills} and {Emile Moukheiber} and {L. Moro-Velázquez} and {N. Dehak} and {Chelsie Motely} and {B. Muir} and {A. Butala} and {Kimberly Kontson}},
year = 2024,
month = {9},
booktitle = {medRxiv},
url = {https://www.semanticscholar.org/paper/74a0ee0f0a4fb6f63c903768d002413e58458269},
}
@inproceedings{267311651,
title = {On Speaker Attribution with SURT},
author = {{Desh Raj} and {Matthew Wiesner} and {Matthew Maciejewski} and {Leibny Paola García-Perera} and {Daniel Povey} and {S. Khudanpur}},
year = 2024,
month = {1},
booktitle = {The Speaker and Language Recognition Workshop},
url = {https://www.semanticscholar.org/paper/924d189fbe7aa43ab9de9989ce45d4e4936f533d},
}
@inproceedings{272423555,
title = {Privacy versus Emotion Preservation Trade-offs in Emotion-Preserving Speaker Anonymization},
author = {{Zexin Cai} and {Henry Li Xinyuan} and {Ashi Garg} and {Leibny Paola Garc'ia-Perera} and {Kevin Duh} and {S. Khudanpur} and {Nicholas Andrews} and {Matthew Wiesner}},
year = 2024,
month = {9},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/3c2d94cfa24b979eb13ca06d8a2bce79b5ab2321},
}
@inproceedings{269006160,
title = {Use of artificial intelligence in critical care: opportunities and obstacles},
author = {{Michael R. Pinsky} and {Armando Bedoya} and {A. Bihorac} and {L. Celi} and {Matthew Churpek} and {Nicoleta J. Economou-Zavlanos} and {Paul Elbers} and {S. Saria} and {Vincent Liu} and {Patrick G. Lyons} and {B. Shickel} and {Patrick Toral} and {D. Tscholl} and {Gilles Clermont}},
year = 2024,
month = {4},
booktitle = {Critical Care},
url = {https://www.semanticscholar.org/paper/a386424f2f61647ebec3dd27e33c6db92c1c07ac},
}
@inproceedings{268877286,
title = {Preliminary Evidence for Global Properties in Human Listeners During Natural Auditory Scene Perception},
author = {{Margaret A. McMullin} and {Rohit Kumar} and {Nathan C. Higgins} and {Brian Gygi} and {Mounya Elhilali} and {J. Snyder}},
year = 2024,
month = {3},
booktitle = {Open Mind},
url = {https://www.semanticscholar.org/paper/e46542680689e1358d6ed072560f1ec7eefce069},
}
@inproceedings{268863052,
title = {Multi-rate modulation encoding via unsupervised learning for audio event detection},
author = {{Sandeep Reddy Kothinti} and {Mounya Elhilali}},
year = 2024,
month = {4},
booktitle = {EURASIP Journal on Audio, Speech, and Music Processing},
url = {https://www.semanticscholar.org/paper/3cc427a861147fc147b316bfd73da03761e41a4d},
}
@inproceedings{266798865,
title = {Automating the analysis of eye movement for different neurodegenerative disorders},
author = {{Deming Li} and {A. Butala} and {L. Moro-Velázquez} and {Trevor Meyer} and {Esther S. Oh} and {Chelsey Motley} and {J. Villalba} and {N. Dehak}},
year = 2024,
month = {1},
booktitle = {Comput. Biol. Medicine},
url = {https://www.semanticscholar.org/paper/f375c9d0a595152ff21f96a0a5606c7d033548f3},
}
@inproceedings{268577202,
title = {Less Peaky and More Accurate CTC Forced Alignment by Label Priors},
author = {{Ruizhe Huang} and {Xiaohui Zhang} and {Zhaoheng Ni} and {Li Sun} and {Moto Hira} and {Jeff Hwang} and {Vimal Manohar} and {Vineel Pratap} and {Matthew Wiesner} and {Shinji Watanabe} and {Daniel Povey} and {S. Khudanpur}},
year = 2024,
month = {4},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/ca6c9789f4dd10e1908aaeaa6a37bd682af4f86a},
}
@inproceedings{271039322,
title = {Core: Robust Factual Precision with Informative Sub-Claim Identification},
author = {{Zhengping Jiang} and {Jingyu (Jack) Zhang} and {Nathaniel Weir} and {Seth Ebner} and {Miriam Wanner} and {Kate Sanders} and {Daniel Khashabi} and {Anqi Liu} and {Benjamin Van Durme}},
year = 2024,
month = {7},
booktitle = {},
url = {https://www.semanticscholar.org/paper/1a37246f60f0c47cd7d3f9d91b09d7be970850a6},
}
@inproceedings{267043424,
title = {Model-Based Fairness Metric for Speaker Verification},
author = {{Maliha Jahan} and {L. Moro-Velázquez} and {Thomas Thebaud} and {N. Dehak} and {J. Villalba}},
year = 2023,
month = {12},
booktitle = {Automatic Speech Recognition & Understanding},
url = {https://www.semanticscholar.org/paper/f308fc3883c5a18c050b44ec932b59067dfd83f3},
}
@inproceedings{266574417,
title = {Decoding contextual influences on auditory perception from primary auditory cortex},
author = {{B. Englitz} and {S. Akram} and {Mounya Elhilali} and {S. Shamma}},
year = 2023,
month = {12},
booktitle = {bioRxiv},
url = {https://www.semanticscholar.org/paper/2e536d19f547f000d99351659622ae8204f3467a},
}
@inproceedings{267044002,
title = {Boosting Modality Representation With Pre-Trained Models and Multi-Task Training for Multimodal Sentiment Analysis},
author = {{Jiarui Hai} and {Yu-Jeh Liu} and {Mounya Elhilali}},
year = 2023,
month = {12},
booktitle = {Automatic Speech Recognition & Understanding},
url = {https://www.semanticscholar.org/paper/053dc825f19474a6b8b49239a7c0290aecb57771},
}
@inproceedings{266373629,
title = {A Nationwide Network of Health AI Assurance Laboratories.},
author = {{Nigam H. Shah} and {John D Halamka} and {S. Saria} and {Michael J. Pencina} and {Troy Tazbaz} and {Micky Tripathi} and {Alison Callahan} and {Hailey Hildahl} and {Brian Anderson}},
year = 2023,
month = {12},
booktitle = {Journal of the American Medical Association (JAMA)},
url = {https://www.semanticscholar.org/paper/194398467b7ae5074cbc626a859935ff2a790962},
}
@inproceedings{266523855,
title = {Multi‐task analysis of oculographic biomarkers to evaluate motoric and cognitive patterns in Alzheimer’s Disease},
author = {{Deming Li} and {Trevor Meyer} and {Esther S Oh} and {A. Butala} and {N. Dehak} and {L. Moro-Velázquez}},
year = 2023,
month = {12},
booktitle = {Alzheimer's & Dementia},
url = {https://www.semanticscholar.org/paper/c2f99d03369b3583618c774b58c871c9707724bb},
}
@inproceedings{266602177,
title = {Binocular Discoordination Kinetic Features: A Novel Approach to Evaluate Neurodegenerative Diseases},
author = {{Y. Wang} and {L. Moro-Velázquez} and {A. Favaro} and {D. Li} and {E. Oh} and {A. Butala} and {J. Villalba} and {N. Dehak}},
year = 2023,
month = {12},
booktitle = {IEEE Signal Processing in Medicine and Biology Symposium},
url = {https://www.semanticscholar.org/paper/306f3684946774ed21ddba490c0f120f02a5421a},
}
@inproceedings{266523081,
title = {Evaluation of Interpretable Speech Biomarkers for Monitoring Alzheimer’s Disease and Mild Cognitive Impairment Progression},
author = {{A. Favaro} and {N. Dehak} and {Thomas Thebaud} and {Esther S Oh} and {L. Moro-Velázquez}},
year = 2023,
month = {12},
booktitle = {Alzheimer's & Dementia},
url = {https://www.semanticscholar.org/paper/2f88f04aeb6eb8cac8c5706c294bcd3045faa966},
}
@inproceedings{266523924,
title = {Handwriting characteristics analysis for Alzheimer’s Disease and Mild Cognitive Impairments Assessment},
author = {{Thomas Thebaud} and {Casey Chen} and {L. Moro-Velázquez} and {N. Dehak} and {Esther S Oh}},
year = 2023,
month = {12},
booktitle = {Alzheimer's & Dementia},
url = {https://www.semanticscholar.org/paper/b6ffb09dbe20a54ddb5f3e6f3a319f482bb3c0aa},
}
@inproceedings{266573169,
title = {Do Androids Know They're Only Dreaming of Electric Sheep?},
author = {{Sky CH-Wang} and {Benjamin Van Durme} and {Jason Eisner} and {Chris Kedzie}},
year = 2023,
month = {12},
booktitle = {Annual Meeting of the Association for Computational Linguistics},
url = {https://www.semanticscholar.org/paper/6789e0a19f70e283b120fd6a3792162d01a021d5},
}
@inproceedings{266522435,
title = {Handwriting characteristics analysis for Alzheimer’s Disease and Mild Cognitive Impairments Assessment},
author = {{Thomas Thebaud} and {Casey Chen} and {L. Moro-Velázquez} and {N. Dehak} and {Esther S Oh}},
year = 2023,
month = {12},
booktitle = {Alzheimer's & Dementia},
url = {https://www.semanticscholar.org/paper/65b786c68cef24ed41374bd9f279617d694e2dd4},
}
@inproceedings{267044159,
title = {Joint Energy-Based Model for Robust Speech Classification System Against Dirty-Label Backdoor Poisoning Attacks},
author = {{Martin Sustek} and {Sonal Joshi} and {Henry Li} and {Thomas Thebaud} and {J. Villalba} and {S. Khudanpur} and {N. Dehak}},
year = 2023,
month = {12},
booktitle = {Automatic Speech Recognition & Understanding},
url = {https://www.semanticscholar.org/paper/1fd003bf9de393bcddbda63b738b71ced6203802},
}
@inproceedings{266523165,
title = {Evaluation of Interpretable Speech Biomarkers for Monitoring Alzheimer’s Disease and Mild Cognitive Impairment Progression},
author = {{A. Favaro} and {N. Dehak} and {Thomas Thebaud} and {Esther S Oh} and {L. Moro-Velázquez}},
year = 2023,
month = {12},
booktitle = {Alzheimer's & Dementia},
url = {https://www.semanticscholar.org/paper/3434b5755b9c8bdb4250cabaabad655aee402440},
}
@inproceedings{267043595,
title = {Clustering Unsupervised Representations as Defense Against Poisoning Attacks on Speech Commands Classification System},
author = {{Thomas Thebaud} and {Sonal Joshi} and {Henry Li} and {Martin Sustek} and {J. Villalba} and {S. Khudanpur} and {N. Dehak}},
year = 2023,
month = {12},
booktitle = {Automatic Speech Recognition & Understanding},
url = {https://www.semanticscholar.org/paper/d59282b7adbdd1aef7754309aa72e98598059c1a},
}
@inproceedings{266522904,
title = {Multi‐task analysis of oculographic biomarkers to evaluate motoric and cognitive patterns in Alzheimer’s Disease},
author = {{Deming Li} and {Trevor Meyer} and {Esther S Oh} and {A. Butala} and {N. Dehak} and {L. Moro-Velázquez}},
year = 2023,
month = {12},
booktitle = {Alzheimer's & Dementia},
url = {https://www.semanticscholar.org/paper/d958ba9662d442878a1d1d11d4e0968e6df42e4d},
}
@InProceedings{tan-et-al-2023,
author = "Weiting Tan and Chu-Cheng Lin and Jason Eisner",
title = "Structure-Aware Path Inference for Neural Finite State
Transducers",
booktitle = "Proceedings of the {NeurIPS} 2023 Workshop ``{I}
Can’t Believe It’s Not Better: Failure Modes in the
Age of Foundation Models''",
year = "2023",
month = dec,
URL = "http://cs.jhu.edu/~jason/papers/#tan-et-al-2023",
}
@InProceedings{roy-et-al-2023,
author = "Subhro Roy and Sam Thomson and Tongfei Chen and
Richard Shin and Adam Pauls and Jason Eisner and
Benjamin Van Durme",
title = "{BenchCLAMP}: {A} Benchmark for Evaluating Language
Models on Syntactic and Semantic Parsing",
booktitle = "Proceedings of the Thirty-Seventh Conference on Neural
Information Processing Systems",
note = "Datasets and Benchmarks Track",
year = "2023",
month = dec,
URL = "http://cs.jhu.edu/~jason/papers/#roy-et-al-2023",
}
@InProceedings{zhong-et-al-2023,
aclid = "2023.emnlp-main.312",
author = "Ruiqi Zhong and Charlie Snell and Dan Klein and Jason
Eisner",
title = "Non-Programmers Can Label Programs Indirectly via
Active Examples: {A} Case Study with Text-to-{SQL}",
booktitle = "Proceedings of the 2023 Conference on Empirical
Methods in Natural Language Processing",
pages = "5126--5152",
year = "2023",
month = dec,
URL = "http://cs.jhu.edu/~jason/papers/#zhong-et-al-2023",
}
@inproceedings{265281100,
title = {Improving fairness for spoken language understanding in atypical speech with Text-to-Speech},
author = {{Helin Wang} and {Venkatesh Ravichandran} and {Milind Rao} and {Becky Lammers} and {Myra Sydnor} and {Nicholas J Maragakis} and {A. Butala} and {Jayne Zhang} and {Lora Clawson} and {Victoria Chovaz} and {L. Moro-Velázquez}},
year = 2023,
month = {11},
booktitle = {},
url = {https://www.semanticscholar.org/paper/45e3115df40de802f9c4095f329ea374aac56825},
}
@inproceedings{265128667,
title = {Time Scale Network: A Shallow Neural Network For Time Series Data},
author = {{Trevor Meyer} and {Camden Shultz} and {N. Dehak} and {L. Moro-Velázquez} and {Pedro P. Irazoqui}},
year = 2023,
month = {11},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/deacbb4906e1d2e597602a65b434a8132953ad8d},
}
@inproceedings{265033117,
title = {Narrowing the Gap between Zero- and Few-shot Machine Translation by Matching Styles},
author = {{Weiting Tan} and {Haoran Xu} and {Lingfeng Shen} and {Shuyue Stella Li} and {Kenton Murray} and {Philipp Koehn} and {Benjamin Van Durme} and {Yunmo Chen}},
year = 2023,
month = {11},
booktitle = {NAACL-HLT},
url = {https://www.semanticscholar.org/paper/bac133a9cb14eadea94c55ec15ea3bb866bf6c03},
}
@inproceedings{265539658,
title = {Are acoustics enough? Semantic effects on auditory salience in natural scenes},
author = {{Sandeep Reddy Kothinti} and {Mounya Elhilali}},
year = 2023,
month = {11},
booktitle = {Frontiers in Psychology},
url = {https://www.semanticscholar.org/paper/cdb491d1d121a7461fac00c4c71dfc45b9c8ae7a},
}
@inproceedings{264935647,
title = {Investigating Self-Supervised Deep Representations for EEG-Based Auditory Attention Decoding},
author = {{Karan Thakkar} and {Jiarui Hai} and {Mounya Elhilali}},
year = 2023,
month = {11},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/57b903a709dc9ab64b3bd81378f33547eabb01bd},
}
@inproceedings{265213263,
title = {Toucan: Token-Aware Character Level Language Modeling},
author = {{William Fleshman} and {Benjamin Van Durme}},
year = 2023,
month = {11},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/28c75ab7f6951f1c2bb349b34abc3204ba8b9498},
}
@inproceedings{265220995,
title = {Interpreting User Requests in the Context of Natural Language Standing Instructions},
author = {{Nikita Moghe} and {Patrick Xia} and {Jacob Andreas} and {J. Eisner} and {Benjamin Van Durme} and {Harsh Jhamtani}},
year = 2023,
month = {11},
booktitle = {NAACL-HLT},
url = {https://www.semanticscholar.org/paper/f2abeec1256f80970827d60f0151c7a19f2dbe7a},
}
@inproceedings{264426857,
title = {InstructExcel: A Benchmark for Natural Language Instruction in Excel},
author = {{Justin Payan} and {Swaroop Mishra} and {Mukul Singh} and {Carina Negreanu} and {Christian Poelitz} and {Chitta Baral} and {Subhro Roy} and {Rasika Chakravarthy} and {Benjamin Van Durme} and {E. Nouri}},
year = 2023,
month = {10},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/706fc333fc951f48ea26169d88478b5e4c36e82c},
}
@inproceedings{263605981,
title = {Error Norm Truncation: Robust Training in the Presence of Data Noise for Text Generation Models},
author = {{Tianjian Li} and {Haoran Xu} and {Philipp Koehn} and {Daniel Khashabi} and {Kenton Murray}},
year = 2023,
month = {10},
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/d15021d750dbe9cee120b562acea857ca02d9104},
}
@inproceedings{263620438,
title = {Dodo: Dynamic Contextual Compression for Decoder-only LMs},
author = {{Guanghui Qin} and {Corby Rosset} and {Ethan C. Chau} and {Nikhil Rao} and {Benjamin Van Durme}},
year = 2023,
month = {10},
booktitle = {Annual Meeting of the Association for Computational Linguistics},
url = {https://www.semanticscholar.org/paper/883187d0bacf57238ac95e2749bcc601baf2c212},
}
@inproceedings{263669151,
title = {Application of natural language processing to identify social needs from patient medical notes: development and assessment of a scalable, performant, and rule-based model in an integrated healthcare delivery system},
author = {{Geoffrey M Gray} and {Ayah Zirikly} and {Luis M Ahumada} and {Masoud Rouhizadeh} and {Thomas M Richards} and {C. Kitchen} and {Iman Foroughmand} and {E. Hatef}},
year = 2023,
month = {10},
booktitle = {JAMIA Open},
url = {https://www.semanticscholar.org/paper/1be931a9ebfeaa018e47abc582b1a9760ced4710},
}
@inproceedings{272144679,
title = {SemStamp: A Semantic Watermark with Paraphrastic Robustness for Text Generation},
author = {{A. Hou} and {Jingyu (Jack) Zhang} and {Tianxing He} and {Yichen Wang} and {Yung-Sung Chuang} and {Hongwei Wang} and {Lingfeng Shen} and {Benjamin Van Durme} and {Daniel Khashabi} and {Yulia Tsvetkov}},
year = 2023,
month = {10},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/f81faa4f130c287a293c9d21eb27b325be9b5ee9},
}
@inproceedings{263909464,
title = {Do pretrained Transformers Learn In-Context by Gradient Descent?},
author = {{Lingfeng Shen} and {Aayush Mishra} and {Daniel Khashabi}},
year = 2023,
month = {10},
booktitle = {},
url = {https://www.semanticscholar.org/paper/f30ddf0c7455f89f016c540564e235b191c503db},
}
@inproceedings{261899586,
title = {Diff-Pitcher: Diffusion-Based Singing Voice Pitch Correction},
author = {{Jiarui Hai} and {Mounya Elhilali}},
year = 2023,
month = {10},
booktitle = {IEEE Workshop on Applications of Signal Processing to Audio and Acoustics},
url = {https://www.semanticscholar.org/paper/377ffdc7cf16822e8aa12ea28ab16d0f5bc8f0c2},
}
@inproceedings{264305897,
title = {Data Augmentations for Improved (Large) Language Model Generalization},
author = {{Amir Feder} and {Yoav Wald} and {Claudia Shi} and {S. Saria} and {David M. Blei}},
year = 2023,
month = {10},
booktitle = {},
url = {https://www.semanticscholar.org/paper/23f96db82ae02c5c3c0a861571e7aa8d27c91bc9},
}
@inproceedings{264448311,
title = {Stable Decoding from a Speech BCI Enables Control for an Individual with ALS without Recalibration for 3 Months},
author = {{Shiyu Luo} and {Miguel Angrick} and {Christopher Coogan} and {Daniel N Candrea} and {Kimberley Wyse-Sookoo} and {Samyak Shah} and {Qinwan Rabbani} and {Griffin W. Milsap} and {Alexander R Weiss} and {William S Anderson} and {Donna C. Tippett} and {Nicholas J Maragakis} and {Lora Clawson} and {M. Vansteensel} and {Brock Andrew Wester} and {F. Tenore} and {H. Hermansky} and {M. Fifer} and {Nick F Ramsey} and {N. Crone}},
year = 2023,
month = {10},
booktitle = {Advancement of science},
url = {https://www.semanticscholar.org/paper/dee851d6c5652ee423118132e1483bc0af9f30fc},
}
@inproceedings{260957214,
title = {Nugget: Neural Agglomerative Embeddings of Text},
author = {{Guanghui Qin} and {Benjamin Van Durme}},
year = 2023,
month = {10},
booktitle = {International Conference on Machine Learning},
url = {https://www.semanticscholar.org/paper/531b37c44c7e39539f617fb1a4149ef8cce8f4ec},
}
@inproceedings{263827534,
title = {A Linguistic Analysis of Instagram Captions Between Adolescent Suicide Decedents and Living Controls.},
author = {{Alex Walker} and {Ayah Zirikly} and {Melissa D. Stockbridge} and {H. C. Wilcox}},
year = 2023,
month = {10},
booktitle = {Crisis},
url = {https://www.semanticscholar.org/paper/a0ee01acead1ccb6064f603f75186f8aa25d2562},
}
@inproceedings{264426523,
title = {A Unified View of Evaluation Metrics for Structured Prediction},
author = {{Yunmo Chen} and {William Gantt Walden} and {Tongfei Chen} and {Aaron Steven White} and {Benjamin Van Durme}},
year = 2023,
month = {10},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/a0df8169889043dae6ac111136a61162a5185a77},
}
@inproceedings{263830793,
title = {DPM-TSE: A Diffusion Probabilistic Model for Target Sound Extraction},
author = {{Jiarui Hai} and {Helin Wang} and {Dongchao Yang} and {Karan Thakkar} and {N. Dehak} and {Mounya Elhilali}},
year = 2023,
month = {10},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/70aec6486668cc5ca25d45240c68de223a8deda7},
}
The phenomena of in-context learning has typically been thought of as {“}learning from examples{”}. In this work which focuses on Machine Translation, we present a perspective of in-context learning as the desired generation task maintaining coherency with its context, i.e., the prompt examples. We first investigate randomly sampled prompts across 4 domains, and find that translation performance improves when shown in-domain prompts. Next, we investigate coherency for the in-domain setting, which uses prompt examples from a moving window. We study this with respect to other factors that have previously been identified in the literature such as length, surface similarity and sentence embedding similarity. Our results across 3 models (GPTNeo2.7B, Bloom3B, XGLM2.9B), and three translation directions (en$\rightarrow${pt, de, fr}) suggest that the long-term coherency of the prompts and the test sentence is a good indicator of downstream translation performance. In doing so, we demonstrate the efficacy of in-context Machine Translation for on-the-fly adaptation.
@inproceedings{sia-duh-2023-context,
title = "In-context Learning as Maintaining Coherency: A Study of On-the-fly Machine Translation Using Large Language Models",
author = "Sia, Suzanna and
Duh, Kevin",
editor = "Utiyama, Masao and
Wang, Rui",
booktitle = "Proceedings of Machine Translation Summit XIX, Vol. 1: Research Track",
month = sep,
year = "2023",
address = "Macau SAR, China",
publisher = "Asia-Pacific Association for Machine Translation",
url = "https://aclanthology.org/2023.mtsummit-research.15",
pages = "173--185",
abstract = "The phenomena of in-context learning has typically been thought of as {``}learning from examples{''}. In this work which focuses on Machine Translation, we present a perspective of in-context learning as the desired generation task maintaining coherency with its context, i.e., the prompt examples. We first investigate randomly sampled prompts across 4 domains, and find that translation performance improves when shown in-domain prompts. Next, we investigate coherency for the in-domain setting, which uses prompt examples from a moving window. We study this with respect to other factors that have previously been identified in the literature such as length, surface similarity and sentence embedding similarity. Our results across 3 models (GPTNeo2.7B, Bloom3B, XGLM2.9B), and three translation directions (en$\rightarrow${pt, de, fr}) suggest that the long-term coherency of the prompts and the test sentence is a good indicator of downstream translation performance. In doing so, we demonstrate the efficacy of in-context Machine Translation for on-the-fly adaptation.",
}
@InProceedings{chi-et-al-2023,
author = "Jie Chi and Brian Lu and Jason Eisner and Peter Bell
and Preethi Jyothi and Ahmed M. Ali",
title = "Unsupervised Code-Switched Text Generation from
Parallel Text",
booktitle = "Proceedings of INTERSPEECH",
year = "2023",
month = aug,
address = "Dublin",
URL = "http://cs.jhu.edu/~jason/papers/#chi-et-al-2023",
}
Large Language Models (LLMs) such as GPT-3 have emerged as general-purpose language models capable of addressing many natural language generation or understanding tasks. On the task of Machine Translation (MT), multiple works have investigated few-shot prompting mechanisms to elicit better translations from LLMs. However, there has been relatively little investigation on how such translations differ qualitatively from the translations generated by standard Neural Machine Translation (NMT) models. In this work, we investigate these differences in terms of the literalness of translations produced by the two systems. Using literalness measures involving word alignment and monotonicity, we find that translations out of English (E-X) from GPTs tend to be less literal, while exhibiting similar or better scores on MT quality metrics. We demonstrate that this finding is borne out in human evaluations as well. We then show that these differences are especially pronounced when translating sentences that contain idiomatic expressions.
@inproceedings{raunak-etal-2023-gpts,
title = "Do {GPT}s Produce Less Literal Translations?",
author = "Raunak, Vikas and
Menezes, Arul and
Post, Matt and
Hassan, Hany",
editor = "Rogers, Anna and
Boyd-Graber, Jordan and
Okazaki, Naoaki",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-short.90",
doi = "10.18653/v1/2023.acl-short.90",
pages = "1041--1050",
abstract = "Large Language Models (LLMs) such as GPT-3 have emerged as general-purpose language models capable of addressing many natural language generation or understanding tasks. On the task of Machine Translation (MT), multiple works have investigated few-shot prompting mechanisms to elicit better translations from LLMs. However, there has been relatively little investigation on how such translations differ qualitatively from the translations generated by standard Neural Machine Translation (NMT) models. In this work, we investigate these differences in terms of the literalness of translations produced by the two systems. Using literalness measures involving word alignment and monotonicity, we find that translations out of English (E-X) from GPTs tend to be less literal, while exhibiting similar or better scores on MT quality metrics. We demonstrate that this finding is borne out in human evaluations as well. We then show that these differences are especially pronounced when translating sentences that contain idiomatic expressions.",
}
Hyperparameter optimization is an important but often overlooked process in the research of deep learning technologies. To obtain a good model, one must carefully tune hyperparameters that determine the architecture and training algorithm. Insufficient tuning may result in poor results, while inequitable tuning may lead to exaggerated differences between models. We present a hyperparameter optimization toolkit for neural machine translation (NMT) to help researchers focus their time on the creative rather than the mundane. The toolkit is implemented as a wrapper on top of the open-source Sockeye NMT software. Using the Asynchronous Successive Halving Algorithm (ASHA), we demonstrate that it is possible to discover near-optimal models under a computational budget with little effort. Code: \url{https://github.com/kevinduh/sockeye-recipes3Video} demo: \url{https://cs.jhu.edu/kevinduh/j/demo.mp4}
@inproceedings{zhang-etal-2023-hyperparameter,
title = "A Hyperparameter Optimization Toolkit for Neural Machine Translation Research",
author = "Zhang, Xuan and
Duh, Kevin and
McNamee, Paul",
editor = "Bollegala, Danushka and
Huang, Ruihong and
Ritter, Alan",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 3: System Demonstrations)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-demo.15",
doi = "10.18653/v1/2023.acl-demo.15",
pages = "161--168",
abstract = "Hyperparameter optimization is an important but often overlooked process in the research of deep learning technologies. To obtain a good model, one must carefully tune hyperparameters that determine the architecture and training algorithm. Insufficient tuning may result in poor results, while inequitable tuning may lead to exaggerated differences between models. We present a hyperparameter optimization toolkit for neural machine translation (NMT) to help researchers focus their time on the creative rather than the mundane. The toolkit is implemented as a wrapper on top of the open-source Sockeye NMT software. Using the Asynchronous Successive Halving Algorithm (ASHA), we demonstrate that it is possible to discover near-optimal models under a computational budget with little effort. Code: \url{https://github.com/kevinduh/sockeye-recipes3Video} demo: \url{https://cs.jhu.edu/kevinduh/j/demo.mp4}",
}
This paper presents JHU{‘}s submissions to the IWSLT 2023 dialectal and low-resource track of Tunisian Arabic to English speech translation. The Tunisian dialect lacks formal orthography and abundant training data, making it challenging to develop effective speech translation (ST) systems. To address these challenges, we explore the integration of large pre-trained machine translation (MT) models, such as mBART and NLLB-200 in both end-to-end (E2E) and cascaded speech translation (ST) systems. We also improve the performance of automatic speech recognition (ASR) through the use of pseudo-labeling data augmentation and channel matching on telephone data. Finally, we combine our E2E and cascaded ST systems with Minimum Bayes-Risk decoding. Our combined system achieves a BLEU score of 21.6 and 19.1 on test2 and test3, respectively.
@inproceedings{hussein-etal-2023-jhu,
title = "{JHU} {IWSLT} 2023 Dialect Speech Translation System Description",
author = "Hussein, Amir and
Xiao, Cihan and
Verma, Neha and
Thebaud, Thomas and
Wiesner, Matthew and
Khudanpur, Sanjeev",
editor = "Salesky, Elizabeth and
Federico, Marcello and
Carpuat, Marine",
booktitle = "Proceedings of the 20th International Conference on Spoken Language Translation (IWSLT 2023)",
month = jul,
year = "2023",
address = "Toronto, Canada (in-person and online)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.iwslt-1.26",
doi = "10.18653/v1/2023.iwslt-1.26",
pages = "283--290",
abstract = "This paper presents JHU{'}s submissions to the IWSLT 2023 dialectal and low-resource track of Tunisian Arabic to English speech translation. The Tunisian dialect lacks formal orthography and abundant training data, making it challenging to develop effective speech translation (ST) systems. To address these challenges, we explore the integration of large pre-trained machine translation (MT) models, such as mBART and NLLB-200 in both end-to-end (E2E) and cascaded speech translation (ST) systems. We also improve the performance of automatic speech recognition (ASR) through the use of pseudo-labeling data augmentation and channel matching on telephone data. Finally, we combine our E2E and cascaded ST systems with Minimum Bayes-Risk decoding. Our combined system achieves a BLEU score of 21.6 and 19.1 on test2 and test3, respectively.",
}
We present PaRTE, a collection of 1,126 pairs of Recognizing Textual Entailment (RTE) examples to evaluate whether models are robust to paraphrasing. We posit that if RTE models understand language, their predictions should be consistent across inputs that share the same meaning. We use the evaluation set to determine if RTE models{‘} predictions change when examples are paraphrased. In our experiments, contemporary models change their predictions on 8-16{\%} of paraphrased examples, indicating that there is still room for improvement.
@inproceedings{verma-etal-2023-evaluating,
title = "Evaluating Paraphrastic Robustness in Textual Entailment Models",
author = "Verma, Dhruv and
Lal, Yash Kumar and
Sinha, Shreyashee and
Van Durme, Benjamin and
Poliak, Adam",
editor = "Rogers, Anna and
Boyd-Graber, Jordan and
Okazaki, Naoaki",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-short.76",
doi = "10.18653/v1/2023.acl-short.76",
pages = "880--892",
abstract = "We present PaRTE, a collection of 1,126 pairs of Recognizing Textual Entailment (RTE) examples to evaluate whether models are robust to paraphrasing. We posit that if RTE models understand language, their predictions should be consistent across inputs that share the same meaning. We use the evaluation set to determine if RTE models{'} predictions change when examples are paraphrased. In our experiments, contemporary models change their predictions on 8-16{\%} of paraphrased examples, indicating that there is still room for improvement.",
}
Cross-lingual annotation projection is a practical method for improving performance on low resource structured prediction tasks. An important step in annotation projection is obtaining alignments between the source and target texts, which enables the mapping of annotations across the texts. By manually correcting automatically generated alignments, we examine the impact of alignment quality{–-}automatic, manual, and mixed{–-}on downstream performance for two information extraction tasks and quantify the trade-off between annotation effort and model performance.
@inproceedings{behzad-etal-2023-effect,
title = "The Effect of Alignment Correction on Cross-Lingual Annotation Projection",
author = "Behzad, Shabnam and
Ebner, Seth and
Marone, Marc and
Van Durme, Benjamin and
Yarmohammadi, Mahsa",
editor = "Prange, Jakob and
Friedrich, Annemarie",
booktitle = "Proceedings of the 17th Linguistic Annotation Workshop (LAW-XVII)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.law-1.24",
doi = "10.18653/v1/2023.law-1.24",
pages = "244--251",
abstract = "Cross-lingual annotation projection is a practical method for improving performance on low resource structured prediction tasks. An important step in annotation projection is obtaining alignments between the source and target texts, which enables the mapping of annotations across the texts. By manually correcting automatically generated alignments, we examine the impact of alignment quality{---}automatic, manual, and mixed{---}on downstream performance for two information extraction tasks and quantify the trade-off between annotation effort and model performance.",
}
We describe the Johns Hopkins ACL 60-60 Speech Translation systems submitted to the IWSLT 2023 Multilingual track, where we were tasked to translate ACL presentations from English into 10 languages. We developed cascaded speech translation systems for both the constrained and unconstrained subtracks. Our systems make use of pre-trained models as well as domain-specific corpora for this highly technical evaluation-only task. We find that the specific technical domain which ACL presentations fall into presents a unique challenge for both ASR and MT, and we present an error analysis and an ACL-specific corpus we produced to enable further work in this area.
@inproceedings{xinyuan-etal-2023-jhu,
title = "{JHU} {IWSLT} 2023 Multilingual Speech Translation System Description",
author = "Xinyuan, Henry Li and
Verma, Neha and
Bamfo Odoom, Bismarck and
Pradeep, Ujvala and
Wiesner, Matthew and
Khudanpur, Sanjeev",
editor = "Salesky, Elizabeth and
Federico, Marcello and
Carpuat, Marine",
booktitle = "Proceedings of the 20th International Conference on Spoken Language Translation (IWSLT 2023)",
month = jul,
year = "2023",
address = "Toronto, Canada (in-person and online)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.iwslt-1.28",
doi = "10.18653/v1/2023.iwslt-1.28",
pages = "302--310",
abstract = "We describe the Johns Hopkins ACL 60-60 Speech Translation systems submitted to the IWSLT 2023 Multilingual track, where we were tasked to translate ACL presentations from English into 10 languages. We developed cascaded speech translation systems for both the constrained and unconstrained subtracks. Our systems make use of pre-trained models as well as domain-specific corpora for this highly technical evaluation-only task. We find that the specific technical domain which ACL presentations fall into presents a unique challenge for both ASR and MT, and we present an error analysis and an ACL-specific corpus we produced to enable further work in this area.",
}
Riveter provides a complete easy-to-use pipeline for analyzing verb connotations associated with entities in text corpora. We prepopulate the package with connotation frames of sentiment, power, and agency, which have demonstrated usefulness for capturing social phenomena, such as gender bias, in a broad range of corpora. For decades, lexical frameworks have been foundational tools in computational social science, digital humanities, and natural language processing, facilitating multifaceted analysis of text corpora. But working with verb-centric lexica specifically requires natural language processing skills, reducing their accessibility to other researchers. By organizing the language processing pipeline, providing complete lexicon scores and visualizations for all entities in a corpus, and providing functionality for users to target specific research questions, Riveter greatly improves the accessibility of verb lexica and can facilitate a broad range of future research.
@inproceedings{antoniak-etal-2023-riveter,
title = "Riveter: Measuring Power and Social Dynamics Between Entities",
author = "Antoniak, Maria and
Field, Anjalie and
Mun, Jimin and
Walsh, Melanie and
Klein, Lauren and
Sap, Maarten",
editor = "Bollegala, Danushka and
Huang, Ruihong and
Ritter, Alan",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 3: System Demonstrations)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-demo.36",
doi = "10.18653/v1/2023.acl-demo.36",
pages = "377--388",
abstract = "Riveter provides a complete easy-to-use pipeline for analyzing verb connotations associated with entities in text corpora. We prepopulate the package with connotation frames of sentiment, power, and agency, which have demonstrated usefulness for capturing social phenomena, such as gender bias, in a broad range of corpora. For decades, lexical frameworks have been foundational tools in computational social science, digital humanities, and natural language processing, facilitating multifaceted analysis of text corpora. But working with verb-centric lexica specifically requires natural language processing skills, reducing their accessibility to other researchers. By organizing the language processing pipeline, providing complete lexicon scores and visualizations for all entities in a corpus, and providing functionality for users to target specific research questions, Riveter greatly improves the accessibility of verb lexica and can facilitate a broad range of future research.",
}
This paper reports on the shared tasks organized by the 20th IWSLT Conference. The shared tasks address 9 scientific challenges in spoken language translation: simultaneous and offline translation, automatic subtitling and dubbing, speech-to-speech translation, multilingual, dialect and low-resource speech translation, and formality control. The shared tasks attracted a total of 38 submissions by 31 teams. The growing interest towards spoken language translation is also witnessed by the constantly increasing number of shared task organizers and contributors to the overview paper, almost evenly distributed across industry and academia.
@inproceedings{agrawal-etal-2023-findings,
title = "{FINDINGS} {OF} {THE} {IWSLT} 2023 {EVALUATION} {CAMPAIGN}",
author = {Agarwal, Milind and
Agrawal, Sweta and
Anastasopoulos, Antonios and
Bentivogli, Luisa and
Bojar, Ond{\v{r}}ej and
Borg, Claudia and
Carpuat, Marine and
Cattoni, Roldano and
Cettolo, Mauro and
Chen, Mingda and
Chen, William and
Choukri, Khalid and
Chronopoulou, Alexandra and
Currey, Anna and
Declerck, Thierry and
Dong, Qianqian and
Duh, Kevin and
Est{\`e}ve, Yannick and
Federico, Marcello and
Gahbiche, Souhir and
Haddow, Barry and
Hsu, Benjamin and
Mon Htut, Phu and
Inaguma, Hirofumi and
Javorsk{\'y}, D{\'a}vid and
Judge, John and
Kano, Yasumasa and
Ko, Tom and
Kumar, Rishu and
Li, Pengwei and
Ma, Xutai and
Mathur, Prashant and
Matusov, Evgeny and
McNamee, Paul and
P. McCrae, John and
Murray, Kenton and
Nadejde, Maria and
Nakamura, Satoshi and
Negri, Matteo and
Nguyen, Ha and
Niehues, Jan and
Niu, Xing and
Kr. Ojha, Atul and
E. Ortega, John and
Pal, Proyag and
Pino, Juan and
van der Plas, Lonneke and
Pol{\'a}k, Peter and
Rippeth, Elijah and
Salesky, Elizabeth and
Shi, Jiatong and
Sperber, Matthias and
St{\"u}ker, Sebastian and
Sudoh, Katsuhito and
Tang, Yun and
Thompson, Brian and
Tran, Kevin and
Turchi, Marco and
Waibel, Alex and
Wang, Mingxuan and
Watanabe, Shinji and
Zevallos, Rodolfo},
editor = "Salesky, Elizabeth and
Federico, Marcello and
Carpuat, Marine",
booktitle = "Proceedings of the 20th International Conference on Spoken Language Translation (IWSLT 2023)",
month = jul,
year = "2023",
address = "Toronto, Canada (in-person and online)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.iwslt-1.1",
doi = "10.18653/v1/2023.iwslt-1.1",
pages = "1--61",
abstract = "This paper reports on the shared tasks organized by the 20th IWSLT Conference. The shared tasks address 9 scientific challenges in spoken language translation: simultaneous and offline translation, automatic subtitling and dubbing, speech-to-speech translation, multilingual, dialect and low-resource speech translation, and formality control. The shared tasks attracted a total of 38 submissions by 31 teams. The growing interest towards spoken language translation is also witnessed by the constantly increasing number of shared task organizers and contributors to the overview paper, almost evenly distributed across industry and academia.",
}
Semantic proto-role labeling (SPRL) assigns properties to arguments based on a series of binary labels. While multiple studies have evaluated various approaches to SPRL, it has only been studied in-depth as a standalone task using gold predicate/argument pairs. How do SPRL systems perform as part of an information extraction pipeline? We model SPRL jointly with predicate-argument extraction using a deep transformer model. We find that proto-role labeling is surprisingly robust in this setting, with only a small decrease when using predicted arguments. We include a detailed analysis of each component of the joint system, and an error analysis to understand correlations in errors between system stages. Finally, we study the effects of annotation errors on SPRL.
@inproceedings{spaulding-etal-2023-joint,
title = "Joint End-to-end Semantic Proto-role Labeling",
author = "Spaulding, Elizabeth and
Kazantsev, Gary and
Dredze, Mark",
editor = "Rogers, Anna and
Boyd-Graber, Jordan and
Okazaki, Naoaki",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-short.63",
doi = "10.18653/v1/2023.acl-short.63",
pages = "723--736",
abstract = "Semantic proto-role labeling (SPRL) assigns properties to arguments based on a series of binary labels. While multiple studies have evaluated various approaches to SPRL, it has only been studied in-depth as a standalone task using gold predicate/argument pairs. How do SPRL systems perform as part of an information extraction pipeline? We model SPRL jointly with predicate-argument extraction using a deep transformer model. We find that proto-role labeling is surprisingly robust in this setting, with only a small decrease when using predicted arguments. We include a detailed analysis of each component of the joint system, and an error analysis to understand correlations in errors between system stages. Finally, we study the effects of annotation errors on SPRL.",
}
Fifteen years of work on entity linking has established the importance of different information sources in making linking decisions: mention and entity name similarity, contextual relevance, and features of the knowledge base. Modern state-of-the-art systems build on these features, including through neural representations (Wu et al., 2020). In contrast to this trend, the autoregressive language model GENRE (De Cao et al., 2021) generates normalized entity names for mentions and beats many other entity linking systems, despite making no use of knowledge base (KB) information. How is this possible? We analyze the behavior of GENRE on several entity linking datasets and demonstrate that its performance stems from memorization of name patterns. In contrast, it fails in cases that might benefit from using the KB. We experiment with a modification to the model to enable it to utilize KB information, highlighting challenges to incorporating traditional entity linking information sources into autoregressive models.
@inproceedings{schumacher-etal-2023-surprising,
title = "On the Surprising Effectiveness of Name Matching Alone in Autoregressive Entity Linking",
author = "Schumacher, Elliot and
Mayfield, James and
Dredze, Mark",
editor = "Hruschka, Estevam and
Mitchell, Tom and
Rahman, Sajjadur and
Mladeni{\'c}, Dunja and
Grobelnik, Marko",
booktitle = "Proceedings of the First Workshop on Matching From Unstructured and Structured Data (MATCHING 2023)",
month = jul,
year = "2023",
address = "Toronto, ON, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.matching-1.6",
doi = "10.18653/v1/2023.matching-1.6",
pages = "58--69",
abstract = "Fifteen years of work on entity linking has established the importance of different information sources in making linking decisions: mention and entity name similarity, contextual relevance, and features of the knowledge base. Modern state-of-the-art systems build on these features, including through neural representations (Wu et al., 2020). In contrast to this trend, the autoregressive language model GENRE (De Cao et al., 2021) generates normalized entity names for mentions and beats many other entity linking systems, despite making no use of knowledge base (KB) information. How is this possible? We analyze the behavior of GENRE on several entity linking datasets and demonstrate that its performance stems from memorization of name patterns. In contrast, it fails in cases that might benefit from using the KB. We experiment with a modification to the model to enable it to utilize KB information, highlighting challenges to incorporating traditional entity linking information sources into autoregressive models.",
}
Autoregressive language models are trained by minimizing the cross-entropy of the model distribution Q relative to the data distribution P {–} that is, minimizing the forward cross-entropy, which is equivalent to maximum likelihood estimation (MLE). We have observed that models trained in this way may {“}over-generalize{”}, in the sense that they produce non-human-like text. Moreover, we believe that reverse cross-entropy, i.e., the cross-entropy of P relative to Q, is a better reflection of how a human would evaluate text generated by a model. Hence, we propose learning with MixCE, an objective that mixes the forward and reverse cross-entropies. We evaluate models trained with this objective on synthetic data settings (where P is known) and real data, and show that the resulting models yield better generated text without complex decoding strategies.
@inproceedings{zhang-etal-2023-mixce,
title = "{M}ix{CE}: Training Autoregressive Language Models by Mixing Forward and Reverse Cross-Entropies",
author = "Zhang, Shiyue and
Wu, Shijie and
Irsoy, Ozan and
Lu, Steven and
Bansal, Mohit and
Dredze, Mark and
Rosenberg, David",
editor = "Rogers, Anna and
Boyd-Graber, Jordan and
Okazaki, Naoaki",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-long.502",
doi = "10.18653/v1/2023.acl-long.502",
pages = "9027--9050",
abstract = "Autoregressive language models are trained by minimizing the cross-entropy of the model distribution Q relative to the data distribution P {--} that is, minimizing the forward cross-entropy, which is equivalent to maximum likelihood estimation (MLE). We have observed that models trained in this way may {``}over-generalize{''}, in the sense that they produce non-human-like text. Moreover, we believe that reverse cross-entropy, i.e., the cross-entropy of P relative to Q, is a better reflection of how a human would evaluate text generated by a model. Hence, we propose learning with MixCE, an objective that mixes the forward and reverse cross-entropies. We evaluate models trained with this objective on synthetic data settings (where P is known) and real data, and show that the resulting models yield better generated text without complex decoding strategies.",
}
Large language models have achieved impressive few-shot performance on a wide variety of tasks. However, in many settings, users require confidence estimates for model predictions. While traditional classifiers produce scores for each label, language models instead produce scores for the generation which may not be well calibrated. We compare generations across diverse prompts and show that these can be used to create confidence scores. By utilizing more prompts we can get more precise confidence estimates and use response diversity as a proxy for confidence. We evaluate this approach across ten multiple-choice question-answering datasets using three models: T0, FLAN-T5, and GPT-3. In addition to analyzing multiple human written prompts, we automatically generate more prompts using a language model in order to produce finer-grained confidence estimates. Our method produces more calibrated confidence estimates compared to the log probability of the answer to a single prompt. These improvements could benefit users who rely on prediction confidence for integration into a larger system or in decision-making processes.
@inproceedings{portillo-wightman-etal-2023-strength,
title = "Strength in Numbers: Estimating Confidence of Large Language Models by Prompt Agreement",
author = "Portillo Wightman, Gwenyth and
Delucia, Alexandra and
Dredze, Mark",
editor = "Ovalle, Anaelia and
Chang, Kai-Wei and
Mehrabi, Ninareh and
Pruksachatkun, Yada and
Galystan, Aram and
Dhamala, Jwala and
Verma, Apurv and
Cao, Trista and
Kumar, Anoop and
Gupta, Rahul",
booktitle = "Proceedings of the 3rd Workshop on Trustworthy Natural Language Processing (TrustNLP 2023)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.trustnlp-1.28",
doi = "10.18653/v1/2023.trustnlp-1.28",
pages = "326--362",
abstract = "Large language models have achieved impressive few-shot performance on a wide variety of tasks. However, in many settings, users require confidence estimates for model predictions. While traditional classifiers produce scores for each label, language models instead produce scores for the generation which may not be well calibrated. We compare generations across diverse prompts and show that these can be used to create confidence scores. By utilizing more prompts we can get more precise confidence estimates and use response diversity as a proxy for confidence. We evaluate this approach across ten multiple-choice question-answering datasets using three models: T0, FLAN-T5, and GPT-3. In addition to analyzing multiple human written prompts, we automatically generate more prompts using a language model in order to produce finer-grained confidence estimates. Our method produces more calibrated confidence estimates compared to the log probability of the answer to a single prompt. These improvements could benefit users who rely on prediction confidence for integration into a larger system or in decision-making processes.",
}
We present a simple yet efficient method to enhance the quality of machine translation models trained on multimodal corpora by augmenting the training text with labels of detected objects in the corresponding video segments. We then test the effects of label augmentation in both baseline and two automatic speech recognition (ASR) conditions. In contrast with multimodal techniques that merge visual and textual features, our modular method is easy to implement and the results are more interpretable. Comparisons are made with Transformer translation architectures trained with baseline and augmented labels, showing improvements of up to +1.0 BLEU on the How2 dataset.
@inproceedings{gwinnup-etal-2023-enhancing,
title = "Enhancing Video Translation Context with Object Labels",
author = "Gwinnup, Jeremy and
Anderson, Tim and
Ore, Brian and
Hansen, Eric and
Duh, Kevin",
editor = "Salesky, Elizabeth and
Federico, Marcello and
Carpuat, Marine",
booktitle = "Proceedings of the 20th International Conference on Spoken Language Translation (IWSLT 2023)",
month = jul,
year = "2023",
address = "Toronto, Canada (in-person and online)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.iwslt-1.8",
doi = "10.18653/v1/2023.iwslt-1.8",
pages = "130--137",
abstract = "We present a simple yet efficient method to enhance the quality of machine translation models trained on multimodal corpora by augmenting the training text with labels of detected objects in the corresponding video segments. We then test the effects of label augmentation in both baseline and two automatic speech recognition (ASR) conditions. In contrast with multimodal techniques that merge visual and textual features, our modular method is easy to implement and the results are more interpretable. Comparisons are made with Transformer translation architectures trained with baseline and augmented labels, showing improvements of up to +1.0 BLEU on the How2 dataset.",
}
Widespread disparities in clinical outcomes exist between different demographic groups in the United States. A new line of work in medical sociology has demonstrated physicians often use stigmatizing language in electronic medical records within certain groups, such as black patients, which may exacerbate disparities. In this study, we characterize these instances at scale using a series of domain-informed NLP techniques. We highlight important differences between this task and analogous bias-related tasks studied within the NLP community (e.g., classifying microaggressions). Our study establishes a foundation for NLP researchers to contribute timely insights to a problem domain brought to the forefront by recent legislation regarding clinical documentation transparency. We release data, code, and models.
@inproceedings{harrigian-etal-2023-characterization,
title = "Characterization of Stigmatizing Language in Medical Records",
author = "Harrigian, Keith and
Zirikly, Ayah and
Chee, Brant and
Ahmad, Alya and
Links, Anne and
Saha, Somnath and
Beach, Mary Catherine and
Dredze, Mark",
editor = "Rogers, Anna and
Boyd-Graber, Jordan and
Okazaki, Naoaki",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-short.28",
doi = "10.18653/v1/2023.acl-short.28",
pages = "312--329",
abstract = "Widespread disparities in clinical outcomes exist between different demographic groups in the United States. A new line of work in medical sociology has demonstrated physicians often use stigmatizing language in electronic medical records within certain groups, such as black patients, which may exacerbate disparities. In this study, we characterize these instances at scale using a series of domain-informed NLP techniques. We highlight important differences between this task and analogous bias-related tasks studied within the NLP community (e.g., classifying microaggressions). Our study establishes a foundation for NLP researchers to contribute timely insights to a problem domain brought to the forefront by recent legislation regarding clinical documentation transparency. We release data, code, and models.",
}
Natural language is ambiguous. Resolving ambiguous questions is key to successfully answering them. Focusing on questions about images, we create a dataset of ambiguous examples. We annotate these, grouping answers by the underlying question they address and rephrasing the question for each group to reduce ambiguity. Our analysis reveals a linguistically-aligned ontology of reasons for ambiguity in visual questions. We then develop an English question-generation model which we demonstrate via automatic and human evaluation produces less ambiguous questions. We further show that the question generation objective we use allows the model to integrate answer group information without any direct supervision.
@inproceedings{stengel-eskin-etal-2023-chicken,
title = "Why Did the Chicken Cross the Road? Rephrasing and Analyzing Ambiguous Questions in {VQA}",
author = "Stengel-Eskin, Elias and
Guallar-Blasco, Jimena and
Zhou, Yi and
Van Durme, Benjamin",
editor = "Rogers, Anna and
Boyd-Graber, Jordan and
Okazaki, Naoaki",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-long.569",
doi = "10.18653/v1/2023.acl-long.569",
pages = "10220--10237",
abstract = "Natural language is ambiguous. Resolving ambiguous questions is key to successfully answering them. Focusing on questions about images, we create a dataset of ambiguous examples. We annotate these, grouping answers by the underlying question they address and rephrasing the question for each group to reduce ambiguity. Our analysis reveals a linguistically-aligned ontology of reasons for ambiguity in visual questions. We then develop an English question-generation model which we demonstrate via automatic and human evaluation produces less ambiguous questions. We further show that the question generation objective we use allows the model to integrate answer group information without any direct supervision.",
}
Despite their impressive performance on diverse tasks, large language models (LMs) still struggle with tasks requiring rich world knowledge, implying the difficulty of encoding a wealth of world knowledge in their parameters. This paper aims to understand LMs{‘} strengths and limitations in memorizing factual knowledge, by conducting large-scale knowledge probing experiments on two open-domain entity-centric QA datasets: PopQA, our new dataset with 14k questions about long-tail entities, and EntityQuestions, a widely used open-domain QA dataset. We find that LMs struggle with less popular factual knowledge, and that retrieval augmentation helps significantly in these cases. Scaling, on the other hand, mainly improves memorization of popular knowledge, and fails to appreciably improve memorization of factual knowledge in the tail. Based on those findings, we devise a new method for retrieval-augmentation that improves performance and reduces inference costs by only retrieving non-parametric memories when necessary.
@inproceedings{mallen-etal-2023-trust,
title = "When Not to Trust Language Models: Investigating Effectiveness of Parametric and Non-Parametric Memories",
author = "Mallen, Alex and
Asai, Akari and
Zhong, Victor and
Das, Rajarshi and
Khashabi, Daniel and
Hajishirzi, Hannaneh",
editor = "Rogers, Anna and
Boyd-Graber, Jordan and
Okazaki, Naoaki",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-long.546",
doi = "10.18653/v1/2023.acl-long.546",
pages = "9802--9822",
abstract = "Despite their impressive performance on diverse tasks, large language models (LMs) still struggle with tasks requiring rich world knowledge, implying the difficulty of encoding a wealth of world knowledge in their parameters. This paper aims to understand LMs{'} strengths and limitations in memorizing factual knowledge, by conducting large-scale knowledge probing experiments on two open-domain entity-centric QA datasets: PopQA, our new dataset with 14k questions about long-tail entities, and EntityQuestions, a widely used open-domain QA dataset. We find that LMs struggle with less popular factual knowledge, and that retrieval augmentation helps significantly in these cases. Scaling, on the other hand, mainly improves memorization of popular knowledge, and fails to appreciably improve memorization of factual knowledge in the tail. Based on those findings, we devise a new method for retrieval-augmentation that improves performance and reduces inference costs by only retrieving non-parametric memories when necessary.",
}
Although recent neural models for coreference resolution have led to substantial improvements on benchmark datasets, it remains a challenge to successfully transfer these models to new target domains containing many out-of-vocabulary spans and requiring differing annotation schemes. Typical approaches involve continued training on annotated target-domain data, but obtaining annotations is costly and time-consuming. In this work, we show that adapting mention detection is the key component to successful domain adaptation of coreference models, rather than antecedent linking. We also show annotating mentions alone is nearly twice as fast as annotating full coreference chains. Based on these insights, we propose a method for efficiently adapting coreference models, which includes a high-precision mention detection objective and requires only mention annotations in the target domain. Extensive evaluation across three English coreference datasets: CoNLL-2012 (news/conversation), i2b2/VA (medical notes), and child welfare notes, reveals that our approach facilitates annotation-efficient transfer and results in a 7-14{\%} improvement in average F1 without increasing annotator time.
@inproceedings{gandhi-etal-2023-annotating,
title = "Annotating Mentions Alone Enables Efficient Domain Adaptation for Coreference Resolution",
author = "Gandhi, Nupoor and
Field, Anjalie and
Strubell, Emma",
editor = "Rogers, Anna and
Boyd-Graber, Jordan and
Okazaki, Naoaki",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-long.588",
doi = "10.18653/v1/2023.acl-long.588",
pages = "10543--10558",
abstract = "Although recent neural models for coreference resolution have led to substantial improvements on benchmark datasets, it remains a challenge to successfully transfer these models to new target domains containing many out-of-vocabulary spans and requiring differing annotation schemes. Typical approaches involve continued training on annotated target-domain data, but obtaining annotations is costly and time-consuming. In this work, we show that adapting mention detection is the key component to successful domain adaptation of coreference models, rather than antecedent linking. We also show annotating mentions alone is nearly twice as fast as annotating full coreference chains. Based on these insights, we propose a method for efficiently adapting coreference models, which includes a high-precision mention detection objective and requires only mention annotations in the target domain. Extensive evaluation across three English coreference datasets: CoNLL-2012 (news/conversation), i2b2/VA (medical notes), and child welfare notes, reveals that our approach facilitates annotation-efficient transfer and results in a 7-14{\%} improvement in average F1 without increasing annotator time.",
}
Large {“}instruction-tuned{”} language models (i.e., finetuned to respond to instructions) have demonstrated a remarkable ability to generalize zero-shot to new tasks. Nevertheless, they depend heavily on human-written instruction data that is often limited in quantity, diversity, and creativity, therefore hindering the generality of the tuned model. We introduce Self-Instruct, a framework for improving the instruction-following capabilities of pretrained language models by bootstrapping off their own generations. Our pipeline generates instructions, input, and output samples from a language model, then filters invalid or similar ones before using them to finetune the original model. Applying our method to the vanilla GPT3, we demonstrate a 33{\%} absolute improvement over the original model on Super-NaturalInstructions, on par with the performance of InstructGPT-001, which was trained with private user data and human annotations. For further evaluation, we curate a set of expert-written instructions for novel tasks, and show through human evaluation that tuning GPT3 with Self-Instruct outperforms using existing public instruction datasets by a large margin, leaving only a 5{\%} absolute gap behind InstructGPT-001. Self-Instruct provides an almost annotation-free method for aligning pre-trained language models with instructions, and we release our large synthetic dataset to facilitate future studies on instruction tuning.
@inproceedings{wang-etal-2023-self-instruct,
title = "Self-Instruct: Aligning Language Models with Self-Generated Instructions",
author = "Wang, Yizhong and
Kordi, Yeganeh and
Mishra, Swaroop and
Liu, Alisa and
Smith, Noah A. and
Khashabi, Daniel and
Hajishirzi, Hannaneh",
editor = "Rogers, Anna and
Boyd-Graber, Jordan and
Okazaki, Naoaki",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-long.754",
doi = "10.18653/v1/2023.acl-long.754",
pages = "13484--13508",
abstract = "Large {``}instruction-tuned{''} language models (i.e., finetuned to respond to instructions) have demonstrated a remarkable ability to generalize zero-shot to new tasks. Nevertheless, they depend heavily on human-written instruction data that is often limited in quantity, diversity, and creativity, therefore hindering the generality of the tuned model. We introduce Self-Instruct, a framework for improving the instruction-following capabilities of pretrained language models by bootstrapping off their own generations. Our pipeline generates instructions, input, and output samples from a language model, then filters invalid or similar ones before using them to finetune the original model. Applying our method to the vanilla GPT3, we demonstrate a 33{\%} absolute improvement over the original model on Super-NaturalInstructions, on par with the performance of InstructGPT-001, which was trained with private user data and human annotations. For further evaluation, we curate a set of expert-written instructions for novel tasks, and show through human evaluation that tuning GPT3 with Self-Instruct outperforms using existing public instruction datasets by a large margin, leaving only a 5{\%} absolute gap behind InstructGPT-001. Self-Instruct provides an almost annotation-free method for aligning pre-trained language models with instructions, and we release our large synthetic dataset to facilitate future studies on instruction tuning.",
}
How reliably can we trust the scores obtained from social bias benchmarks as faithful indicators of problematic social biases in a given model? In this work, we study this question by contrasting social biases with non-social biases that stem from choices made during dataset construction (which might not even be discernible to the human eye). To do so, we empirically simulate various alternative constructions for a given benchmark based on seemingly innocuous modifications (such as paraphrasing or random-sampling) that maintain the essence of their social bias. On two well-known social bias benchmarks (Winogender and BiasNLI), we observe that these shallow modifications have a surprising effect on the resulting degree of bias across various models and consequently the relative ordering of these models when ranked by measured bias. We hope these troubling observations motivate more robust measures of social biases.
@inproceedings{selvam-etal-2023-tail,
title = "The Tail Wagging the Dog: Dataset Construction Biases of Social Bias Benchmarks",
author = "Selvam, Nikil and
Dev, Sunipa and
Khashabi, Daniel and
Khot, Tushar and
Chang, Kai-Wei",
editor = "Rogers, Anna and
Boyd-Graber, Jordan and
Okazaki, Naoaki",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-short.118",
doi = "10.18653/v1/2023.acl-short.118",
pages = "1373--1386",
abstract = "How reliably can we trust the scores obtained from social bias benchmarks as faithful indicators of problematic social biases in a given model? In this work, we study this question by contrasting social biases with non-social biases that stem from choices made during dataset construction (which might not even be discernible to the human eye). To do so, we empirically simulate various alternative constructions for a given benchmark based on seemingly innocuous modifications (such as paraphrasing or random-sampling) that maintain the essence of their social bias. On two well-known social bias benchmarks (Winogender and BiasNLI), we observe that these shallow modifications have a surprising effect on the resulting degree of bias across various models and consequently the relative ordering of these models when ranked by measured bias. We hope these troubling observations motivate more robust measures of social biases.",
}
@InProceedings{fang-et-al-2023,
author = "Hao Fang and Anusha Balakrishnan and Harsh Jhamtani
and John Bufe and Jean Crawford and Jayant
Krishnamurthy and Adam Pauls and Jason Eisner and Jacob
Andreas and Dan Klein",
title = "The Whole Truth and Nothing But the Truth: Faithful
and Controllable Dialogue Response Generation with
Dataflow Transduction and Constrained Decoding",
booktitle = "Findings of the Association for Computational
Linguistics: ACL 2023",
year = "2023",
month = jul,
pages = "5682--5700",
URL = "http://cs.jhu.edu/~jason/papers/#fang-et-al-2023",
}
@InProceedings{li-et-al-2023-dictation,
author = "Belinda Z. Li and Jason Eisner and Adam Pauls and Sam
Thomson",
title = "Toward Interactive Dictation",
booktitle = "Proceedings of the Association for Computational
Linguistics (ACL)",
year = "2023",
month = jul,
pages = "15319--15338",
URL = "http://cs.jhu.edu/~jason/papers/#li-et-al-2023-dictation",
}
@InProceedings{mireshghallah-et-al-2023,
author = "Fatemehsadat Mireshghallah and Yu Su and Tatsunori
Hashimoto and Jason Eisner and Richard Shin",
title = "Privacy-Preserving Domain Adaptation of Semantic
Parsers",
booktitle = "Proceedings of the Association for Computational
Linguistics (ACL)",
year = "2023",
month = jul,
pages = "4950--4970",
URL = "http://cs.jhu.edu/~jason/papers/#mireshghallah-et-al-2023",
}
@InProceedings{li-et-al-2023-cd,
author = "Xiang Lisa Li and Ari Holtzman and Daniel Fried and
Percy Liang and Jason Eisner and Tatsunori Hashimoto
and Luke Zettlemoyer and Mike Lewis",
title = "Contrastive Decoding: Open-ended Text Generation as
Optimization",
booktitle = "Proceedings of the Association for Computational
Linguistics (ACL)",
year = "2023",
month = jul,
pages = "12286--12312",
URL = "http://cs.jhu.edu/~jason/papers/#li-et-al-2023-cd",
}
@InProceedings{du-et-al-2023,
author = "Li Du and Lucas Torroba Hennigen and Tiago Pimentel
and Clara Meister and Jason Eisner and Ryan Cotterell",
title = "A Measure-Theoretic Characterization of Tight Language
Models",
booktitle = "Proceedings of the Association for Computational
Linguistics (ACL)",
year = "2023",
month = jul,
pages = "9744--9770",
URL = "http://cs.jhu.edu/~jason/papers/#du-et-al-2023",
}
@InProceedings{opedal-et-al-2023,
author = "Andreas Opedal and Ran Zmigrod and Tim Vieira and Ryan
Cotterell and Jason Eisner",
title = "Efficient Semiring-Weighted {E}arley Parsing",
booktitle = "Proceedings of the Association for Computational
Linguistics (ACL)",
year = "2023",
month = jul,
pages = "3687--3713",
URL = "http://cs.jhu.edu/~jason/papers/#opedal-et-al-2023",
}
Automated Machine Learning (AutoML) is an emerging field that has potential to impact how we build models in NLP. As an umbrella term that includes topics like hyperparameter optimization and neural architecture search, AutoML has recently become mainstream at major conferences such as NeurIPS, ICML, and ICLR. What does this mean to NLP? Currently, models are often built in an ad hoc process: we might borrow default hyperparameters from previous work and try a few variant architectures, but it is never guaranteed that final trained model is optimal. Automation can introduce rigor in this model-building process. This tutorial will summarize the main AutoML techniques and illustrate how to apply them to improve the NLP model-building process.
@inproceedings{duh-zhang-2023-automl,
title = "{A}uto{ML} for {NLP}",
author = "Duh, Kevin and
Zhang, Xuan",
editor = "Zanzotto, Fabio Massimo and
Pradhan, Sameer",
booktitle = "Proceedings of the 17th Conference of the European Chapter of the Association for Computational Linguistics: Tutorial Abstracts",
month = may,
year = "2023",
address = "Dubrovnik, Croatia",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.eacl-tutorials.5",
doi = "10.18653/v1/2023.eacl-tutorials.5",
pages = "25--26",
abstract = "Automated Machine Learning (AutoML) is an emerging field that has potential to impact how we build models in NLP. As an umbrella term that includes topics like hyperparameter optimization and neural architecture search, AutoML has recently become mainstream at major conferences such as NeurIPS, ICML, and ICLR. What does this mean to NLP? Currently, models are often built in an ad hoc process: we might borrow default hyperparameters from previous work and try a few variant architectures, but it is never guaranteed that final trained model is optimal. Automation can introduce rigor in this model-building process. This tutorial will summarize the main AutoML techniques and illustrate how to apply them to improve the NLP model-building process.",
}
Multilingual sentence representations from large models encode semantic information from two or more languages and can be used for different cross-lingual information retrieval and matching tasks. In this paper, we integrate contrastive learning into multilingual representation distillation and use it for quality estimation of parallel sentences (i.e., find semantically similar sentences that can be used as translations of each other). We validate our approach with multilingual similarity search and corpus filtering tasks. Experiments across different low-resource languages show that our method greatly outperforms previous sentence encoders such as LASER, LASER3, and LaBSE.
@inproceedings{tan-etal-2023-multilingual,
title = "Multilingual Representation Distillation with Contrastive Learning",
author = "Tan, Weiting and
Heffernan, Kevin and
Schwenk, Holger and
Koehn, Philipp",
editor = "Vlachos, Andreas and
Augenstein, Isabelle",
booktitle = "Proceedings of the 17th Conference of the European Chapter of the Association for Computational Linguistics",
month = may,
year = "2023",
address = "Dubrovnik, Croatia",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.eacl-main.108",
doi = "10.18653/v1/2023.eacl-main.108",
pages = "1477--1490",
abstract = "Multilingual sentence representations from large models encode semantic information from two or more languages and can be used for different cross-lingual information retrieval and matching tasks. In this paper, we integrate contrastive learning into multilingual representation distillation and use it for quality estimation of parallel sentences (i.e., find semantically similar sentences that can be used as translations of each other). We validate our approach with multilingual similarity search and corpus filtering tasks. Experiments across different low-resource languages show that our method greatly outperforms previous sentence encoders such as LASER, LASER3, and LaBSE.",
}
Transformer models cannot easily scale to long sequences due to their O(N{\^{}}2) time and space complexity. This has led to Transformer variants seeking to lower computational complexity, such as Longformer and Performer. While such models have theoretically greater efficiency, their effectiveness on real NLP tasks has not been well studied. We benchmark 7 variants of Transformer models on 5 difficult NLP tasks and 7 datasets. We design experiments to isolate the effect of pretraining and hyperparameter settings, to focus on their capacity for long-range attention. Moreover, we present various methods to investigate attention behaviors to illuminate model details beyond metric scores. We find that the modified attention in long-range transformers has advantages on content selection and query-guided decoding, but they come with previously unrecognized drawbacks such as insufficient attention to distant tokens and accumulated approximation error.
@inproceedings{qin-etal-2023-nlp,
title = "The {NLP} Task Effectiveness of Long-Range Transformers",
author = "Qin, Guanghui and
Feng, Yukun and
Van Durme, Benjamin",
editor = "Vlachos, Andreas and
Augenstein, Isabelle",
booktitle = "Proceedings of the 17th Conference of the European Chapter of the Association for Computational Linguistics",
month = may,
year = "2023",
address = "Dubrovnik, Croatia",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.eacl-main.273",
doi = "10.18653/v1/2023.eacl-main.273",
pages = "3774--3790",
abstract = "Transformer models cannot easily scale to long sequences due to their O(N{\^{}}2) time and space complexity. This has led to Transformer variants seeking to lower computational complexity, such as Longformer and Performer. While such models have theoretically greater efficiency, their effectiveness on real NLP tasks has not been well studied. We benchmark 7 variants of Transformer models on 5 difficult NLP tasks and 7 datasets. We design experiments to isolate the effect of pretraining and hyperparameter settings, to focus on their capacity for long-range attention. Moreover, we present various methods to investigate attention behaviors to illuminate model details beyond metric scores. We find that the modified attention in long-range transformers has advantages on content selection and query-guided decoding, but they come with previously unrecognized drawbacks such as insufficient attention to distant tokens and accumulated approximation error.",
}
We present a novel iterative extraction model, IterX, for extracting complex relations, or templates, i.e., N-tuples representing a mapping from named slots to spans of text within a document. Documents may feature zero or more instances of a template of any given type, and the task of template extraction entails identifying the templates in a document and extracting each template{‘}s slot values. Our imitation learning approach casts the problem as a Markov decision process (MDP), and relieves the need to use predefined template orders to train an extractor. It leads to state-of-the-art results on two established benchmarks {–} 4-ary relation extraction on SciREX and template extraction on MUC-4 {–} as well as a strong baseline on the new BETTER Granular task.
@inproceedings{chen-etal-2023-iterative,
title = "Iterative Document-level Information Extraction via Imitation Learning",
author = "Chen, Yunmo and
Gantt, William and
Gu, Weiwei and
Chen, Tongfei and
White, Aaron and
Van Durme, Benjamin",
editor = "Vlachos, Andreas and
Augenstein, Isabelle",
booktitle = "Proceedings of the 17th Conference of the European Chapter of the Association for Computational Linguistics",
month = may,
year = "2023",
address = "Dubrovnik, Croatia",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.eacl-main.136",
doi = "10.18653/v1/2023.eacl-main.136",
pages = "1858--1874",
abstract = "We present a novel iterative extraction model, IterX, for extracting complex relations, or templates, i.e., N-tuples representing a mapping from named slots to spans of text within a document. Documents may feature zero or more instances of a template of any given type, and the task of template extraction entails identifying the templates in a document and extracting each template{'}s slot values. Our imitation learning approach casts the problem as a Markov decision process (MDP), and relieves the need to use predefined template orders to train an extractor. It leads to state-of-the-art results on two established benchmarks {--} 4-ary relation extraction on SciREX and template extraction on MUC-4 {--} as well as a strong baseline on the new BETTER Granular task.",
}
@inproceedings{259373518,
title = {Making Your First Choice: To Address Cold Start Problem in Medical Active Learning},
author = {{Liangyu Chen} and {Yutong Bai} and {A. Yuille} and {Zongwei Zhou}},
year = 2023,
booktitle = {International Conference on Medical Imaging with Deep Learning},
url = {https://www.semanticscholar.org/paper/251516c1549fc4566b801788c932ef1f18f343b3},
}
@inproceedings{260909100,
title = {Segmental SpeechCLIP: Utilizing Pretrained Image-text Models for Audio-Visual Learning},
author = {{Saurabhchand Bhati} and {J. Villalba} and {L. Moro-Velázquez} and {Thomas Thebaud} and {N. Dehak}},
year = 2023,
month = {8},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/1617d389b7947161f2943e2d30afeb1856052b14},
}
@inproceedings{258967563,
title = {Investigating model performance in language identification: beyond simple error statistics},
author = {{S. Styles} and {Victoria Y. H. Chua} and {Fei Ting Woon} and {Hexin Liu} and {Leibny Paola García Perera} and {S. Khudanpur} and {Andy W. H. Khong} and {J. Dauwels}},
year = 2023,
month = {5},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/5550d0db7030aa77480bfb10c4ec00862bb233eb},
}
@inproceedings{255569926,
title = {Benchmarking Robustness in Neural Radiance Fields},
author = {{Chen Wang} and {Angtian Wang} and {Junbo Li} and {A. Yuille} and {Cihang Xie}},
year = 2023,
month = {1},
booktitle = {2024 IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)},
url = {https://www.semanticscholar.org/paper/eaf0c04e9784d6efc8f9ce16d1d9c3ae43506ad9},
}
For many languages, machine translation progress is hindered by the lack of reliable training data. Models are trained on whatever pre-existing datasets may be available and then augmented with synthetic data, because it is often not economical to pay for the creation of large-scale datasets. But for the case of low-resource languages, would the creation of a few thousand professionally translated sentence pairs give any benefit? In this paper, we show that it does. We describe a broad data collection effort involving around 6k professionally translated sentence pairs for each of 39 low-resource languages, which we make publicly available. We analyse the gains of models trained on this small but high-quality data, showing that it has significant impact even when larger but lower quality pre-existing corpora are used, or when data is augmented with millions of sentences through backtranslation.
@inproceedings{maillard-etal-2023-small,
title = "Small Data, Big Impact: Leveraging Minimal Data for Effective Machine Translation",
author = "Maillard, Jean and
Gao, Cynthia and
Kalbassi, Elahe and
Sadagopan, Kaushik Ram and
Goswami, Vedanuj and
Koehn, Philipp and
Fan, Angela and
Guzman, Francisco",
editor = "Rogers, Anna and
Boyd-Graber, Jordan and
Okazaki, Naoaki",
booktitle = "Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = jul,
year = "2023",
address = "Toronto, Canada",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.acl-long.154",
doi = "10.18653/v1/2023.acl-long.154",
pages = "2740--2756",
abstract = "For many languages, machine translation progress is hindered by the lack of reliable training data. Models are trained on whatever pre-existing datasets may be available and then augmented with synthetic data, because it is often not economical to pay for the creation of large-scale datasets. But for the case of low-resource languages, would the creation of a few thousand professionally translated sentence pairs give any benefit? In this paper, we show that it does. We describe a broad data collection effort involving around 6k professionally translated sentence pairs for each of 39 low-resource languages, which we make publicly available. We analyse the gains of models trained on this small but high-quality data, showing that it has significant impact even when larger but lower quality pre-existing corpora are used, or when data is augmented with millions of sentences through backtranslation.",
}
@inproceedings{258460982,
title = {Towards Being Parameter-Efficient: A Stratified Sparsely Activated Transformer with Dynamic Capacity},
author = {{Haoran Xu} and {Maha Elbayad} and {Kenton Murray} and {Jean Maillard} and {Vedanuj Goswami}},
year = 2023,
month = {5},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/09d3a354d22d75deddb0dcc99870f307aae2fd3c},
}
@inproceedings{257687311,
title = {ReBotNet: Fast Real-time Video Enhancement},
author = {{Jeya Maria Jose Valanarasu} and {Rahul Garg} and {Andeep S. Toor} and {Xin Tong} and {Weijuan Xi} and {Andreas Lugmayr} and {Vishal M. Patel} and {A. Menini}},
year = 2023,
month = {3},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/15c2b3ecdf1b9af2f94a2b106fddcfc89cb336cb},
}
@inproceedings{257557771,
title = {Deep Metric Learning for Unsupervised Remote Sensing Change Detection},
author = {{W. G. C. Bandara} and {Vishal M. Patel}},
year = 2023,
month = {3},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/30d02457a38374398deca536682c193f0f0b1a24},
}
Many machine translation toolkits make use of a data preparation step wherein raw data is transformed into a tensor format that can be used directly by the trainer. This preparation step is increasingly at odds with modern research and development practices because this process produces a static, unchangeable version of the training data, making common training-time needs difficult (e.g., subword sampling), time-consuming (preprocessing with large data can take days), expensive (e.g., disk space), and cumbersome (managing experiment combinatorics). We propose an alternative approach that separates the generation of data from the consumption of that data. In this approach, there is no separate pre-processing step; data generation produces an infinite stream of permutations of the raw training data, which the trainer tensorizes and batches as it is consumed. Additionally, this data stream can be manipulated by a set of user-definable operators that provide on-the-fly modifications, such as data normalization, augmentation or filtering. We release an open-source toolkit, SOTASTREAM, that implements this approach: https://github.com/marian-nmt/sotastream. We show that it cuts training time, adds flexibility, reduces experiment management complexity, and reduces disk space, all without affecting the accuracy of the trained models.
@inproceedings{post-etal-2023-sotastream,
title = "{SOTASTREAM}: A Streaming Approach to Machine Translation Training",
author = "Post, Matt and
Gowda, Thamme and
Grundkiewicz, Roman and
Khayrallah, Huda and
Jain, Rohit and
Junczys-Dowmunt, Marcin",
editor = "Tan, Liling and
Milajevs, Dmitrijs and
Chauhan, Geeticka and
Gwinnup, Jeremy and
Rippeth, Elijah",
booktitle = "Proceedings of the 3rd Workshop for Natural Language Processing Open Source Software (NLP-OSS 2023)",
month = dec,
year = "2023",
address = "Singapore",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.nlposs-1.13",
doi = "10.18653/v1/2023.nlposs-1.13",
pages = "110--119",
abstract = "Many machine translation toolkits make use of a data preparation step wherein raw data is transformed into a tensor format that can be used directly by the trainer. This preparation step is increasingly at odds with modern research and development practices because this process produces a static, unchangeable version of the training data, making common training-time needs difficult (e.g., subword sampling), time-consuming (preprocessing with large data can take days), expensive (e.g., disk space), and cumbersome (managing experiment combinatorics). We propose an alternative approach that separates the generation of data from the consumption of that data. In this approach, there is no separate pre-processing step; data generation produces an infinite stream of permutations of the raw training data, which the trainer tensorizes and batches as it is consumed. Additionally, this data stream can be manipulated by a set of user-definable operators that provide on-the-fly modifications, such as data normalization, augmentation or filtering. We release an open-source toolkit, SOTASTREAM, that implements this approach: https://github.com/marian-nmt/sotastream. We show that it cuts training time, adds flexibility, reduces experiment management complexity, and reduces disk space, all without affecting the accuracy of the trained models.",
}
@inproceedings{259924959,
title = {MegaWika: Millions of reports and their sources across 50 diverse languages},
author = {{Samuel Barham} and {Orion Weller} and {Michelle Yuan} and {Kenton Murray} and {M. Yarmohammadi} and {Zhengping Jiang} and {Siddharth Vashishtha} and {Alexander Martin} and {Anqi Liu} and {Aaron Steven White} and {Jordan L. Boyd-Graber} and {Benjamin Van Durme}},
year = 2023,
month = {7},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/c8e2b9f68bd585759d31741193516f58b5619584},
}
@inproceedings{260918551,
title = {Advances in Language Recognition in Low Resource African Languages: The JHU-MIT Submission for NIST LRE22},
author = {{J. Villalba} and {Jonas Borgstrom} and {Maliha Jahan} and {Saurabh Kataria} and {Leibny Paola García} and {P. Torres-Carrasquillo} and {N. Dehak}},
year = 2023,
month = {8},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/51aca07d500c44ebde896b8df3b0388dd3ade489},
}
@inproceedings{255372874,
title = {Learning Road Scene-level Representations via Semantic Region Prediction},
author = {{Zihao Xiao} and {A. Yuille} and {Yi-Ting Chen}},
year = 2023,
month = {1},
booktitle = {Conference on Robot Learning},
url = {https://www.semanticscholar.org/paper/11b29ca1a235d80a2e55f6eb7711d2aa5785bb8c},
}
@inproceedings{263134276,
title = {The Trickle-down Impact of Reward (In-)consistency on RLHF},
author = {{Lingfeng Shen} and {Sihao Chen} and {Linfeng Song} and {Lifeng Jin} and {Baolin Peng} and {Haitao Mi} and {Daniel Khashabi} and {Dong Yu}},
year = 2023,
month = {9},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/541b66bad4a9bf9b7fd97f13f94ab9061c7c0c47},
}
@inproceedings{271601672,
title = {Beyond the Imitation Game: Quantifying and extrapolating the capabilities of language models},
author = {{Aarohi Srivastava} and {Abhinav Rastogi} and {Abhishek Rao} and {Abu Awal Md Shoeb} and {Abubakar Abid} and {Adam Fisch} and {Adam R. Brown} and {Adam Santoro} and {Aditya Gupta} and {Adrià Garriga-Alonso} and {Agnieszka Kluska} and {Aitor Lewkowycz} and {Akshat Agarwal} and {Alethea Power} and {Alex Ray} and {Alex Warstadt} and {Alexander W. Kocurek} and {Ali Safaya} and {Ali Tazarv} and {Alice Xiang} and {Alicia Parrish} and {Allen Nie} and {Aman Hussain} and {Amanda Askell} and {Amanda Dsouza} and {Ambrose Slone} and {Ameet Rahane} and {Anantharaman S. Iyer} and {Anders Andreassen} and {Andrea Madotto} and {A. Santilli} and {Andreas Stuhlmüller} and {Andrew M. Dai} and {Andrew La} and {Andrew K. Lampinen} and {Andy Zou} and {Angela Jiang} and {Angelica Chen} and {Anh Vuong} and {Animesh Gupta} and {Anna Gottardi} and {Antonio Norelli} and {Anu Venkatesh} and {Arash Gholamidavoodi} and {A. Tabassum} and {Arul Menezes} and {Arun Kirubarajan} and {A. Mullokandov} and {Ashish Sabharwal} and {Austin Herrick} and {Avia Efrat} and {Aykut Erdem} and {Ayla Karakas} and {B. R. Roberts} and {B. S. Loe} and {Barret Zoph} and {Bartlomiej Bojanowski} and {Batuhan Özyurt} and {Behnam Hedayatnia} and {Behnam Neyshabur} and {Benjamin Inden} and {Benno Stein} and {Berk Ekmekci} and {Bill Yuchen Lin} and {B. Howald} and {Bryan Orinion} and {Cameron Diao} and {Cameron Dour} and {Catherine Stinson} and {Cedrick Argueta} and {Cèsar Ferri Ramírez} and {Chandan Singh} and {Charles Rathkopf} and {Chenlin Meng} and {Chitta Baral} and {Chiyu Wu} and {Christopher Callison-Burch} and {Christian Waites} and {Christian Voigt} and {Christopher D. Manning} and {Christopher Potts} and {Cindy Ramirez} and {Clara E. Rivera} and {Clemencia Siro} and {Colin Raffel} and {Courtney Ashcraft} and {Cristina Garbacea} and {Damien Sileo} and {Daniel H Garrette} and {Dan Hendrycks} and {D. Kilman} and {Dan Roth} and {Daniel Freeman} and {Daniel Khashabi} and {Daniel Levy} and {Daniel Moseguí González} and {Danielle Perszyk} and {Danny Hernandez} and {Danqi Chen} and {Daphne Ippolito} and {D. Gilboa} and {David Dohan} and {D. Drakard} and {David Jurgens} and {Debajyoti Datta} and {Deep Ganguli} and {Denis Emelin} and {Denis Kleyko} and {Deniz Yuret} and {Derek Chen} and {Derek Tam} and {Dieuwke Hupkes} and {Diganta Misra} and {Dilyar Buzan} and {Dimitri Coelho Mollo} and {Diyi Yang} and {Dong-Ho Lee} and {Dylan Schrader} and {Ekaterina Shutova} and {E. D. Cubuk} and {Elad Segal} and {Eleanor Hagerman} and {Elizabeth Barnes} and {E. Donoway} and {Ellie Pavlick} and {Emanuele Rodolà} and {Emma Lam} and {Eric Chu} and {Eric Tang} and {Erkut Erdem} and {Ernie Chang} and {Ethan A. Chi} and {Ethan Dyer} and {E. Jerzak} and {Ethan Kim} and {Eunice Engefu Manyasi} and {Evgenii Zheltonozhskii} and {Fanyue Xia} and {F. Siar} and {Fernando Martínez-Plumed} and {Francesca Happé} and {François Chollet} and {Frieda Rong} and {Gaurav Mishra} and {Genta Indra Winata} and {Gerard de Melo} and {Germán Kruszewski} and {Giambattista Parascandolo} and {Giorgio Mariani} and {Gloria Xinyue Wang} and {Gonzalo Jaimovitch-López} and {Gregor Betz} and {Guy Gur-Ari} and {Hana Galijasevic} and {Hannah Kim} and {Hannah Rashkin} and {Hanna Hajishirzi} and {Harsh Mehta} and {H. Bogar} and {Henry Shevlin} and {Hinrich Schütze} and {H. Yakura} and {Hongming Zhang} and {Hugh Mee Wong} and {Ian Ng} and {Isaac Noble} and {Jaap Jumelet} and {Jack Geissinger} and {John Kernion} and {Jacob Hilton} and {Jaehoon Lee} and {J. Fisac} and {James B. Simon} and {James Koppel} and {James Zheng} and {James Zou} and {Jan Kocoń} and {Jana Thompson} and {Janelle Wingfield} and {Jared Kaplan} and {Jarema Radom} and {Jascha Narain Sohl-Dickstein} and {Jason Phang} and {Jason Wei} and {J. Yosinski} and {Jekaterina Novikova} and {Jelle Bosscher} and {Jennifer Marsh} and {Jeremy Kim} and {Jeroen Taal} and {Jesse Engel} and {Jesujoba Oluwadara Alabi} and {Jiacheng Xu} and {Jiaming Song} and {Jillian Tang} and {Jane W Waweru} and {John Burden} and {John Miller} and {John U. Balis} and {Jonathan Batchelder} and {Jonathan Berant} and {Jorg Frohberg} and {Jos Rozen} and {J. Hernández-Orallo} and {Joseph Boudeman} and {Joseph Guerr} and {Joseph Jones} and {Joshua B. Tenenbaum} and {Josh Rule} and {Joyce Chua} and {Kamil Kanclerz} and {Karen Livescu} and {Karl Krauth} and {Karthik Gopalakrishnan} and {Katerina Ignatyeva} and {K. Markert} and {Kaustubh D. Dhole} and {Kevin Gimpel} and {Kevin Omondi} and {K. Mathewson} and {Kristen Chiafullo} and {Ksenia Shkaruta} and {Kumar Shridhar} and {Kyle McDonell} and {Kyle Richardson} and {Laria Reynolds} and {Leo Gao} and {Li Zhang} and {Liam Dugan} and {Lianhui Qin} and {Lidia Contreras Ochando} and {Louis-Philippe Morency} and {Luca Moschella} and {Luca Lam} and {Lucy Noble} and {Ludwig Schmidt} and {Luheng He} and {Luis Oliveros Colón} and {Luke Metz} and {Lütfi Kerem Senel} and {Maarten Bosma} and {Maarten Sap} and {Maartje ter Hoeve} and {Maheen Farooqi} and {Manaal Faruqui} and {Mantas Mazeika} and {Marco Baturan} and {Marco Marelli} and {Marco Maru} and {M. J. Ramírez-Quintana} and {M. Tolkiehn} and {Mario Giulianelli} and {Martha Lewis} and {Martin Potthast} and {Matthew L. Leavitt} and {Matthias Hagen} and {M. Schubert} and {Medina Baitemirova} and {Melody Arnaud} and {M. McElrath} and {Michael A. Yee} and {Michael Cohen} and {Michael Gu} and {Michael Ivanitskiy} and {Michael Starritt} and {M. Strube} and {Michal Swedrowski} and {Michele Bevilacqua} and {Michihiro Yasunaga} and {Mihir Kale} and {Mike Cain} and {Mimee Xu} and {Mirac Suzgun} and {Mitch Walker} and {Mohit Tiwari} and {Mohit Bansal} and {Moin Aminnaseri} and {Mor Geva} and {Mozhdeh Gheini} and {T. MukundVarma} and {Nanyun Peng} and {Nathan A. Chi} and {Nayeon Lee} and {Neta Gur-Ari Krakover} and {Nicholas Cameron} and {Nicholas Roberts} and {Nick Doiron} and {Nicole Martinez} and {Nikita Nangia} and {Niklas Deckers} and {Niklas Muennighoff} and {N. Keskar} and {Niveditha Iyer} and {Noah Constant} and {Noah Fiedel} and {Nuan Wen} and {Oliver Zhang} and {Omar Agha} and {Omar Elbaghdadi} and {Omer Levy} and {Owain Evans} and {Pablo Antonio Moreno Casares} and {Parth Doshi} and {Pascale Fung} and {P. Liang} and {Paul Vicol} and {Pegah Alipoormolabashi} and {Peiyuan Liao} and {Percy Liang} and {Peter Chang} and {Peter Eckersley} and {Phu Mon Htut} and {P. Hwang} and {P. Milkowski} and {Piyush Patil} and {Pouya Pezeshkpour} and {Priti Oli} and {Qiaozhu Mei} and {Qing Lyu} and {Qinlang Chen} and {Rabin Banjade} and {Rachel Etta Rudolph} and {Raefer Gabriel} and {Rahel Habacker} and {Ramon Risco} and {Raphael Milliere} and {Rhythm Garg} and {Richard Barnes} and {R. Saurous} and {Riku Arakawa} and {Robbe Raymaekers} and {Robert Frank} and {Rohan Sikand} and {Roman Novak} and {Roman Sitelew} and {R. L. Bras} and {Rosanne Liu} and {Rowan Jacobs} and {Rui Zhang} and {Ruslan Salakhutdinov} and {Ryan Chi} and {Ryan Lee} and {Ryan Stovall} and {Ryan Teehan} and {Rylan Yang} and {Sahib Singh} and {Saif Mohammad} and {Sajant Anand} and {Sam Dillavou} and {Sam Shleifer} and {Samuel Wiseman} and {Samuel Gruetter} and {Samuel R. Bowman} and {S. Schoenholz} and {Sanghyun Han} and {Sanjeev Kwatra} and {Sarah A. Rous} and {Sarik Ghazarian} and {Sayan Ghosh} and {Sean Casey} and {Sebastian Bischoff} and {Sebastian Gehrmann} and {Sebastian Schuster} and {Sepideh Sadeghi} and {Shadi S. Hamdan} and {Sharon Zhou} and {Shashank Srivastava} and {Sherry Shi} and {Shikhar Singh} and {Shima Asaadi} and {S. Gu} and {Shubh Pachchigar} and {Shubham Toshniwal} and {Shyam Upadhyay} and {Shyamolima Debnath} and {Siamak Shakeri} and {Simon Thormeyer} and {S. Melzi} and {Siva Reddy} and {S. Makini} and {Soo-Hwan Lee} and {Spencer Bradley Torene} and {Sriharsha Hatwar} and {S. Dehaene} and {Stefan Divic} and {Stefano Ermon} and {Stella Biderman} and {Stephanie Lin} and {Stephen Prasad} and {Steven T Piantadosi} and {Stuart M. Shieber} and {Summer Misherghi} and {S. Kiritchenko} and {Swaroop Mishra} and {Tal Linzen} and {Tal Schuster} and {Tao Li} and {Tao Yu} and {Tariq Ali} and {Tatsunori Hashimoto} and {Te-Lin Wu} and {T. Desbordes} and {Theodore Rothschild} and {Thomas Phan} and {Tianle Wang} and {Tiberius Nkinyili} and {Timo Schick} and {T. Kornev} and {T. Tunduny} and {Tobias Gerstenberg} and {T. Chang} and {Trishala Neeraj} and {Tushar Khot} and {Tyler Shultz} and {Uri Shaham} and {Vedant Misra} and {Vera Demberg} and {Victoria Nyamai} and {Vikas Raunak} and {V. Ramasesh} and {Vinay Uday Prabhu} and {Vishakh Padmakumar} and {Vivek Srikumar} and {W. Fedus} and {William Saunders} and {William Zhang} and {Wout Vossen} and {Xiang Ren} and {Xiaoyu Tong} and {Xinran Zhao} and {Xinyi Wu} and {Xudong Shen} and {Yadollah Yaghoobzadeh} and {Yair Lakretz} and {Yangqiu Song} and {Yasaman Bahri} and {Yejin Choi} and {Yichi Yang} and {Yiding Hao} and {Yifu Chen} and {Yonatan Belinkov} and {Yufang Hou} and {Yufang Hou} and {Yuntao Bai} and {Zachary Seid} and {Zhuoye Zhao} and {Zijian Wang} and {Zijie J. Wang} and {Zirui Wang} and {Ziyi Wu}},
year = 2023,
booktitle = {Trans. Mach. Learn. Res.},
url = {https://www.semanticscholar.org/paper/9dfe937f405b95bfc5e8e3679329a1f16b37e276},
}
@inproceedings{262070652,
title = {Efficient Approximate Predictive Inference Under Feedback Covariate Shift with Influence Functions},
author = {{Drew Prinster} and {S. Saria} and {Anqi Liu}},
year = 2023,
booktitle = {International Symposium on Conformal and Probabilistic Prediction with Applications},
url = {https://www.semanticscholar.org/paper/ea62b78ec46e7ca0ad4dd5337cd87bb27ab0ec06},
}
@inproceedings{258535938,
title = {Building Keyword Search System from End-To-End Asr Systems},
author = {{Ruizhe Huang} and {Matthew Wiesner} and {Leibny Paola García-Perera} and {Daniel Povey} and {J. Trmal} and {S. Khudanpur}},
year = 2023,
month = {6},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/1b610ce986449cbef77d0f6bdd28421fd8495268},
}
@inproceedings{258074434,
title = {Retinomorphic Channel Design and Considerations},
author = {{Jonah P. Sengupta} and {A. Andreou}},
year = 2023,
month = {3},
booktitle = {Annual Conference on Information Sciences and Systems},
url = {https://www.semanticscholar.org/paper/7f97effeed913a6089ca98d576d585401e251f9b},
}
@inproceedings{258967838,
title = {MERLIon CCS Challenge: A English-Mandarin code-switching child-directed speech corpus for language identification and diarization},
author = {{Victoria Y. H. Chua} and {Hexin Liu} and {Leibny Paola García Perera} and {Fei Ting Woon} and {Jinyi Wong} and {Xiangyu Zhang} and {S. Khudanpur} and {Andy W. H. Khong} and {J. Dauwels} and {S. Styles}},
year = 2023,
month = {5},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/ea701359c6e2b2ba5c36c4849d4144d318171418},
}
@inproceedings{261048725,
title = {3D-Aware Neural Body Fitting for Occlusion Robust 3D Human Pose Estimation},
author = {{Yi Zhang} and {Pengliang Ji} and {Angtian Wang} and {Jieru Mei} and {Adam Kortylewski} and {A. Yuille}},
year = 2023,
month = {8},
booktitle = {IEEE International Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/8a46058e5353ae5cc66dd8fc67e635aaad3a5f17},
}
@inproceedings{254853589,
title = {Reference free auscultation quality metric and its trends},
author = {{A. Kala} and {Eric D. McCollum} and {Mounya Elhilali}},
year = 2023,
month = {8},
booktitle = {Biomedical Signal Processing and Control},
url = {https://www.semanticscholar.org/paper/4276e26be8c196ba4b496b4a0acc4102d32c0bd8},
}
@inproceedings{257804958,
title = {Mask-Free OVIS: Open-Vocabulary Instance Segmentation without Manual Mask Annotations},
author = {{VS Vibashan} and {Ning Yu} and {Chen Xing} and {Can Qin} and {Mingfei Gao} and {Juan Carlos Niebles} and {Vishal M. Patel} and {Ran Xu}},
year = 2023,
month = {3},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/7aa528b8732033cfb7a6d130bb321723a4e49700},
}
@inproceedings{256604402,
title = {Adaptation in the sensory cortex drives bistable switching during auditory stream segregation},
author = {{Nathan C Higgins} and {Alexandra N. Scurry} and {Fang Jiang} and {David F. Little} and {Claude Alain} and {Mounya Elhilali} and {J. Snyder}},
year = 2023,
month = {1},
booktitle = {Neuroscience of Consciousness},
url = {https://www.semanticscholar.org/paper/c1c4a48270174de06f609bb2dc98c8e896ce78a3},
}
@inproceedings{260202959,
title = {Distillation-guided Representation Learning for Unconstrained Gait Recognition},
author = {{Yuxiang Guo} and {Cheng-Fang Peng} and {R. Prabhakar} and {Chun Pong Lau} and {R. Chellappa}},
year = 2023,
month = {7},
booktitle = {2024 IEEE International Joint Conference on Biometrics (IJCB)},
url = {https://www.semanticscholar.org/paper/5d66c8c86d4ecc2b4ee38f2aa98a470e1e6ea48f},
}
@inproceedings{262466051,
title = {SCREWS: A Modular Framework for Reasoning with Revisions},
author = {{K. Shridhar} and {Harsh Jhamtani} and {Hao Fang} and {Benjamin Van Durme} and {Jason Eisner} and {Patrick Xia}},
year = 2023,
month = {9},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/5d5dbba58aaf5b3fa4044cc3ffc71a3fe2b8c654},
}
@inproceedings{248397783,
title = {Conference on Health, Inference, and Learning, CHIL 2023, Broad Institute of MIT and Harvard (Merkin Building), 415 Main Street, Cambridge, MA, USA},
author = {{Gerardo Flores} and {George H. Chen} and {T. Pollard} and {Ayah Zirikly} and {Michael C. Hughes} and {Tasmie Sarker} and {Joyce Ho} and {Tristan Naumann}},
year = 2023,
booktitle = {ACM Conference on Health, Inference, and Learning},
url = {https://www.semanticscholar.org/paper/1cfe0feed33d2452f951afa7304d017131dc4520},
}
@inproceedings{258865888,
title = {InteractiveIE: Towards Assessing the Strength of Human-AI Collaboration in Improving the Performance of Information Extraction},
author = {{Ishani Mondal} and {Michelle Yuan} and {N. Anandhavelu} and {Aparna Garimella} and {Francis Ferraro} and {Andrew Blair-Stanek} and {Benjamin Van Durme} and {Jordan L. Boyd-Graber}},
year = 2023,
month = {5},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/21e0a1324522b39e5cec94885501e906942c43d0},
}
@inproceedings{258309151,
title = {Escaping the sentence-level paradigm in machine translation},
author = {{Matt Post} and {Marcin Junczys-Dowmunt}},
year = 2023,
month = {4},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/59e2cfbb1395a4a02e9efecadd4f4005af462c1b},
}
@inproceedings{259436318,
title = {The unsung hero: how synthetic data has helped computer vision, machine learning, and AI},
author = {{R. Chellappa}},
year = 2023,
month = {6},
booktitle = {Synthetic Data for Artificial Intelligence and Machine Learning: Tools, Techniques, and Applications},
url = {https://www.semanticscholar.org/paper/c061dd875146aa8d87b5bfe45eea73df8da3c373},
}
@inproceedings{256826996,
title = {Can GPT-3 Perform Statutory Reasoning?},
author = {{Andrew Blair-Stanek} and {Nils Holzenberger} and {Benjamin Van Durme}},
year = 2023,
month = {2},
booktitle = {International Conference on Artificial Intelligence and Law},
url = {https://www.semanticscholar.org/paper/5f5253fb15ac382e96ade0335baf1cfaa240fb1d},
}
@inproceedings{258887517,
title = {Robust Category-Level 3D Pose Estimation from Synthetic Data},
author = {{Jiahao Yang} and {Wufei Ma} and {Angtian Wang} and {Xiaoding Yuan} and {A. Yuille} and {Adam Kortylewski}},
year = 2023,
month = {5},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/55aa226650e6eeed51e181195b7b7a9b87102bc5},
}
@inproceedings{256353599,
title = {A Multi-Modal Array of Interpretable Features to Evaluate Language and Speech Patterns in Different Neurological Disorders},
author = {{A. Favaro} and {C. Motley} and {Tianyu Cao} and {Miguel Iglesias} and {A. Butala} and {E. Oh} and {R. Stevens} and {J. Villalba} and {N. Dehak} and {L. Moro-Velázquez}},
year = 2023,
month = {1},
booktitle = {Spoken Language Technology Workshop},
url = {https://www.semanticscholar.org/paper/40eb935374d67b7b9979e0c9333c291d188c472b},
}
@inproceedings{260681299,
title = {Early Detection and Localization of Pancreatic Cancer by Label-Free Tumor Synthesis},
author = {{Bowen Li} and {Yu-Cheng Chou} and {Shuwen Sun} and {Hualin Qiao} and {A. Yuille} and {Zongwei Zhou}},
year = 2023,
month = {8},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/d556aaf4ac55b6cebb9b889ec7b89b086cb41bff},
}
@inproceedings{258236142,
title = {OOD-CV-v2 : An Extended Benchmark for Robustness to Out-of-Distribution Shifts of Individual Nuisances in Natural Images},
author = {{Bingchen Zhao} and {Jiahao Wang} and {Wufei Ma} and {Artur Jesslen} and {Si-Jia Yang} and {Shaozuo Yu} and {O. Zendel} and {C. Theobalt} and {A. Yuille} and {Adam Kortylewski}},
year = 2023,
month = {4},
booktitle = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
url = {https://www.semanticscholar.org/paper/f5cd9b3f48e81e1a91923ef423765edeb9bdd50e},
}
@inproceedings{258766141,
title = {Clustering using Approximate Nearest Neighbour Oracles},
author = {{Enayat Ullah} and {Harry Lang} and {R. Arora} and {V. Braverman}},
year = 2023,
booktitle = {Trans. Mach. Learn. Res.},
url = {https://www.semanticscholar.org/paper/2e864475d80f551d97232f9a6cba079dd128c54d},
}
@inproceedings{265244446,
title = {Genre Classification of Books on Spanish},
author = {{J. Nolazco-Flores} and {Ana Verónica Guerrero-Galván} and {Carolina del-Valle-Soto} and {Leibny Paola García-Perera}},
year = 2023,
booktitle = {IEEE Access},
url = {https://www.semanticscholar.org/paper/0895c353c61f4ef6452ba892e4608d45742d455b},
}
@inproceedings{256356339,
title = {Vsameter: Evaluation of a New Open-Source Tool to Measure Vowel Space Area and Related Metrics},
author = {{Tianyu Cao} and {L. Moro-Velázquez} and {Piotr Żelasko} and {J. Villalba} and {N. Dehak}},
year = 2023,
month = {1},
booktitle = {Spoken Language Technology Workshop},
url = {https://www.semanticscholar.org/paper/dd3d00bf410d95d15569443387082da13a2462c4},
}
@inproceedings{257206027,
title = {Provably Efficient Neural Offline Reinforcement Learning via Perturbed Rewards},
author = {{Thanh Nguyen-Tang} and {R. Arora}},
year = 2023,
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/a8dac0d0837ac4800f4462a121c59a98a05531ee},
}
@inproceedings{258808787,
title = {Remote haemodynamic monitoring of pulmonary artery pressures in patients with chronic heart failure (MONITOR-HF): a randomised clinical trial},
author = {{J. Brugts} and {S. Radhoe} and {P. Clephas} and {Dilan Aydin} and {M. Gent} and {M. Szymanski} and {M. Rienstra} and {M. Heuvel} and {C. Fonseca} and {G. Linssen} and {C. Borleffs} and {E. Boersma} and {F. Asselbergs} and {A. Mosterd} and {H. Rocca} and {R. A. Boer} and {M. Emans} and {S. Beeres} and {L. Heerebeek} and {C. Kirchhof} and {J. Ramshorst} and {R. Spee} and {T. Smilde} and {M. V. Eck} and {E. Kaplan} and {R. Hazeleger} and {R. Tukkie} and {M. Feenema} and {W. Kok} and {V. V. Halm} and {M. L. Handoko} and {R. Kimmenade} and {Matt Post} and {N. V. Mieghem} and {O. Manintveld}},
year = 2023,
month = {5},
booktitle = {The Lancet},
url = {https://www.semanticscholar.org/paper/80da514a8c411b22bd786a69f3ca62ae1d323ff1},
}
@inproceedings{258999203,
title = {Discovering Failure Modes of Text-guided Diffusion Models via Adversarial Search},
author = {{Qihao Liu} and {Adam Kortylewski} and {Yutong Bai} and {Song Bai} and {A. Yuille}},
year = 2023,
month = {6},
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/b469d5e906eee4f682726fb8b7f899fd96bcd8a3},
}
@inproceedings{258444556,
title = {Evaluation of a Novel Digital Stethoscope Prototype in a Low-resource Setting: Expert Listening Panel Agreement With Conventional Auscultation in Hospitalized Malawian Children With Severe Pneumonia},
author = {{Z. Smith} and {N. Hoekstra} and {T. Mvalo} and {I. McLane} and {A. Kala} and {M. Chiume} and {C. Verwey} and {D. Olson} and {C. Buck} and {J. Mulindwa} and {E. Fitzgerald} and {M. Chagomerana} and {Mounya Elhilali} and {M. Hosseinipour} and {E. McCollum}},
year = 2023,
month = {5},
booktitle = {C25. OPPORTUNITIES AND ADVANCES IN PEDIATRIC GLOBAL HEALTH},
url = {https://www.semanticscholar.org/paper/00ff74d263d80498ea78cca8850c565b66057476},
}
@inproceedings{257805227,
title = {Did You Mean...? Confidence-based Trade-offs in Semantic Parsing},
author = {{Elias Stengel-Eskin} and {Benjamin Van Durme}},
year = 2023,
month = {3},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/695a24f4bd79293d7c4dc41ce3f86c66d601f930},
}
@inproceedings{258865176,
title = {NOVUM: Neural Object Volumes for Robust Object Classification},
author = {{Artur Jesslen} and {Guofeng Zhang} and {Angtian Wang} and {Wufei Ma} and {A. Yuille} and {Adam Kortylewski}},
year = 2023,
month = {5},
booktitle = {European Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/7f6b686b1a9ae3983dd4facfb23038d49f16dcc4},
}
@inproceedings{259164709,
title = {Generating Images with 3D Annotations Using Diffusion Models},
author = {{Wufei Ma} and {Qihao Liu} and {Jiahao Wang} and {Angtian Wang} and {Yaoyao Liu} and {Adam Kortylewski} and {A. Yuille}},
year = 2023,
month = {6},
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/1036f39069a1fe3d5f818f1d7bc07286ad3f1363},
}
@inproceedings{259267429,
title = {What are Adapters Really Efficient At?},
author = {{Alexis Conneau} and {Kartikay Khandelwal} and {Naman Goyal} and {Mitesh M. Khapra} and {Pratyush Kumar} and {V. Rudra} and {Murthy Anoop} and {Kunchukuttan. 2022} and {Naama-677} and {Adam Roberts} and {Stella Biderman} and {Teven Le Scao} and {Saiful Bari} and {Sheng Shen} and {Zheng-Xin Yong} and {Hai-682 ley Schoelkopf} and {Xiangru Tang} and {Dragomir R. Radev} and {Al-683 ham} and {Fikri Aji} and {Khalid Almubarak} and {Samuel Albanie} and {Zaid Alyafeai} and {Albert Webson} and {Edward Raff} and {Jonas Pfeiffer} and {Aishwarya Kamath} and {Andreas Rücklé} and {Kyunghyun Cho} and {Iryna Gurevych} and {Clifton Poth} and {Aishwarya} and {Ivan Kamath} and {Sebastian Vuli´c} and {Kyunghyun Ruder} and {Gregor Geigle} and {Max Glockner} and {Jonas Beck} and {Nils Pfeiffer} and {Reimers Iryna} and {Victor Sanh} and {Colin Raffel} and {Lintang Bach} and {Zaid Sutawika} and {Antoine Alyafeai} and {Arnaud Chaffin} and {Arun Stiegler} and {Manan Raja} and {Dey Saiful} and {Canwen Bari} and {Urmish Xu} and {Thakker} and {Shanya Sharma} and {Eliza Szczechla} and {Taewoon} and {Gunjan Kim} and {Nihal Chhablani} and {Nayak} and {Debajyoti} and {Jonathan Datta} and {Mike Tian-Jian Chang} and {Han Jiang} and {Matteo Wang} and {S. Mânica} and {Zheng Xin Shen} and {Yong} and {Harshit Pandey} and {Rachel Bawden} and {Thomas Wang} and {Tripathi Neeraj} and {Jos Rozen} and {Abheesht Sharma} and {A. Santilli} and {Thibault Févry} and {Jason Alan Fries} and {Maarten Sap} and {Hannah Rashkin} and {Derek Chen} and {Ronan} and {Aarohi Srivastava} and {Abhinav Rastogi} and {Abhishek Rao} and {Adam R. Brown} and {Adam Santoro} and {Adrià Gupta} and {Agnieszka Garriga-Alonso} and {Kluska} and {Aitor Lewkowycz} and {Akshat Agarwal} and {Alethea Power} and {Alex Ray} and {Alex Warstadt} and {Alexander W. Kocurek} and {Ali Safaya} and {Ali Tazarv} and {Alice Xiang} and {Alicia Par-765} and {Allen Nie} and {Aman Hussain} and {Amanda Askell} and {Anantharaman S. Iyer} and {Anders Andreassen} and {Andrea Madotto} and {A. Santilli} and {Andreas Stuhlmüller} and {Andrew M. Dai} and {Andrew La} and {Andrew K. Lampinen} and {Angela Zou} and {Angela Jiang} and {Anh Chen} and {Vuong} and {Animesh Gupta} and {Anna Gottardi} and {Antonio Norelli} and {Anu Venkatesh} and {Arash Gholamidavoodi} and {Arfa Tabas-773} and {Arul Menezes} and {Arun Kirubarajan} and {Asher Mul-774} and {Ashish lokandov} and {Austin Sabharwal} and {Herrick} and {Avia} and {A. Efrat} and {Ayla Erdem} and {B. Karaka¸s} and {Ryan Roberts} and {B. S. Loe} and {Barret Zoph} and {Bartlomiej Bojanowski} and {Batuhan Özyurt} and {Behnam Hedayatnia} and {Behnam} and {Benjamin Neyshabur} and {Benno Inden} and {Berk Stein} and {Ek-779 mekci} and {Bill Yuchen} and {B. Lin} and {Cameron Howald} and {Cameron Diao} and {Catherine Dour} and {Cedrick Stinson} and {Ar-781 César} and {Chandan Ferri Ramírez} and {Charles Singh} and {Christopher D. Manning} and {Christopher Potts} and {Cindy Ramirez} and {Clara E. Rivera} and {Clemencia Siro} and {Colin Raf-786} and {Courtney Ashcraft} and {Cristina Garbacea} and {Dan Sileo} and {Daniel H Garrette} and {Dan Hendrycks} and {Kilman} and {Dan Roth} and {Daniel Freeman} and {Daniel Khashabi} and {Daniel Levy} and {Daniel Moseguí González} and {Perszyk} and {Danny Hernandez} and {Danqi Chen} and {Daphne Ippolito} and {D. Gilboa} and {David Dohan} and {D. Drakard} and {David Ju-792} and {Debajyoti Datta} and {Deep Ganguli} and {Denis Emelin} and {Denis Kleyko} and {Deniz Yuret} and {Derek Tam} and {mán Kruszewski} and {Giambattista Parascandolo} and {Giorgio Mariani} and {Gloria Wang} and {Gonzalo Jaimovitch-807 López} and {Gregor Betz} and {Guy Gur-Ari} and {Hana Galijase-808 vic} and {Hannah Kim} and {Harsh Mehta} and {H. Bogar} and {Henry Shevlin} and {Hinrich Schütze} and {H. Yakura} and {Hongming Zhang} and {Hugh Mee Wong} and {Ian Ng} and {Isaac Noble} and {Jaap Jumelet} and {Jack Geissinger} and {John Kernion} and {Jacob Hilton} and {Jae-813 hoon Lee} and {J. Fisac} and {James B. Simon} and {James Koppel} and {James Zheng} and {James Zou} and {Jan Ko-815 co´n} and {Jana Thompson} and {Jared Kaplan} and {Jarema Radom} and {Joyce Chua} and {Kamil Kanclerz} and {Karen Livescu} and {Karl Krauth} and {Karthik Gopalakrishnan} and {Katerina Ignatyeva} and {K. Markert} and {Kaustubh D. Dhole} and {Kevin Gim-827 pel} and {Kevin Omondi} and {K. Mathewson} and {Kristen Chi-828 afullo} and {Ksenia Shkaruta} and {Kumar Shridhar} and {Kyle Mc-829 Donell} and {Kyle Richardson} and {Laria Reynolds} and {Leo Gao} and {Li Zhang} and {Liam Dugan} and {Lianhui Qin} and {Lidia Contreras Ochando} and {Louis-Philippe Morency} and {Luca Moschella} and {Maarten ¸Senel} and {Maarten Bosma} and {Manaal Farooqi} and {Mantas Faruqui} and {Marco Mazeika} and {Marco Baturan} and {Marco Marelli} and {Maria Jose Maru} and {Marie Ramírez Quintana} and {Tolkiehn Mario} and {Martha Giulianelli} and {Martin Lewis} and {L. PotthastMatthew} and {Matthew L. Leavitt} and {Mátyás Schu-840 bert Hagen} and {Medina Orduna} and {Melody Baitemirova} and {Arnaud Melvin} and {Michael A McElrath} and {Michael A. Yee} and {Michael Co-842 hen} and {Michael Gu} and {Michael Ivanitskiy} and {Michael Star-843 ritt} and {M. Strube} and {Michele Sw˛edrowski} and {Michihiro Bevilacqua} and {Mihir Yasunaga} and {Mike Kale} and {Mimee Cain} and {Mirac Xu} and {Mo Suzgun} and {Monica Tiwari} and {Moin Bansal} and {Mor Aminnaseri} and {Mozhdeh Geva} and {Mukund Gheini} and {T. Varma} and {Nanyun Peng} and {tish Shirish Keskar} and {Niveditha Iyer} and {Noah Fiedel} and {Nuan Wen} and {Oliver Zhang} and {Omar Agha} and {Omar Elbaghdadi} and {Omer Levy} and {Owain Evans} and {Pablo Antonio} and {Moreno Casares} and {Parth Doshi} and {Jason Wei} and {Maarten Bosma} and {Vincent Y. Zhao} and {Adams Wei Guu} and {Brian Yu} and {Nan Lester} and {An-921 Du} and {M. Dai} and {Quoc V. Le} and {Finetuned} and {Adina Williams} and {Nikita Nangia} and {Samuel R. Bowman} and {Thomas Wolf} and {Lysandre Debut} and {Clement Chaumond} and {Anthony Delangue} and {Pier-339 Moi} and {Tim ric Cistac} and {Rémi Rault} and {Morgan Louf} and {Funtow-900 Joe} and {Sam Davison} and {Patrick Shleifer} and {V. Platen} and {Clara Ma} and {Yacine Jernite} and {J. Plu} and {Canwen Xu} and {Sylvain Gugger} and {Mariama Drame} and {Yinfei Yang} and {Yuan Zhang} and {Chris Tar} and {Hailey Schoelkopf} and {Niklas Muen-954} and {Alham Fikri} and {D. Adelani} and {M. Saiful Bari} and {Lintang Sutawika} and {Zhihan Zhang} and {Wenhao Yu} and {Mengxia Yu} and {Zhichun Guo} and {Jonathan May}},
year = 2023,
booktitle = {},
url = {https://www.semanticscholar.org/paper/6ce31ab55c3cad599b91e1a36c5e2928d31e3986},
}
@inproceedings{259923580,
title = {MULTIMEDIA CURRICULUM LEARNING FOR LANGUAGE ACQUISITION},
author = {{Pengfei Yu} and {Heng Ji} and {Shih-Fu Chang} and {Kevin Duh}},
year = 2023,
booktitle = {},
url = {https://www.semanticscholar.org/paper/7c7d8f106f8cd1bdadfd3b46f6ebb1509cb1be42},
}
@inproceedings{258060050,
title = {MOST: Multiple Object localization with Self-supervised Transformers for object discovery},
author = {{Sai Saketh Rambhatla} and {Ishan Misra} and {R. Chellappa} and {Abhinav Shrivastava}},
year = 2023,
month = {4},
booktitle = {IEEE International Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/3be837073f08eecc01e1bc742c541c5f0e644946},
}
@inproceedings{258615767,
title = {Analyzing Bias in Diffusion-based Face Generation Models},
author = {{Malsha V. Perera} and {Vishal M. Patel}},
year = 2023,
month = {5},
booktitle = {2023 IEEE International Joint Conference on Biometrics (IJCB)},
url = {https://www.semanticscholar.org/paper/94831cbd104369092b08f3711e6ac95c5f5f2c7b},
}
@inproceedings{257495961,
title = {PoseExaminer: Automated Testing of Out-of-Distribution Robustness in Human Pose and Shape Estimation},
author = {{Qihao Liu} and {Adam Kortylewski} and {A. Yuille}},
year = 2023,
month = {3},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/85fcce7ef6f5eec2d5e5bce82fc7246e8a90696c},
}
@inproceedings{263152687,
title = {Enhancing End-to-End Conversational Speech Translation Through Target Language Context Utilization},
author = {{A. Hussein} and {Brian Yan} and {Antonios Anastasopoulos} and {Shinji Watanabe} and {S. Khudanpur}},
year = 2023,
month = {9},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/c2745e86ecc9bec372690cced53ccfdf44f407f8},
}
@inproceedings{261076475,
title = {Animal3D: A Comprehensive Dataset of 3D Animal Pose and Shape},
author = {{Jiacong Xu} and {Yi Zhang} and {Jia-Xiong Peng} and {Wufei Ma} and {Artur Jesslen} and {Pengliang Ji} and {Qixing Hu} and {Jiehua Zhang} and {Qihao Liu} and {Jiahao Wang} and {Wei Ji} and {Chen Wang} and {Xiaoding Yuan} and {Prakhar Kaushik} and {Guofeng Zhang} and {Jie Liu} and {Yushan Xie} and {Yawen Cui} and {A. Yuille} and {Adam Kortylewski}},
year = 2023,
month = {8},
booktitle = {IEEE International Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/cf6f0b77e006083e74d5f08bae59bd207d0e4ac6},
}
@inproceedings{259129355,
title = {Developing Speech Processing Pipelines for Police Accountability},
author = {{Anjalie Field} and {Prateek Verma} and {Nay San} and {J. Eberhardt} and {Dan Jurafsky}},
year = 2023,
month = {6},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/38c2e4e54a50ea5027c7a06ab325c22ece7b6c40},
}
@inproceedings{255669634,
title = {BNET: Batch Normalization With Enhanced Linear Transformation},
author = {{Yuhui Xu} and {Lingxi Xie} and {Cihang Xie} and {Wenrui Dai} and {Jieru Mei} and {Siyuan Qiao} and {Wei Shen} and {H. Xiong} and {A. Yuille}},
year = 2023,
month = {1},
booktitle = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
url = {https://www.semanticscholar.org/paper/edcf374466f791118acf3bbd8430d4fd73e4ea79},
}
@inproceedings{259202526,
title = {SURT 2.0: Advances in Transducer-Based Multi-Talker Speech Recognition},
author = {{Desh Raj} and {Daniel Povey} and {S. Khudanpur}},
year = 2023,
month = {6},
booktitle = {IEEE/ACM Transactions on Audio Speech and Language Processing},
url = {https://www.semanticscholar.org/paper/a6fffd418fabef307cba5e70324a3ba89c7ffc39},
}
@inproceedings{258987867,
title = {Examining risks of racial biases in NLP tools for child protective services},
author = {{Anjalie Field} and {Amanda Coston} and {Nupoor Gandhi} and {A. Chouldechova} and {Emily Putnam-Hornstein} and {David Steier} and {Yulia Tsvetkov}},
year = 2023,
month = {5},
booktitle = {Conference on Fairness, Accountability and Transparency},
url = {https://www.semanticscholar.org/paper/346e4f35a5a81ef893792133ec1fec18f23c1768},
}
@inproceedings{261682358,
title = {Leveraging Pretrained Image-text Models for Improving Audio-Visual Learning},
author = {{Saurabhchand Bhati} and {J. Villalba} and {L. Moro-Velázquez} and {Thomas Thebaud} and {N. Dehak}},
year = 2023,
month = {9},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/ada7b279876196a283a8379729212338386c7eba},
}
@inproceedings{257766699,
title = {Spatio-Temporal Pixel-Level Contrastive Learning-based Source-Free Domain Adaptation for Video Semantic Segmentation},
author = {{Shao-Yuan Lo} and {Poojan Oza} and {Sumanth Chennupati} and {Alejandro Galindo} and {Vishal M. Patel}},
year = 2023,
month = {3},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/47cd9158e970329355a575ed992d4452ac498784},
}
@inproceedings{257833842,
title = {BloombergGPT: A Large Language Model for Finance},
author = {{Shijie Wu} and {Ozan Irsoy} and {Steven Lu} and {Vadim Dabravolski} and {Mark Dredze} and {Sebastian Gehrmann} and {P. Kambadur} and {D. Rosenberg} and {Gideon Mann}},
year = 2023,
month = {3},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/83edcfbb206ddad38a971d605da09390604248ea},
}
@inproceedings{260091661,
title = {From Adaptive Query Release to Machine Unlearning},
author = {{Enayat Ullah} and {R. Arora}},
year = 2023,
month = {7},
booktitle = {International Conference on Machine Learning},
url = {https://www.semanticscholar.org/paper/ea3eff68041f3a22b984578e8da8533aa3f766de},
}
@inproceedings{260914548,
title = {Do Phonatory Features Display Robustness to Characterize Parkinsonian Speech Across Corpora?},
author = {{A. Favaro} and {Tianyu Cao} and {Thomas Thebaud} and {J. Villalba} and {A. Butala} and {N. Dehak} and {L. Moro-Velázquez}},
year = 2023,
month = {8},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/562d06b0cddb553a76e6b68f6f2ba470a17bb5d4},
}
@inproceedings{257632366,
title = {CLIP goes 3D: Leveraging Prompt Tuning for Language Grounded 3D Recognition},
author = {{Deepti Hegde} and {Jeya Maria Jose Valanarasu} and {Vishal M. Patel}},
year = 2023,
month = {3},
booktitle = {2023 IEEE/CVF International Conference on Computer Vision Workshops (ICCVW)},
url = {https://www.semanticscholar.org/paper/b460a263abec8b1aaa039963be9b371a581e7b21},
}
@inproceedings{258841086,
title = {Condensing Multilingual Knowledge with Lightweight Language-Specific Modules},
author = {{Haoran Xu} and {Weiting Tan} and {Shuyue Stella Li} and {Yunmo Chen} and {Benjamin Van Durme} and {Philipp Koehn} and {Kenton Murray}},
year = 2023,
month = {5},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/cf99558d35891d35ba5429cfce5ca2e2ae383b71},
}
@inproceedings{259361037,
title = {MultiVENT: Multilingual Videos of Events with Aligned Natural Text},
author = {{Kate Sanders} and {David Etter} and {Reno Kriz} and {Benjamin Van Durme}},
year = 2023,
month = {7},
booktitle = {Neural Information Processing Systems},
url = {https://www.semanticscholar.org/paper/d6592cd383da0ebae9f4ff78a4df96ab635acfa2},
}
@inproceedings{258888240,
title = {Securing Deep Generative Models with Universal Adversarial Signature},
author = {{Yu Zeng} and {Mo Zhou} and {Yuan Xue} and {Vishal M. Patel}},
year = 2023,
month = {5},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/98e87cd4c19dad7018270b4561dc64b0109ee360},
}
@inproceedings{258959429,
title = {Why Does Zero-Shot Cross-Lingual Generation Fail? An Explanation and a Solution},
author = {{Tianjian Li} and {Kenton Murray}},
year = 2023,
month = {5},
booktitle = {Annual Meeting of the Association for Computational Linguistics},
url = {https://www.semanticscholar.org/paper/aa933e27c470eeecbe7bbec5debdd8c5d2faa4be},
}
@inproceedings{263310495,
title = {Enhancing Code-Switching Speech Recognition With Interactive Language Biases},
author = {{Hexin Liu} and {Leibny Paola García} and {Xiangyu Zhang} and {Andy W. H. Khong} and {S. Khudanpur}},
year = 2023,
month = {9},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/47c14df80f649488c64f5659fa49ad356ff59470},
}
@inproceedings{258762744,
title = {Flatness-Aware Prompt Selection Improves Accuracy and Sample Efficiency},
author = {{Lingfeng Shen} and {Weiting Tan} and {Boyuan Zheng} and {Daniel Khashabi}},
year = 2023,
month = {5},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/b8ba16a107621f760e7830ddaab8c3d5c5ff06b0},
}
@inproceedings{258766137,
title = {Generalization bounds for Kernel Canonical Correlation Analysis},
author = {{Enayat Ullah} and {R. Arora}},
year = 2023,
booktitle = {Trans. Mach. Learn. Res.},
url = {https://www.semanticscholar.org/paper/4a55079d0145870461cbe2a48f53e40e64b7db3d},
}
@inproceedings{259840157,
title = {Multispectral Video Semantic Segmentation: A Benchmark Dataset and Baseline},
author = {{Wei Ji} and {Jingjing Li} and {Cheng Bian} and {Zongwei Zhou} and {Jiaying Zhao} and {A. Yuille} and {Li Cheng}},
year = 2023,
month = {6},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/fa0215c456d1957e131e43702e50e4c8f3e9477d},
}
@inproceedings{258999294,
title = {Zero and Few-shot Semantic Parsing with Ambiguous Inputs},
author = {{Elias Stengel-Eskin} and {Kyle Rawlins} and {Benjamin Van Durme}},
year = 2023,
month = {6},
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/b8e49068441a43aaf039527c6063a033368dd357},
}
@inproceedings{257698009,
title = {Biomonitoring and precision health in deep space supported by artificial intelligence},
author = {{Ryan T. Scott} and {Lauren M. Sanders} and {E. Antonsen} and {Jaden J. A. Hastings} and {Seung-min Park} and {Graham Mackintosh} and {R. Reynolds} and {A. Hoarfrost} and {A. Sawyer} and {Casey S. Greene} and {Benjamin S. Glicksberg} and {C. Theriot} and {D. Berrios} and {Jack Miller} and {Joel Babdor} and {Richard Barker} and {S. Baranzini} and {Afshin Beheshti} and {Stuart Chalk} and {Guillermo M. Delgado-Aparicio} and {Melissa Haendel} and {Arif A. Hamid} and {P. Heller} and {Daniel Jamieson} and {K. Jarvis} and {John Kalantari} and {Kia Khezeli} and {Svetlana V. Komarova} and {M. Komorowski} and {Prachi Kothiyal} and {A. Mahabal} and {U. Manor} and {Héctor García Martín} and {Christopher E. Mason} and {Mona Matar} and {G. Mias} and {J. Myers} and {Charlotte A. Nelson} and {Jonathan Oribello} and {P. Parsons-Wingerter} and {R. K. Prabhu} and {A. Qutub} and {J. Rask} and {Amanda M. Saravia-Butler} and {S. Saria} and {N. Singh} and {M. Snyder} and {Frank Soboczenski} and {Karthik Soman} and {David Van Valen} and {K. Venkateswaran} and {L. Warren} and {Liz Worthey} and {Jason H. Yang} and {M. Zitnik} and {S. Costes}},
year = 2023,
month = {3},
booktitle = {Nature Machine Intelligence},
url = {https://www.semanticscholar.org/paper/275a42c374d6381406a5da16dfa52fa939817a15},
}
@inproceedings{258999635,
title = {Neural Textured Deformable Meshes for Robust Analysis-by-Synthesis},
author = {{Angtian Wang} and {Wufei Ma} and {A. Yuille} and {Adam Kortylewski}},
year = 2023,
month = {5},
booktitle = {IEEE Workshop/Winter Conference on Applications of Computer Vision},
url = {https://www.semanticscholar.org/paper/7752104e311751cc786a677f050e2815281039f8},
}
@inproceedings{258714648,
title = {AbdomenAtlas-8K: Annotating 8, 000 CT Volumes for Multi-Organ Segmentation in Three Weeks},
author = {{Chongyu Qu} and {Tiezheng Zhang} and {Hualin Qiao} and {Jie Liu} and {Yucheng Tang} and {A. Yuille} and {Zongwei Zhou}},
year = 2023,
month = {5},
booktitle = {Neural Information Processing Systems},
url = {https://www.semanticscholar.org/paper/40927a6916f00f8e7ad43ad7009decb25a861767},
}
@inproceedings{259300311,
title = {JAWS-X: Addressing Efficiency Bottlenecks of Conformal Prediction Under Standard and Feedback Covariate Shift},
author = {{Drew Prinster} and {S. Saria} and {Anqi Liu}},
year = 2023,
booktitle = {International Conference on Machine Learning},
url = {https://www.semanticscholar.org/paper/6faf60347b9ec3672a4d191cfe9fe0076191e9a0},
}
@inproceedings{268499126,
title = {Do pretrained Transformers Really Learn In-context by Gradient Descent?},
author = {{Lingfeng Shen} and {Aayush Mishra} and {Daniel Khashabi}},
year = 2023,
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/a9d460f8eb9001b1bed11b7fb2af555185c70fcf},
}
@inproceedings{256389683,
title = {CancerUniT: Towards a Single Unified Model for Effective Detection, Segmentation, and Diagnosis of Eight Major Cancers Using a Large Collection of CT Scans},
author = {{Jieneng Chen} and {Yingda Xia} and {Jiawen Yao} and {K. Yan} and {Jianpeng Zhang} and {Le Lu} and {Fakai Wang} and {Bo Zhou} and {Mingyan Qiu} and {Qihang Yu} and {Ming Yuan} and {Wei Fang} and {Yuxing Tang} and {Minfeng Xu} and {Jian Zhou} and {Yuqian Zhao} and {Qifeng Wang} and {X. Ye} and {Xiaoli Yin} and {Yu Shi} and {Xin Chen} and {Jingren Zhou} and {A. Yuille} and {Zai-De Liu} and {Ling Zhang}},
year = 2023,
month = {1},
booktitle = {IEEE International Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/30be551bfce603f76ba526f047ec4e610b0c2376},
}
Social media has become an established platform for people to organize and take offline actions, often in the form of civil unrest. Understanding these events can help support pro-democratic movements. The primary method to detect these events on Twitter relies on aggregating many tweets, but this includes many that are not relevant to the task. We propose a multi-instance learning (MIL) approach, which jointly identifies relevant tweets and detects civil unrest events. We demonstrate that MIL improves civil unrest detection over methods based on simple aggregation. Our best model achieves a 0.73 F1 on the Global Civil Unrest on Twitter (G-CUT) dataset.
@inproceedings{delucia-etal-2023-multi,
title = "A Multi-instance Learning Approach to Civil Unrest Event Detection on {T}witter",
author = "DeLucia, Alexandra and
Dredze, Mark and
Buczak, Anna L.",
editor = {H{\"u}rriyeto{\u{g}}lu, Ali and
Tanev, Hristo and
Zavarella, Vanni and
Yeniterzi, Reyyan and
Y{\"o}r{\"u}k, Erdem and
Slavcheva, Milena},
booktitle = "Proceedings of the 6th Workshop on Challenges and Applications of Automated Extraction of Socio-political Events from Text",
month = sep,
year = "2023",
address = "Varna, Bulgaria",
publisher = "INCOMA Ltd., Shoumen, Bulgaria",
url = "https://aclanthology.org/2023.case-1.3",
pages = "18--33",
abstract = "Social media has become an established platform for people to organize and take offline actions, often in the form of civil unrest. Understanding these events can help support pro-democratic movements. The primary method to detect these events on Twitter relies on aggregating many tweets, but this includes many that are not relevant to the task. We propose a multi-instance learning (MIL) approach, which jointly identifies relevant tweets and detects civil unrest events. We demonstrate that MIL improves civil unrest detection over methods based on simple aggregation. Our best model achieves a 0.73 F1 on the Global Civil Unrest on Twitter (G-CUT) dataset.",
}
@inproceedings{260003158,
title = {A RISC-V Neuromorphic Micro-Controller Unit (vMCU) with Event-Based Physical Interface and Computational Memory for Low-Latency Machine Perception and Intelligence at the Edge},
author = {{Daniel R. Mendat} and {Jonah P. Sengupta} and {Gaspar Tognetti} and {M. Villemur} and {P. Pouliquen} and {Sergio Montano} and {Kayode A. Sanni} and {J. Molin} and {Nishant Zachariah} and {I. Doxas} and {A. Andreou}},
year = 2023,
month = {5},
booktitle = {International Symposium on Circuits and Systems},
url = {https://www.semanticscholar.org/paper/0d2f0f6eb40d3be7b97a19315439721cf7ae8469},
}
@inproceedings{259893511,
title = {Editorial Introduction to the Special Issue on Biometrics at a Distance in the Deep Learning Era},
author = {{M. Marín-Jiménez} and {Shiqi Yu} and {Yasushi Makihara} and {Vishal M. Patel} and {Maneet Singh} and {M. De Marsico}},
year = 2023,
month = {5},
booktitle = {IEEE Journal on Selected Topics in Signal Processing},
url = {https://www.semanticscholar.org/paper/df958104e921170b592e27798e18de9b9c892cbd},
}
@inproceedings{260334568,
title = {Disruptive Autoencoders: Leveraging Low-level features for 3D Medical Image Pre-training},
author = {{Jeya Maria Jose Valanarasu} and {Yucheng Tang} and {Dong Yang} and {Ziyue Xu} and {Can Zhao} and {Wenqi Li} and {Vishal M. Patel} and {Bennett A. Landman} and {Daguang Xu} and {Yufan He} and {V. Nath}},
year = 2023,
month = {7},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/21510551199cc8ebfba5252575133de607448fa9},
}
@inproceedings{259145290,
title = {Compositor: Bottom-Up Clustering and Compositing for Robust Part and Object Segmentation},
author = {{Ju He} and {Jieneng Chen} and {Ming-Xian Lin} and {Qihang Yu} and {A. Yuille}},
year = 2023,
month = {6},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/c49666de550031cd63514dacc74b5c4a632da6a6},
}
@inproceedings{261065732,
title = {Crosslingual Handwritten Text Generation Using GANs},
author = {{Chun-Chieh Chang} and {Leibny Paola García-Perera} and {S. Khudanpur}},
year = 2023,
booktitle = {ICDAR Workshops},
url = {https://www.semanticscholar.org/paper/48abc94b0eaf32dac2573dc5cdbe5dcfa897b7f0},
}
@inproceedings{257766789,
title = {Label-Free Liver Tumor Segmentation},
author = {{Qixing Hu} and {Yixiong Chen} and {Junfei Xiao} and {Shuwen Sun} and {Jieneng Chen} and {A. Yuille} and {Zongwei Zhou}},
year = 2023,
month = {3},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/74fc777becc43b9e94c2fb59ed3ee78d212ca01e},
}
@inproceedings{258383693,
title = {Leveraging synthetic data for robust gesture recognition},
author = {{Kapil D. Katyal} and {R. Chellappa} and {Ketul Shah} and {Arun V. Reddy} and {Judy Hoffman} and {William Paul} and {Rohita Mocharla} and {D. Handelman} and {Celso de Melo}},
year = 2023,
month = {6},
booktitle = {Defense + Commercial Sensing},
url = {https://www.semanticscholar.org/paper/922198774621861436721bd923dc0f0028872a84},
}
@inproceedings{258909084,
title = {The promise of AI and technology to improve quality of life and care for older adults},
author = {{P. Abadir} and {Ramalingam Chellappa} and {N. Choudhry} and {G. Demiris} and {Deepak Ganesan} and {Jason Karlawish} and {Rose M Li} and {Jason H. Moore} and {J. Walston} and {Benjamin Najim Alicia I. Mathias Thomas K. M. Suchi Esther Marlin Dehak Arbaje Unberath Cudjoe Saria Oh Lunde} and {Benjamin M Marlin} and {N. Dehak} and {A. Arbaje} and {M. Unberath} and {Thomas K. M. Cudjoe} and {S. Saria} and {Esther Oh} and {N. Lundebjerg} and {C. Chute} and {Phillip Phan} and {Quincy M. Samus} and {Nancy L. Schoenborn}},
year = 2023,
month = {5},
booktitle = {Nature Aging},
url = {https://www.semanticscholar.org/paper/24eafaf005bd6d73870b66525e8978b760e7b3ad},
}
@inproceedings{257697867,
title = {Biological research and self-driving labs in deep space supported by artificial intelligence},
author = {{Lauren M. Sanders} and {Ryan T. Scott} and {Jason H. Yang} and {Amina Ann Qutub} and {Héctor García Martín} and {D. Berrios} and {Jaden J. A. Hastings} and {J. Rask} and {Graham Mackintosh} and {A. Hoarfrost} and {Stuart Chalk} and {John Kalantari} and {Kia Khezeli} and {E. Antonsen} and {Joel Babdor} and {Richard Barker} and {S. Baranzini} and {Afshin Beheshti} and {Guillermo M. Delgado-Aparicio} and {B. Glicksberg} and {Casey S. Greene} and {Melissa Haendel} and {Arif A. Hamid} and {P. Heller} and {Daniel Jamieson} and {K. Jarvis} and {Svetlana V. Komarova} and {M. Komorowski} and {Prachi Kothiyal} and {A. Mahabal} and {U. Manor} and {Christopher E. Mason} and {Mona Matar} and {G. Mias} and {Jack M. Miller} and {J. Myers} and {Charlotte A. Nelson} and {Jonathan Oribello} and {Seung-min Park} and {P. Parsons-Wingerter} and {R. K. Prabhu} and {R. Reynolds} and {Amanda M. Saravia-Butler} and {S. Saria} and {A. Sawyer} and {N. Singh} and {M. Snyder} and {Frank Soboczenski} and {Karthik Soman} and {C. Theriot} and {David Van Valen} and {K. Venkateswaran} and {L. Warren} and {Liz Worthey} and {M. Zitnik} and {S. Costes}},
year = 2023,
month = {3},
booktitle = {Nature Machine Intelligence},
url = {https://www.semanticscholar.org/paper/880e7f45c1952189e350545dd98a73ef47465cba},
}
@inproceedings{258987816,
title = {MERLIon CCS Challenge Evaluation Plan},
author = {{Leibny Paola García Perera} and {Y. H. V. Chua} and {Hexin Liu} and {Fei Ting Woon} and {Andy W. H. Khong} and {J. Dauwels} and {S. Khudanpur} and {S. Styles}},
year = 2023,
month = {5},
booktitle = {},
url = {https://www.semanticscholar.org/paper/6616c330539e1f38b8d80d5aec6eaf0be98f9314},
}
@inproceedings{259251557,
title = {The CHiME-7 DASR Challenge: Distant Meeting Transcription with Multiple Devices in Diverse Scenarios},
author = {{Samuele Cornell} and {Matthew Wiesner} and {Shinji Watanabe} and {Desh Raj} and {Xuankai Chang} and {Paola García} and {Yoshiki Masuyama} and {Zhong-Qiu Wang} and {S. Squartini} and {S. Khudanpur}},
year = 2023,
month = {6},
booktitle = {7th International Workshop on Speech Processing in Everyday Environments (CHiME 2023)},
url = {https://www.semanticscholar.org/paper/d4d5fe4a35e9de845877015075f727415e83d18f},
}
@inproceedings{268083188,
title = {Evaluating Algorithmic Bias in 30-Day Hospital Readmission Models: Retrospective Analysis},
author = {{H. E. Wang} and {Jonathan P. Weiner} and {S. Saria} and {Hadi Kharrazi}},
year = 2023,
month = {3},
booktitle = {Journal of Medical Internet Research},
url = {https://www.semanticscholar.org/paper/ed42741178d7d119acb440ae5a6d6f9f87fc1523},
}
@inproceedings{268064142,
title = {Causal-structure Driven Augmentations for Text OOD Generalization},
author = {{Amir Feder} and {Yoav Wald} and {Claudia Shi} and {S. Saria} and {David M. Blei}},
year = 2023,
booktitle = {Neural Information Processing Systems},
url = {https://www.semanticscholar.org/paper/dce7db550d6edda246d7848a37f777ba3b9bbf2f},
}
@inproceedings{262185166,
title = {Using a quality improvement tool, Plan-Do-Study-Act cycle, to boost TB notification in India post-Covid-19 pandemic.},
author = {{Manoj Jain} and {Salil Bhargava} and {R. Arora} and {Rajendra P. Joshi} and {Ravinder Kumar} and {Deepak Saxena} and {Kiran Rade} and {Rebecca Martin}},
year = 2023,
month = {9},
booktitle = {Indian Journal of Tuberculosis},
url = {https://www.semanticscholar.org/paper/acbaffb72d4c3bd7c9a12d6c756a4a207dea3703},
}
@inproceedings{259137602,
title = {A Survey of Vision-Language Pre-training from the Lens of Multimodal Machine Translation},
author = {{Jeremy Gwinnup} and {Kevin Duh}},
year = 2023,
month = {6},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/c581d2ad3b092a2cc152d0c6f55fd6320f78eb3a},
}
@inproceedings{257378503,
title = {Self-FiLM: Conditioning GANs with self-supervised representations for bandwidth extension based speaker recognition},
author = {{Saurabh Kataria} and {J. Villalba} and {Laureano Moro-Vel'azquez} and {Thomas Thebaud} and {N. Dehak}},
year = 2023,
month = {3},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/03e266795339008e9366daabfd2a2db2fbd51151},
}
@inproceedings{259202766,
title = {DuTa-VC: A Duration-aware Typical-to-atypical Voice Conversion Approach with Diffusion Probabilistic Model},
author = {{Helin Wang} and {Thomas Thebaud} and {J. Villalba} and {Myra Sydnor} and {Becky Lammers} and {N. Dehak} and {L. Moro-Velázquez}},
year = 2023,
month = {6},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/bf6339e920466f2dc7dc0da5edde5b3187cf9d0d},
}
@inproceedings{258686491,
title = {Natural Language Decomposition and Interpretation of Complex Utterances},
author = {{Harsh Jhamtani} and {Hao Fang} and {Patrick Xia} and {Eran Levy} and {Jacob Andreas} and {Benjamin Van Durme}},
year = 2023,
month = {5},
booktitle = {International Joint Conference on Artificial Intelligence},
url = {https://www.semanticscholar.org/paper/68040213e9a83408cdc491ed3e235b52b537eed1},
}
@inproceedings{260870320,
title = {Birds of an odd feather: guaranteed out-of-distribution (OOD) novel category detection},
author = {{Yoav Wald} and {S. Saria}},
year = 2023,
booktitle = {Conference on Uncertainty in Artificial Intelligence},
url = {https://www.semanticscholar.org/paper/90869ce11a670ca4fb568a56a38f3ffe37161121},
}
@inproceedings{258865247,
title = {T1: Scaling Diffusion Probabilistic Fields to High-Resolution on Unified Visual Modalities},
author = {{Kangfu Mei} and {Mo Zhou} and {Vishal M. Patel}},
year = 2023,
month = {5},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/95dd7685e9b4e6195d80b22167d980be4379da44},
}
@inproceedings{259298670,
title = {Which Layer is Learning Faster? A Systematic Exploration of Layer-wise Convergence Rate for Deep Neural Networks},
author = {{Yixiong Chen} and {A. Yuille} and {Zongwei Zhou}},
year = 2023,
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/ca195fc6d5879060135a5cf6ff571b243f0c6156},
}
@inproceedings{259859140,
title = {An Extensive Exploration of Back-Translation in 60 Languages},
author = {{Paul McNamee} and {Kevin Duh}},
year = 2023,
booktitle = {Annual Meeting of the Association for Computational Linguistics},
url = {https://www.semanticscholar.org/paper/3b1cea929fb0a44886ed654c9ca88a9df959f371},
}
@inproceedings{257687723,
title = {Self-supervised Learning with Speech Modulation Dropout},
author = {{Samik Sadhu} and {H. Hermansky}},
year = 2023,
month = {3},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/eb6358eca5f4ee632f929cb384d07b6a5f04e0ef},
}
@inproceedings{257663507,
title = {CrowdDiff: Multi-Hypothesis Crowd Density Estimation Using Diffusion Models},
author = {{Y. Ranasinghe} and {Nithin Gopalakrishnan Nair} and {W. G. C. Bandara} and {Vishal M. Patel}},
year = 2023,
month = {3},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/315d4007e3cc0384c9e340160c44fd698a9ec052},
}
@inproceedings{258570384,
title = {Explicit-memory multiresolution adaptive framework for speech and music separation},
author = {{Ashwin Bellur} and {Karan Thakkar} and {Mounya Elhilali}},
year = 2023,
month = {5},
booktitle = {EURASIP Journal on Audio, Speech, and Music Processing},
url = {https://www.semanticscholar.org/paper/237ea0d3b14b924f12693a29de6fa903a3ae54ed},
}
@inproceedings{255372928,
title = {CLIP-Driven Universal Model for Organ Segmentation and Tumor Detection},
author = {{Jie Liu} and {Yixiao Zhang} and {Jieneng Chen} and {Junfei Xiao} and {Yongyi Lu} and {Bennett A. Landman} and {Yixuan Yuan} and {A. Yuille} and {Yucheng Tang} and {Zongwei Zhou}},
year = 2023,
month = {1},
booktitle = {IEEE International Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/125632627bfad80c2c688bcbed7f3ee915de7359},
}
@inproceedings{257323163,
title = {Multilingual evaluation of interpretable biomarkers to represent language and speech patterns in Parkinson's disease},
author = {{A. Favaro} and {L. Moro-Velázquez} and {A. Butala} and {C. Motley} and {Tianyu Cao} and {R. Stevens} and {J. Villalba} and {N. Dehak}},
year = 2023,
month = {3},
booktitle = {Frontiers in Neurology},
url = {https://www.semanticscholar.org/paper/3ed2d557a323c9fc39dbdd64e0ffab064b35a7f9},
}
@inproceedings{259063779,
title = {Bypass Temporal Classification: Weakly Supervised Automatic Speech Recognition with Imperfect Transcripts},
author = {{Dongji Gao} and {Matthew Wiesner} and {Hainan Xu} and {Leibny Paola García} and {Daniel Povey} and {S. Khudanpur}},
year = 2023,
month = {6},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/b620d46668d62930e41393168434118bb9a2bfcb},
}
@inproceedings{257366012,
title = {VIPeR: Provably Efficient Algorithm for Offline RL with Neural Function Approximation},
author = {{Thanh Nguyen-Tang} and {R. Arora}},
year = 2023,
month = {2},
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/7d200b868cb92657a68ac64c112a2cd0a4045f87},
}
@inproceedings{260125020,
title = {SwinMM: Masked Multi-view with Swin Transformers for 3D Medical Image Segmentation},
author = {{Yiqing Wang} and {Zihan Li} and {Jieru Mei} and {Zi-Ying Wei} and {Li Liu} and {Chen Wang} and {Shengtian Sang} and {A. Yuille} and {Cihang Xie} and {Yuyin Zhou}},
year = 2023,
month = {7},
booktitle = {International Conference on Medical Image Computing and Computer-Assisted Intervention},
url = {https://www.semanticscholar.org/paper/c84e03c8ba7feaa2679a90b1637f3b079be15aa9},
}
@inproceedings{266199727,
title = {Constrained Synthetic Sampling for Augmentation of Crackle Lung Sounds},
author = {{A. Kala} and {Mounya Elhilali}},
year = 2023,
month = {7},
booktitle = {Annual International Conference of the IEEE Engineering in Medicine and Biology Society},
url = {https://www.semanticscholar.org/paper/d463716d4860ccc8a42190b9d90bc94af45db1ac},
}
@inproceedings{258079344,
title = {Regularizing Contrastive Predictive Coding for Speech Applications},
author = {{Saurabhchand Bhati} and {J. Villalba} and {Piotr Żelasko} and {L. Moro-Velázquez} and {N. Dehak}},
year = 2023,
month = {4},
booktitle = {},
url = {https://www.semanticscholar.org/paper/47ac48e7ee37e7cf4d3bb183477e42d6c5632b64},
}
@inproceedings{257378087,
title = {Data Portraits: Recording Foundation Model Training Data},
author = {{Marc Marone} and {Benjamin Van Durme}},
year = 2023,
month = {3},
booktitle = {Neural Information Processing Systems},
url = {https://www.semanticscholar.org/paper/572b92972eff7501ca2b109b8998cdcb69aa1958},
}
@inproceedings{260003954,
title = {Asynchronous, Spatiotemporal Filtering using an Analog Cellular Neural Network Processor},
author = {{Jonah P. Sengupta} and {M. A. Tomlinson} and {Daniel R. Mendat} and {M. Villemur} and {A. Andreou}},
year = 2023,
month = {5},
booktitle = {International Symposium on Circuits and Systems},
url = {https://www.semanticscholar.org/paper/30446a1b3ca0fc61c3b672d5a284e0dcb761fe6d},
}
@inproceedings{257848515,
title = {AC Transit Fuel Cell Electric Bus Progress Report (Data Period Focus: Jan. 2020 through Dec. 2020)},
author = {{L. Eudy} and {Matt Post}},
year = 2023,
month = {3},
booktitle = {},
url = {https://www.semanticscholar.org/paper/69cf8aae9aa20f261b91ad67636fc064a2376e7a},
}
@inproceedings{259047417,
title = {Interpretable Speech Features vs. DNN Embeddings: What to Use in the Automatic Assessment of Parkinson's Disease in Multi-lingual Scenarios},
author = {{A. Favaro} and {Yi-Ting Tsai} and {A. Butala} and {Thomas Thebaud} and {J. Villalba} and {N. Dehak} and {L. Moro-Velázquez}},
year = 2023,
month = {6},
booktitle = {medRxiv},
url = {https://www.semanticscholar.org/paper/8d18efe22ad66b53a0a13fc71c9b57c41b7790d0},
}
@inproceedings{258841479,
title = {Multilingual Pixel Representations for Translation and Effective Cross-lingual Transfer},
author = {{Elizabeth Salesky} and {Neha Verma} and {Philipp Koehn} and {Matt Post}},
year = 2023,
month = {5},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/c60736e61f8961ec535ecfdc6f0398925d34d0b8},
}
@inproceedings{259993644,
title = {Electrostatic Acoustic Sensor with an Impedance-Matched Diaphragm Characterized for Body Sound Monitoring.},
author = {{V. Rennoll} and {Ian McLane} and {Adebayo A. Eisape} and {D. Grant} and {Helena Hahn} and {Mounya Elhilali} and {James E. West}},
year = 2023,
month = {7},
booktitle = {ACS Applied Bio Materials},
url = {https://www.semanticscholar.org/paper/bf5172b246adb601b731618108ba8ce5d1367177},
}
@inproceedings{258997982,
title = {Deep Stroop: Using eye tracking and speech processing to characterize people with neurodegenerative disorders while performing the Stroop Test},
author = {{T. Meyer} and {A. Favaro} and {Tianyu Cao} and {A. Butala} and {E. Oh} and {C. Motley} and {P. Irazoqui} and {N. Dehak} and {L. Moro-Velázquez}},
year = 2023,
month = {6},
booktitle = {medRxiv},
url = {https://www.semanticscholar.org/paper/172e04d89d89109626cba6a5b2d4d8a736bd145d},
}
@inproceedings{259302532,
title = {Online speech synthesis using a chronically implanted brain-computer interface in an individual with ALS},
author = {{Miguel Angrick} and {Shiyu Luo} and {Qinwan Rabbani} and {Daniel N Candrea} and {Samyak Shah} and {Griffin W. Milsap} and {W. Anderson} and {C. Gordon} and {Kathryn R Rosenblatt} and {L. Clawson} and {N. Maragakis} and {F. Tenore} and {M. Fifer} and {H. Hermansky} and {N. Ramsey} and {N. Crone}},
year = 2023,
month = {7},
booktitle = {medRxiv},
url = {https://www.semanticscholar.org/paper/3991788eee23646956065f50303a62379c1150dd},
}
@inproceedings{262056669,
title = {OpenAI Cribbed Our Tax Example, But Can GPT-4 Really Do Tax?},
author = {{Andrew Blair-Stanek} and {Nils Holzenberger} and {Benjamin Van Durme}},
year = 2023,
month = {9},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/a77de1f2e2dc253798e5ca9bee71e4d651dc30cd},
}
@inproceedings{263152081,
title = {Speech Collage: Code-Switched Audio Generation by Collaging Monolingual Corpora},
author = {{A. Hussein} and {Dorsa Zeinali} and {Ondrej Klejch} and {Matthew Wiesner} and {Brian Yan} and {Shammur A. Chowdhury} and {Ahmed Ali} and {Shinji Watanabe} and {S. Khudanpur}},
year = 2023,
month = {9},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/fa5ebb425c57f6c4f1c36a7200ef1da867346e8c},
}
@inproceedings{258374319,
title = {Perception of global properties, objects, and settings in natural auditory scenes},
author = {{Margaret A. McMullin} and {Nathan C Higgins} and {Brian Gygi} and {Rohit Kumar} and {Mounya Elhilali} and {J. Snyder}},
year = 2023,
month = {3},
booktitle = {Journal of the Acoustical Society of America},
url = {https://www.semanticscholar.org/paper/8890c3afc837ab0871d11f6ed17bfb6109943bff},
}
@inproceedings{258999199,
title = {Continual Learning for Abdominal Multi-Organ and Tumor Segmentation},
author = {{Yixiao Zhang} and {Xinyi Li} and {Huimiao Chen} and {A. Yuille} and {Yaoyao Liu} and {Zongwei Zhou}},
year = 2023,
month = {6},
booktitle = {International Conference on Medical Image Computing and Computer-Assisted Intervention},
url = {https://www.semanticscholar.org/paper/7f29e3cb212df207146c567a420999cba6d9fff8},
}
@inproceedings{263152210,
title = {Learning From Flawed Data: Weakly Supervised Automatic Speech Recognition},
author = {{Dongji Gao} and {Hainan Xu} and {Desh Raj} and {Leibny Paola García Perera} and {Daniel Povey} and {S. Khudanpur}},
year = 2023,
month = {9},
booktitle = {Automatic Speech Recognition & Understanding},
url = {https://www.semanticscholar.org/paper/4df2d56e2c81d315e8ead7c3eaf840064ea3665e},
}
@inproceedings{258997975,
title = {Automating analysis of eye movement and feature extraction for different neurodegenerative disorders},
author = {{D. Li} and {A. Butala} and {T. Meyer} and {E. Oh} and {C. Motley} and {L. Moro-Velázquez} and {N. Dehak}},
year = 2023,
month = {6},
booktitle = {medRxiv},
url = {https://www.semanticscholar.org/paper/2b5f1cfc2b507561bd463b0a5ac14fd92d75dc50},
}
@inproceedings{259991385,
title = {GLSFormer: Gated - Long, Short Sequence Transformer for Step Recognition in Surgical Videos},
author = {{Nisarg A. Shah} and {S. Sikder} and {S. Vedula} and {Vishal M. Patel}},
year = 2023,
month = {7},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/330bf5c3162606581ebfba1f744e1f7da90c5de4},
}
@inproceedings{260715129,
title = {Best Paper Section IEEE International Conference on Automatic Face and Gesture Recognition 2021},
author = {{Rachael E. Jack} and {Vishal M. Patel} and {P. Turaga} and {Mayank Vatsa} and {Ramalingam Chellappa} and {A. Pentland} and {Richa Singh}},
year = 2023,
month = {7},
booktitle = {IEEE Transactions on Biometrics Behavior and Identity Science},
url = {https://www.semanticscholar.org/paper/51bdfb0e1834a150abd52ad73b63e80ad690aa80},
}
@inproceedings{257505032,
title = {InstMove: Instance Motion for Object-centric Video Segmentation},
author = {{Qihao Liu} and {Junfeng Wu} and {Yi Jiang} and {Xiang Bai} and {A. Yuille} and {S. Bai}},
year = 2023,
month = {3},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/0e60c1229d7963b605b83cb10a90ed6a8cf79149},
}
@inproceedings{257532548,
title = {Deep Learning for Cross-Domain Few-Shot Visual Recognition: A Survey},
author = {{Huali Xu} and {Shuaifeng Zhi} and {Shuzhou Sun} and {Vishal M. Patel} and {Li Liu}},
year = 2023,
month = {3},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/095138d9207da38bce4914c569e2f312927213b5},
}
@inproceedings{260704213,
title = {Cross-Dataset Adaptation for Instrument Classification in Cataract Surgery Videos},
author = {{Jay N. Paranjape} and {S. Sikder} and {Vishal M. Patel} and {S. Vedula}},
year = 2023,
month = {7},
booktitle = {International Conference on Medical Image Computing and Computer-Assisted Intervention},
url = {https://www.semanticscholar.org/paper/648a8bc5f5e6354aa56a899c327715bfaa80944d},
}
@inproceedings{257404851,
title = {Stabilized training of joint energy-based models and their practical applications},
author = {{Martin Sustek} and {Samik Sadhu} and {L. Burget} and {H. Hermansky} and {J. Villalba} and {L. Moro-Velázquez} and {N. Dehak}},
year = 2023,
month = {3},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/46fd16213979b00e741b926539ad4ba7a1acd1cf},
}
@inproceedings{257985028,
title = {Diffusion Models as Masked Autoencoders},
author = {{Chen Wei} and {K. Mangalam} and {Po-Yao (Bernie) Huang} and {Yanghao Li} and {Haoqi Fan} and {Hu Xu} and {Huiyu Wang} and {Cihang Xie} and {A. Yuille} and {Christoph Feichtenhofer}},
year = 2023,
month = {4},
booktitle = {IEEE International Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/b032f324a0d4a24fd917551345bd100dc368e41a},
}
@inproceedings{261637808,
title = {Editorial: Artificial intelligence for human function and disability},
author = {{Denis Newman-Griffis} and {Bart Desmet} and {Ayah Zirikly} and {Suzanne Tamang} and {Chih-Hung Chang}},
year = 2023,
month = {9},
booktitle = {Frontiers Digit. Health},
url = {https://www.semanticscholar.org/paper/251b6ab5f8aa64447bcab84b2078a7198afc4ac3},
}
@inproceedings{259203410,
title = {HK-LegiCoST: Leveraging Non-Verbatim Transcripts for Speech Translation},
author = {{Cihan Xiao} and {Henry Li Xinyuan} and {Jinyi Yang} and {Dongji Gao} and {Matthew Wiesner} and {Kevin Duh} and {S. Khudanpur}},
year = 2023,
month = {6},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/74173dec94055d7f4051aa2e80be31ccd2bde596},
}
@inproceedings{254366617,
title = {AsyInst: Asymmetric Affinity with DepthGrad and Color for Box-Supervised Instance Segmentation},
author = {{Si-Jia Yang} and {Longlong Jing} and {Junfei Xiao} and {Hang Zhao} and {A. Yuille} and {Yingwei Li}},
year = 2022,
month = {12},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/1358ad196c4e300612fb3b65a2f3578836941384},
}
Most entity linking systems, whether mono or multilingual, link mentions to a single English knowledge base. Few have considered linking non-English text to a non-English KB, and therefore, transferring an English entity linking model to both a new document and KB language. We consider the task of zero-shot cross-language transfer of entity linking systems to a new language and KB. We find that a system trained with multilingual representations does reasonably well, and propose improvements to system training that lead to improved recall in most datasets, often matching the in-language performance. We further conduct a detailed evaluation to elucidate the challenges of this setting.
@inproceedings{schumacher-etal-2022-zero,
title = "Zero-shot Cross-Language Transfer of Monolingual Entity Linking Models",
author = "Schumacher, Elliot and
Mayfield, James and
Dredze, Mark",
editor = {Ataman, Duygu and
Gonen, Hila and
Ruder, Sebastian and
Firat, Orhan and
G{\"u}l Sahin, G{\"o}zde and
Mirzakhalov, Jamshidbek},
booktitle = "Proceedings of the 2nd Workshop on Multi-lingual Representation Learning (MRL)",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates (Hybrid)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.mrl-1.4",
doi = "10.18653/v1/2022.mrl-1.4",
pages = "38--51",
abstract = "Most entity linking systems, whether mono or multilingual, link mentions to a single English knowledge base. Few have considered linking non-English text to a non-English KB, and therefore, transferring an English entity linking model to both a new document and KB language. We consider the task of zero-shot cross-language transfer of entity linking systems to a new language and KB. We find that a system trained with multilingual representations does reasonably well, and propose improvements to system training that lead to improved recall in most datasets, often matching the in-language performance. We further conduct a detailed evaluation to elucidate the challenges of this setting.",
}
@inproceedings{254877586,
title = {When Do Decompositions Help for Machine Reading?},
author = {{Kangda Wei} and {Dawn J Lawrie} and {Benjamin Van Durme} and {Yunmo Chen} and {Orion Weller}},
year = 2022,
month = {12},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/624ea7bdaf7e8e3f7bd76f72aa665b562f0dd70a},
}
@inproceedings{254125357,
title = {Unite and Conquer: Cross Dataset Multimodal Synthesis using Diffusion Models},
author = {{Nithin Gopalakrishnan Nair} and {W. G. C. Bandara} and {Vishal M. Patel}},
year = 2022,
month = {12},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/24e6c62fd28da4ecf748620e1f25eae7337bad40},
}
@inproceedings{254563914,
title = {GPU-accelerated Guided Source Separation for Meeting Transcription},
author = {{Desh Raj} and {Daniel Povey} and {S. Khudanpur}},
year = 2022,
month = {12},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/ad9199a35c5ce4738c39bb4af8abf7caee418365},
}
We present an empirical study on methods for span finding, the selection of consecutive tokens in text for some downstream tasks. We focus on approaches that can be employed in training end-to-end information extraction systems, and find there is no definitive solution without considering task properties, and provide our observations to help with future design choices: 1) a tagging approach often yields higher precision while span enumeration and boundary prediction provide higher recall; 2) span type information can benefit a boundary prediction approach; 3) additional contextualization does not help span finding in most cases.
@inproceedings{gu-etal-2022-empirical,
title = "An Empirical Study on Finding Spans",
author = "Gu, Weiwei and
Zheng, Boyuan and
Chen, Yunmo and
Chen, Tongfei and
Van Durme, Benjamin",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.264",
doi = "10.18653/v1/2022.emnlp-main.264",
pages = "3976--3983",
abstract = "We present an empirical study on methods for span finding, the selection of consecutive tokens in text for some downstream tasks. We focus on approaches that can be employed in training end-to-end information extraction systems, and find there is no definitive solution without considering task properties, and provide our observations to help with future design choices: 1) a tagging approach often yields higher precision while span enumeration and boundary prediction provide higher recall; 2) span type information can benefit a boundary prediction approach; 3) additional contextualization does not help span finding in most cases.",
}
@inproceedings{254636282,
title = {Bi-Noising Diffusion: Towards Conditional Diffusion Models with Generative Restoration Priors},
author = {{Kangfu Mei} and {Nithin Gopalakrishnan Nair} and {Vishal M. Patel}},
year = 2022,
month = {12},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/e5fec7e9103c9edbc4c6b4bb1a47e53593c667bb},
}
In natural language understanding (NLU) production systems, users{‘} evolving needs necessitate the addition of new features over time, indexed by new symbols added to the meaning representation space. This requires additional training data and results in ever-growing datasets. We present the first systematic investigation into this incremental symbol learning scenario. Our analysis reveals a troubling quirk in building broad-coverage NLU systems: as the training dataset grows, performance on a small set of new symbols often decreases. We show that this trend holds for multiple mainstream models on two common NLU tasks: intent recognition and semantic parsing. Rejecting class imbalance as the sole culprit, we reveal that the trend is closely associated with an effect we call source signal dilution, where strong lexical cues for the new symbol become diluted as the training dataset grows. Selectively dropping training examples to prevent dilution often reverses the trend, showing the over-reliance of mainstream neural NLU models on simple lexical cues.
@inproceedings{stengel-eskin-etal-2022-data,
title = "When More Data Hurts: A Troubling Quirk in Developing Broad-Coverage Natural Language Understanding Systems",
author = "Stengel-Eskin, Elias and
Platanios, Emmanouil Antonios and
Pauls, Adam and
Thomson, Sam and
Fang, Hao and
Van Durme, Benjamin and
Eisner, Jason and
Su, Yu",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.789",
doi = "10.18653/v1/2022.emnlp-main.789",
pages = "11473--11487",
abstract = "In natural language understanding (NLU) production systems, users{'} evolving needs necessitate the addition of new features over time, indexed by new symbols added to the meaning representation space. This requires additional training data and results in ever-growing datasets. We present the first systematic investigation into this incremental symbol learning scenario. Our analysis reveals a troubling quirk in building broad-coverage NLU systems: as the training dataset grows, performance on a small set of new symbols often decreases. We show that this trend holds for multiple mainstream models on two common NLU tasks: intent recognition and semantic parsing. Rejecting class imbalance as the sole culprit, we reveal that the trend is closely associated with an effect we call source signal dilution, where strong lexical cues for the new symbol become diluted as the training dataset grows. Selectively dropping training examples to prevent dilution often reverses the trend, showing the over-reliance of mainstream neural NLU models on simple lexical cues.",
}
Recent years have witnessed rapid advancements in machine translation, but the state-of-the-art machine translation system still can not satisfy the high requirements in some rigorous translation scenarios. Computer-aided translation (CAT) provides a promising solution to yield a high-quality translation with a guarantee. Unfortunately, due to the lack of popular benchmarks, the research on CAT is not well developed compared with machine translation. In this year, we hold a new shared task called Word-level AutoCompletion (WLAC) for CAT in WMT. Specifically, we introduce some resources to train a WLAC model, and particularly we collect data from CAT systems as a part of test data for this shared task. In addition, we employ both automatic and human evaluations to measure the performance of the submitted systems, and our final evaluation results reveal some findings for the WLAC task.
@inproceedings{casacuberta-etal-2022-findings,
title = "Findings of the Word-Level {A}uto{C}ompletion Shared Task in {WMT} 2022",
author = "Casacuberta, Francisco and
Foster, George and
Huang, Guoping and
Koehn, Philipp and
Kovacs, Geza and
Liu, Lemao and
Shi, Shuming and
Watanabe, Taro and
Zong, Chengqing",
editor = {Koehn, Philipp and
Barrault, Lo{\"\i}c and
Bojar, Ond{\v{r}}ej and
Bougares, Fethi and
Chatterjee, Rajen and
Costa-juss{\`a}, Marta R. and
Federmann, Christian and
Fishel, Mark and
Fraser, Alexander and
Freitag, Markus and
Graham, Yvette and
Grundkiewicz, Roman and
Guzman, Paco and
Haddow, Barry and
Huck, Matthias and
Jimeno Yepes, Antonio and
Kocmi, Tom and
Martins, Andr{\'e} and
Morishita, Makoto and
Monz, Christof and
Nagata, Masaaki and
Nakazawa, Toshiaki and
Negri, Matteo and
N{\'e}v{\'e}ol, Aur{\'e}lie and
Neves, Mariana and
Popel, Martin and
Turchi, Marco and
Zampieri, Marcos},
booktitle = "Proceedings of the Seventh Conference on Machine Translation (WMT)",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates (Hybrid)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.wmt-1.75",
pages = "812--820",
abstract = "Recent years have witnessed rapid advancements in machine translation, but the state-of-the-art machine translation system still can not satisfy the high requirements in some rigorous translation scenarios. Computer-aided translation (CAT) provides a promising solution to yield a high-quality translation with a guarantee. Unfortunately, due to the lack of popular benchmarks, the research on CAT is not well developed compared with machine translation. In this year, we hold a new shared task called Word-level AutoCompletion (WLAC) for CAT in WMT. Specifically, we introduce some resources to train a WLAC model, and particularly we collect data from CAT systems as a part of test data for this shared task. In addition, we employ both automatic and human evaluations to measure the performance of the submitted systems, and our final evaluation results reveal some findings for the WLAC task.",
}
Mental health stigma prevents many individuals from receiving the appropriate care, and social psychology studies have shown that mental health tends to be overlooked in men. In this work, we investigate gendered mental health stigma in masked language models. In doing so, we operationalize mental health stigma by developing a framework grounded in psychology research: we use clinical psychology literature to curate prompts, then evaluate the models{‘} propensity to generate gendered words. We find that masked language models capture societal stigma about gender in mental health: models are consistently more likely to predict female subjects than male in sentences about having a mental health condition (32{\%} vs. 19{\%}), and this disparity is exacerbated for sentences that indicate treatment-seeking behavior. Furthermore, we find that different models capture dimensions of stigma differently for men and women, associating stereotypes like anger, blame, and pity more with women with mental health conditions than with men. In showing the complex nuances of models{‘} gendered mental health stigma, we demonstrate that context and overlapping dimensions of identity are important considerations when assessing computational models{‘} social biases.
@inproceedings{lin-etal-2022-gendered,
title = "Gendered Mental Health Stigma in Masked Language Models",
author = "Lin, Inna and
Njoo, Lucille and
Field, Anjalie and
Sharma, Ashish and
Reinecke, Katharina and
Althoff, Tim and
Tsvetkov, Yulia",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.139",
doi = "10.18653/v1/2022.emnlp-main.139",
pages = "2152--2170",
abstract = "Mental health stigma prevents many individuals from receiving the appropriate care, and social psychology studies have shown that mental health tends to be overlooked in men. In this work, we investigate gendered mental health stigma in masked language models. In doing so, we operationalize mental health stigma by developing a framework grounded in psychology research: we use clinical psychology literature to curate prompts, then evaluate the models{'} propensity to generate gendered words. We find that masked language models capture societal stigma about gender in mental health: models are consistently more likely to predict female subjects than male in sentences about having a mental health condition (32{\%} vs. 19{\%}), and this disparity is exacerbated for sentences that indicate treatment-seeking behavior. Furthermore, we find that different models capture dimensions of stigma differently for men and women, associating stereotypes like anger, blame, and pity more with women with mental health conditions than with men. In showing the complex nuances of models{'} gendered mental health stigma, we demonstrate that context and overlapping dimensions of identity are important considerations when assessing computational models{'} social biases.",
}
For the most part, NLP applications operate at the sentence level. Since sentences occur most naturally in documents, they must be extracted and segmented via the use of a segmenter, of which there are a handful of options. There has been some work evaluating the performance of segmenters on intrinsic metrics, that look at their ability to recover human-segmented sentence boundaries, but there has been no work looking at the effect of segmenters on downstream tasks. We ask the question, {“}does segmentation matter?{”} and attempt to answer it on the task of machine translation. We consider two settings: the application of segmenters to a black-box system whose training segmentation is mostly unknown, as well as the variation in performance when segmenters are applied to the training process, too. We find that the choice of segmenter largely does not matter, so long as its behavior is not one of extreme under- or over-segmentation. For such settings, we provide some qualitative analysis examining their harms, and point the way towards document-level processing.
@inproceedings{wicks-post-2022-sentence,
title = "Does Sentence Segmentation Matter for Machine Translation?",
author = "Wicks, Rachel and
Post, Matt",
editor = {Koehn, Philipp and
Barrault, Lo{\"\i}c and
Bojar, Ond{\v{r}}ej and
Bougares, Fethi and
Chatterjee, Rajen and
Costa-juss{\`a}, Marta R. and
Federmann, Christian and
Fishel, Mark and
Fraser, Alexander and
Freitag, Markus and
Graham, Yvette and
Grundkiewicz, Roman and
Guzman, Paco and
Haddow, Barry and
Huck, Matthias and
Jimeno Yepes, Antonio and
Kocmi, Tom and
Martins, Andr{\'e} and
Morishita, Makoto and
Monz, Christof and
Nagata, Masaaki and
Nakazawa, Toshiaki and
Negri, Matteo and
N{\'e}v{\'e}ol, Aur{\'e}lie and
Neves, Mariana and
Popel, Martin and
Turchi, Marco and
Zampieri, Marcos},
booktitle = "Proceedings of the Seventh Conference on Machine Translation (WMT)",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates (Hybrid)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.wmt-1.78",
pages = "843--854",
abstract = "For the most part, NLP applications operate at the sentence level. Since sentences occur most naturally in documents, they must be extracted and segmented via the use of a segmenter, of which there are a handful of options. There has been some work evaluating the performance of segmenters on intrinsic metrics, that look at their ability to recover human-segmented sentence boundaries, but there has been no work looking at the effect of segmenters on downstream tasks. We ask the question, {``}does segmentation matter?{''} and attempt to answer it on the task of machine translation. We consider two settings: the application of segmenters to a black-box system whose training segmentation is mostly unknown, as well as the variation in performance when segmenters are applied to the training process, too. We find that the choice of segmenter largely does not matter, so long as its behavior is not one of extreme under- or over-segmentation. For such settings, we provide some qualitative analysis examining their harms, and point the way towards document-level processing.",
}
@inproceedings{254877370,
title = {Unleashing the Power of Visual Prompting At the Pixel Level},
author = {{Junyang Wu} and {Xianhang Li} and {Chen Wei} and {Huiyu Wang} and {A. Yuille} and {Yuyin Zhou} and {Cihang Xie}},
year = 2022,
month = {12},
booktitle = {Trans. Mach. Learn. Res.},
url = {https://www.semanticscholar.org/paper/7786825fd653b398c3975c3ff876459307d871f4},
}
Most existing dialogue systems fail to respond properly to potentially unsafe user utterances by either ignoring or passively agreeing with them. To address this issue, we introduce ProsocialDialog, the first large-scale multi-turn dialogue dataset to teach conversational agents to respond to problematic content following social norms. Covering diverse unethical, problematic, biased, and toxic situations, ProsocialDialog contains responses that encourage prosocial behavior, grounded in commonsense social rules (i.e., rules-of-thumb, RoTs). Created via a human-AI collaborative framework, ProsocialDialog consists of 58K dialogues, with 331K utterances, 160K unique RoTs, and 497K dialogue safety labels accompanied by free-form rationales.With this dataset, we introduce a dialogue safety detection module, Canary, capable of generating RoTs given conversational context, and a socially-informed dialogue agent, Prost. Empirical results show that Prost generates more socially acceptable dialogues compared to other state-of-the-art language and dialogue models in both in-domain and out-of-domain settings. Additionally, Canary effectively guides conversational agents and off-the-shelf language models to generate significantly more prosocial responses. Our work highlights the promise and importance of creating and steering conversational AI to be socially responsible.
@inproceedings{kim-etal-2022-prosocialdialog,
title = "{P}rosocial{D}ialog: A Prosocial Backbone for Conversational Agents",
author = "Kim, Hyunwoo and
Yu, Youngjae and
Jiang, Liwei and
Lu, Ximing and
Khashabi, Daniel and
Kim, Gunhee and
Choi, Yejin and
Sap, Maarten",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.267",
doi = "10.18653/v1/2022.emnlp-main.267",
pages = "4005--4029",
abstract = "Most existing dialogue systems fail to respond properly to potentially unsafe user utterances by either ignoring or passively agreeing with them. To address this issue, we introduce ProsocialDialog, the first large-scale multi-turn dialogue dataset to teach conversational agents to respond to problematic content following social norms. Covering diverse unethical, problematic, biased, and toxic situations, ProsocialDialog contains responses that encourage prosocial behavior, grounded in commonsense social rules (i.e., rules-of-thumb, RoTs). Created via a human-AI collaborative framework, ProsocialDialog consists of 58K dialogues, with 331K utterances, 160K unique RoTs, and 497K dialogue safety labels accompanied by free-form rationales.With this dataset, we introduce a dialogue safety detection module, Canary, capable of generating RoTs given conversational context, and a socially-informed dialogue agent, Prost. Empirical results show that Prost generates more socially acceptable dialogues compared to other state-of-the-art language and dialogue models in both in-domain and out-of-domain settings. Additionally, Canary effectively guides conversational agents and off-the-shelf language models to generate significantly more prosocial responses. Our work highlights the promise and importance of creating and steering conversational AI to be socially responsible.",
}
Building pretrained language models is considered expensive and data-intensive, but must we increase dataset size to achieve better performance? We propose an alternative to larger training sets by automatically identifying smaller yet domain-representative subsets. We extend Cynical Data Selection, a statistical sentence scoring method that conditions on a representative target domain corpus. As an example, we treat the OntoNotes corpus as a target domain and pretrain a RoBERTa-like encoder from a cynically selected subset of the Pile. On both perplexity and across several downstream tasks in the target domain, it consistently outperforms random selection with 20x less data, 3x fewer training iterations, and 2x less estimated cloud compute cost, validating the recipe of automatic document selection for LM pretraining.
@inproceedings{feng-etal-2022-automatic,
title = "Automatic Document Selection for Efficient Encoder Pretraining",
author = "Feng, Yukun and
Xia, Patrick and
Van Durme, Benjamin and
Sedoc, Jo{\~a}o",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.647",
doi = "10.18653/v1/2022.emnlp-main.647",
pages = "9522--9530",
abstract = "Building pretrained language models is considered expensive and data-intensive, but must we increase dataset size to achieve better performance? We propose an alternative to larger training sets by automatically identifying smaller yet domain-representative subsets. We extend Cynical Data Selection, a statistical sentence scoring method that conditions on a representative target domain corpus. As an example, we treat the OntoNotes corpus as a target domain and pretrain a RoBERTa-like encoder from a cynically selected subset of the Pile. On both perplexity and across several downstream tasks in the target domain, it consistently outperforms random selection with 20x less data, 3x fewer training iterations, and 2x less estimated cloud compute cost, validating the recipe of automatic document selection for LM pretraining.",
}
Multilingual pretrained models have shown strong cross-lingual transfer ability. Some works used code-switching sentences, which consist of tokens from multiple languages, to enhance the cross-lingual representation further, and have shown success in many zero-shot cross-lingual tasks. However, code-switched tokens are likely to cause grammatical incoherence in newly substituted sentences, and negatively affect the performance on token-sensitive tasks, such as Part-of-Speech (POS) tagging and Named-Entity-Recognition (NER). This paper mitigates the limitation of the code-switching method by not only making the token replacement but considering the similarity between the context and the switched tokens so that the newly substituted sentences are grammatically consistent during both training and inference. We conduct experiments on cross-lingual POS and NER over 30+ languages, and demonstrate the effectiveness of our method by outperforming the mBERT by 0.95 and original code-switching method by 1.67 on F1 scores.
@inproceedings{feng-etal-2022-toward,
title = "Toward the Limitation of Code-Switching in Cross-Lingual Transfer",
author = "Feng, Yukun and
Li, Feng and
Koehn, Philipp",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.400",
doi = "10.18653/v1/2022.emnlp-main.400",
pages = "5966--5971",
abstract = "Multilingual pretrained models have shown strong cross-lingual transfer ability. Some works used code-switching sentences, which consist of tokens from multiple languages, to enhance the cross-lingual representation further, and have shown success in many zero-shot cross-lingual tasks. However, code-switched tokens are likely to cause grammatical incoherence in newly substituted sentences, and negatively affect the performance on token-sensitive tasks, such as Part-of-Speech (POS) tagging and Named-Entity-Recognition (NER). This paper mitigates the limitation of the code-switching method by not only making the token replacement but considering the similarity between the context and the switched tokens so that the newly substituted sentences are grammatically consistent during both training and inference. We conduct experiments on cross-lingual POS and NER over 30+ languages, and demonstrate the effectiveness of our method by outperforming the mBERT by 0.95 and original code-switching method by 1.67 on F1 scores.",
}
@inproceedings{254125164,
title = {Super-CLEVR: A Virtual Benchmark to Diagnose Domain Robustness in Visual Reasoning},
author = {{Zhuowan Li} and {Xingrui Wang} and {Elias Stengel-Eskin} and {Adam Kortylewski} and {Wufei Ma} and {Benjamin Van Durme} and {Alan Yuille Johns Hopkins University} and {U. California} and {Max Planck Institute for Informatics} and {U. Freiburg}},
year = 2022,
month = {12},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/cb6365a1aa3133318ce7fa2461b6d1d48cd8152e},
}
@inproceedings{254767215,
title = {Distributed representations of natural body pose in visual cortex},
author = {{Hongru Zhu} and {Yijun Ge} and {Alexander Bratch} and {A. Yuille} and {Kendrick Norris Kay} and {D. Kersten}},
year = 2022,
month = {12},
booktitle = {Journal of Vision},
url = {https://www.semanticscholar.org/paper/0f737f04ade2ef8f4a360dc42296476a55fa49d3},
}
Bilingual lexicons form a critical component of various natural language processing applications, including unsupervised and semisupervised machine translation and crosslingual information retrieval. In this work, we improve bilingual lexicon induction performance across 40 language pairs with a graph-matching method based on optimal transport. The method is especially strong with low amounts of supervision.
@inproceedings{marchisio-etal-2022-bilingual,
title = "Bilingual Lexicon Induction for Low-Resource Languages using Graph Matching via Optimal Transport",
author = "Marchisio, Kelly and
Saad-Eldin, Ali and
Duh, Kevin and
Priebe, Carey and
Koehn, Philipp",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.164",
doi = "10.18653/v1/2022.emnlp-main.164",
pages = "2545--2561",
abstract = "Bilingual lexicons form a critical component of various natural language processing applications, including unsupervised and semisupervised machine translation and crosslingual information retrieval. In this work, we improve bilingual lexicon induction performance across 40 language pairs with a graph-matching method based on optimal transport. The method is especially strong with low amounts of supervision.",
}
@inproceedings{254879636,
title = {Automatic Extraction of Oculographic Signals as Digital Biomarkers for Alzheimer's Disease},
author = {{Trevor Meyer} and {L. Moro-Velázquez} and {Seneca Motley} and {A. Butala} and {Ashley M Paul} and {Quincy M. Samus} and {Pedro P. Irazoqui} and {N. Dehak} and {Esther S. Oh}},
year = 2022,
month = {12},
booktitle = {Alzheimer's & Dementia},
url = {https://www.semanticscholar.org/paper/e5a0988cdd73b981611be9fe06e0b7328ff1c0d0},
}
Additive interventions are a recently-proposed mechanism for controlling target-side attributes in neural machine translation by modulating the encoder{‘}s representation of a source sequence as opposed to manipulating the raw source sequence as seen in most previous tag-based approaches. In this work we examine the role of additive interventions in a large-scale multi-domain machine translation setting and compare its performance in various inference scenarios. We find that while the performance difference is small between intervention-based systems and tag-based systems when the domain label matches the test domain, intervention-based systems are robust to label error, making them an attractive choice under label uncertainty. Further, we find that the superiority of single-domain fine-tuning comes under question when training data is scaled, contradicting previous findings.
@inproceedings{rippeth-post-2022-additive,
title = "Additive Interventions Yield Robust Multi-Domain Machine Translation Models",
author = "Rippeth, Elijah and
Post, Matt",
editor = {Koehn, Philipp and
Barrault, Lo{\"\i}c and
Bojar, Ond{\v{r}}ej and
Bougares, Fethi and
Chatterjee, Rajen and
Costa-juss{\`a}, Marta R. and
Federmann, Christian and
Fishel, Mark and
Fraser, Alexander and
Freitag, Markus and
Graham, Yvette and
Grundkiewicz, Roman and
Guzman, Paco and
Haddow, Barry and
Huck, Matthias and
Jimeno Yepes, Antonio and
Kocmi, Tom and
Martins, Andr{\'e} and
Morishita, Makoto and
Monz, Christof and
Nagata, Masaaki and
Nakazawa, Toshiaki and
Negri, Matteo and
N{\'e}v{\'e}ol, Aur{\'e}lie and
Neves, Mariana and
Popel, Martin and
Turchi, Marco and
Zampieri, Marcos},
booktitle = "Proceedings of the Seventh Conference on Machine Translation (WMT)",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates (Hybrid)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.wmt-1.14",
pages = "220--232",
abstract = "Additive interventions are a recently-proposed mechanism for controlling target-side attributes in neural machine translation by modulating the encoder{'}s representation of a source sequence as opposed to manipulating the raw source sequence as seen in most previous tag-based approaches. In this work we examine the role of additive interventions in a large-scale multi-domain machine translation setting and compare its performance in various inference scenarios. We find that while the performance difference is small between intervention-based systems and tag-based systems when the domain label matches the test domain, intervention-based systems are robust to label error, making them an attractive choice under label uncertainty. Further, we find that the superiority of single-domain fine-tuning comes under question when training data is scaled, contradicting previous findings.",
}
Children acquiring English make systematic errors on subject control sentences even after they have reached near-adult competence (Chomsky, 1969), possibly due to heuristics based on semantic roles (Maratsos, 1974).Given the advanced fluency of large generative language models, we ask whether model outputs are consistent with these heuristics, and to what degree different models are consistent with each other. We find that models can be categorized by behavior into three separate groups, with broad differences between the groups. The outputs of models in the largest group are consistent with positional heuristics that succeed on subject control but fail on object control. This result is surprising, given that object control is orders of magnitude more frequent in the text data used to train such models. We examine to what degree the models are sensitive to prompting with agent-patient information, finding that raising the salience of agent and patient relations results in significant changes in the outputs of most models. Based on this observation, we leverage an existing dataset of semantic proto-role annotations (White et al. 2020) to explore the connections between control and labeling event participants with properties typically associated with agents and patients.
@inproceedings{stengel-eskin-van-durme-2022-curious,
title = "The Curious Case of Control",
author = "Stengel-Eskin, Elias and
Van Durme, Benjamin",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.760",
doi = "10.18653/v1/2022.emnlp-main.760",
pages = "11065--11076",
abstract = "Children acquiring English make systematic errors on subject control sentences even after they have reached near-adult competence (Chomsky, 1969), possibly due to heuristics based on semantic roles (Maratsos, 1974).Given the advanced fluency of large generative language models, we ask whether model outputs are consistent with these heuristics, and to what degree different models are consistent with each other. We find that models can be categorized by behavior into three separate groups, with broad differences between the groups. The outputs of models in the largest group are consistent with positional heuristics that succeed on subject control but fail on object control. This result is surprising, given that object control is orders of magnitude more frequent in the text data used to train such models. We examine to what degree the models are sensitive to prompting with agent-patient information, finding that raising the salience of agent and patient relations results in significant changes in the outputs of most models. Based on this observation, we leverage an existing dataset of semantic proto-role annotations (White et al. 2020) to explore the connections between control and labeling event participants with properties typically associated with agents and patients.",
}
Recent model pruning methods have demonstrated the ability to remove redundant parameters without sacrificing model performance. Common methods remove redundant parameters according to the parameter sensitivity, a gradient-based measure reflecting the contribution of the parameters. In this paper, however, we argue that redundant parameters can be trained to make beneficial contributions. We first highlight the large sensitivity (contribution) gap among high-sensitivity and low-sensitivity parameters and show that the model generalization performance can be significantly improved after balancing the contribution of all parameters. Our goal is to balance the sensitivity of all parameters and encourage all of them to contribute equally. We propose a general task-agnostic method, namely intra-distillation, appended to the regular training loss to balance parameter sensitivity. Moreover, we also design a novel adaptive learning method to control the strength of intra-distillation loss for faster convergence. Our experiments show the strong effectiveness of our methods on machine translation, natural language understanding, and zero-shot cross-lingual transfer across up to 48 languages, e.g., a gain of 3.54 BLEU on average across 8 language pairs from the IWSLT{‘}14 dataset.
@inproceedings{xu-etal-2022-importance,
title = "The Importance of Being Parameters: An Intra-Distillation Method for Serious Gains",
author = "Xu, Haoran and
Koehn, Philipp and
Murray, Kenton",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.13",
doi = "10.18653/v1/2022.emnlp-main.13",
pages = "170--183",
abstract = "Recent model pruning methods have demonstrated the ability to remove redundant parameters without sacrificing model performance. Common methods remove redundant parameters according to the parameter sensitivity, a gradient-based measure reflecting the contribution of the parameters. In this paper, however, we argue that redundant parameters can be trained to make beneficial contributions. We first highlight the large sensitivity (contribution) gap among high-sensitivity and low-sensitivity parameters and show that the model generalization performance can be significantly improved after balancing the contribution of all parameters. Our goal is to balance the sensitivity of all parameters and encourage all of them to contribute equally. We propose a general task-agnostic method, namely intra-distillation, appended to the regular training loss to balance parameter sensitivity. Moreover, we also design a novel adaptive learning method to control the strength of intra-distillation loss for faster convergence. Our experiments show the strong effectiveness of our methods on machine translation, natural language understanding, and zero-shot cross-lingual transfer across up to 48 languages, e.g., a gain of 3.54 BLEU on average across 8 language pairs from the IWSLT{'}14 dataset.",
}
Language diversity in NLP is critical in enabling the development of tools for a wide range of users.However, there are limited resources for building such tools for many languages, particularly those spoken in Africa.For search, most existing datasets feature few or no African languages, directly impacting researchers{‘} ability to build and improve information access capabilities in those languages.Motivated by this, we created AfriCLIRMatrix, a test collection for cross-lingual information retrieval research in 15 diverse African languages.In total, our dataset contains 6 million queries in English and 23 million relevance judgments automatically mined from Wikipedia inter-language links, covering many more African languages than any existing information retrieval test collection.In addition, we release BM25, dense retrieval, and sparse{–}dense hybrid baselines to provide a starting point for the development of future systems.We hope that these efforts can spur additional work in search for African languages.AfriCLIRMatrix can be downloaded at https://github.com/castorini/africlirmatrix.
@inproceedings{ogundepo-etal-2022-africlirmatrix,
title = "{A}fri{CLIRM}atrix: Enabling Cross-Lingual Information Retrieval for {A}frican Languages",
author = "Ogundepo, Odunayo and
Zhang, Xinyu and
Sun, Shuo and
Duh, Kevin and
Lin, Jimmy",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.597",
doi = "10.18653/v1/2022.emnlp-main.597",
pages = "8721--8728",
abstract = "Language diversity in NLP is critical in enabling the development of tools for a wide range of users.However, there are limited resources for building such tools for many languages, particularly those spoken in Africa.For search, most existing datasets feature few or no African languages, directly impacting researchers{'} ability to build and improve information access capabilities in those languages.Motivated by this, we created AfriCLIRMatrix, a test collection for cross-lingual information retrieval research in 15 diverse African languages.In total, our dataset contains 6 million queries in English and 23 million relevance judgments automatically mined from Wikipedia inter-language links, covering many more African languages than any existing information retrieval test collection.In addition, we release BM25, dense retrieval, and sparse{--}dense hybrid baselines to provide a starting point for the development of future systems.We hope that these efforts can spur additional work in search for African languages.AfriCLIRMatrix can be downloaded at https://github.com/castorini/africlirmatrix.",
}
How well can NLP models generalize to a variety of unseen tasks when provided with task instructions? To address this question, we first introduce Super-NaturalInstructions, a benchmark of 1,616 diverse NLP tasks and their expert-written instructions. Our collection covers 76 distinct task types, including but not limited to classification, extraction, infilling, sequence tagging, text rewriting, and text composition. This large and diverse collection of tasks enables rigorous benchmarking of cross-task generalization under instructions{–-}training models to follow instructions on a subset of tasks and evaluating them on the remaining unseen ones.Furthermore, we build Tk-Instruct, a transformer model trained to follow a variety of in-context instructions (plain language task definitions or k-shot examples). Our experiments show that Tk-Instruct outperforms existing instruction-following models such as InstructGPT by over 9{\%} on our benchmark despite being an order of magnitude smaller. We further analyze generalization as a function of various scaling parameters, such as the number of observed tasks, the number of instances per task, and model sizes. We hope our dataset and model facilitate future progress towards more general-purpose NLP models.
@inproceedings{wang-etal-2022-super,
title = "Super-{N}atural{I}nstructions: Generalization via Declarative Instructions on 1600+ {NLP} Tasks",
author = "Wang, Yizhong and
Mishra, Swaroop and
Alipoormolabashi, Pegah and
Kordi, Yeganeh and
Mirzaei, Amirreza and
Naik, Atharva and
Ashok, Arjun and
Dhanasekaran, Arut Selvan and
Arunkumar, Anjana and
Stap, David and
Pathak, Eshaan and
Karamanolakis, Giannis and
Lai, Haizhi and
Purohit, Ishan and
Mondal, Ishani and
Anderson, Jacob and
Kuznia, Kirby and
Doshi, Krima and
Pal, Kuntal Kumar and
Patel, Maitreya and
Moradshahi, Mehrad and
Parmar, Mihir and
Purohit, Mirali and
Varshney, Neeraj and
Kaza, Phani Rohitha and
Verma, Pulkit and
Puri, Ravsehaj Singh and
Karia, Rushang and
Doshi, Savan and
Sampat, Shailaja Keyur and
Mishra, Siddhartha and
Reddy A, Sujan and
Patro, Sumanta and
Dixit, Tanay and
Shen, Xudong",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.340",
doi = "10.18653/v1/2022.emnlp-main.340",
pages = "5085--5109",
abstract = "How well can NLP models generalize to a variety of unseen tasks when provided with task instructions? To address this question, we first introduce Super-NaturalInstructions, a benchmark of 1,616 diverse NLP tasks and their expert-written instructions. Our collection covers 76 distinct task types, including but not limited to classification, extraction, infilling, sequence tagging, text rewriting, and text composition. This large and diverse collection of tasks enables rigorous benchmarking of cross-task generalization under instructions{---}training models to follow instructions on a subset of tasks and evaluating them on the remaining unseen ones.Furthermore, we build Tk-Instruct, a transformer model trained to follow a variety of in-context instructions (plain language task definitions or k-shot examples). Our experiments show that Tk-Instruct outperforms existing instruction-following models such as InstructGPT by over 9{\%} on our benchmark despite being an order of magnitude smaller. We further analyze generalization as a function of various scaling parameters, such as the number of observed tasks, the number of instances per task, and model sizes. We hope our dataset and model facilitate future progress towards more general-purpose NLP models.",
}
@inproceedings{256033943,
title = {Cognitive and Acoustic Speech and Language Patterns Occurring in Different Neurodegenerative Disorders while Performing Neuropsychological Tests},
author = {{M. Iglesias} and {A. Favaro} and {C. Motley} and {E. Oh} and {R. Stevens} and {A. Butala} and {L. Moro-Velázquez} and {N. Dehak}},
year = 2022,
month = {12},
booktitle = {IEEE Signal Processing in Medicine and Biology Symposium},
url = {https://www.semanticscholar.org/paper/ee067fbced756c332d18a34d6d4f59ab512f9013},
}
@inproceedings{256034037,
title = {Phonatory Analysis on Parkinson's Disease Patients Attending Singing and Discussion Therapy (Parkinsonics) using Signal Processing Techniques},
author = {{C. Chen} and {L. Moro-Velázquez} and {A. Ožbolt} and {A. Butala} and {A. Pantelyat} and {N. Dehak}},
year = 2022,
month = {12},
booktitle = {IEEE Signal Processing in Medicine and Biology Symposium},
url = {https://www.semanticscholar.org/paper/513937e2300445136193356fb6fdae3753d09770},
}
@inproceedings{254880773,
title = {Artificial Intelligence Tools to Evaluate Language and Speech Patterns in Alzheimer's Disease},
author = {{A. Favaro} and {Seneca Motley} and {Quincy M. Samus} and {A. Butala} and {N. Dehak} and {Esther S. Oh} and {L. Moro-Velázquez}},
year = 2022,
month = {12},
booktitle = {Alzheimer's & Dementia},
url = {https://www.semanticscholar.org/paper/e8f74514d4b195230ddd7dd6b60cabbc7ed240b1},
}
@inproceedings{254825419,
title = {A prospective birth cohort study of maternal prenatal cigarette smoking assessed by self-report and biomarkers on childhood risk of overweight or obesity},
author = {{Wenpin Hou} and {Mingyu Zhang} and {Yuelong Ji} and {X. Hong} and {Guoying Wang} and {Richard Xu} and {L. Liang} and {S. Saria} and {Hongkai Ji}},
year = 2022,
month = {12},
booktitle = {Precision Nutrition},
url = {https://www.semanticscholar.org/paper/2304edd25b8f08b99c6992c3de6434459742ccad},
}
Hyperparameter tuning is important for achieving high accuracy in deep learning models, yet little interpretability work has focused on hyperparameters. We propose to use the Explainable Boosting Machine (EBM), a glassbox method, as a post-hoc analysis tool for understanding how hyperparameters influence model accuracy. We present a case study on Transformer models in machine translation to illustrate the kinds of insights that may be gleaned, and perform extensive analysis to test the robustness of EBM under different data conditions.
@inproceedings{deb-etal-2022-post,
title = "Post-Hoc Interpretation of Transformer Hyperparameters with Explainable Boosting Machines",
author = "Deb, Kiron and
Zhang, Xuan and
Duh, Kevin",
editor = "Bastings, Jasmijn and
Belinkov, Yonatan and
Elazar, Yanai and
Hupkes, Dieuwke and
Saphra, Naomi and
Wiegreffe, Sarah",
booktitle = "Proceedings of the Fifth BlackboxNLP Workshop on Analyzing and Interpreting Neural Networks for NLP",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates (Hybrid)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.blackboxnlp-1.5",
doi = "10.18653/v1/2022.blackboxnlp-1.5",
pages = "51--61",
abstract = "Hyperparameter tuning is important for achieving high accuracy in deep learning models, yet little interpretability work has focused on hyperparameters. We propose to use the Explainable Boosting Machine (EBM), a glassbox method, as a post-hoc analysis tool for understanding how hyperparameters influence model accuracy. We present a case study on Transformer models in machine translation to illustrate the kinds of insights that may be gleaned, and perform extensive analysis to test the robustness of EBM under different data conditions.",
}
@inproceedings{254125713,
title = {VIDM: Video Implicit Diffusion Models},
author = {{Kangfu Mei} and {Vishal M. Patel}},
year = 2022,
month = {12},
booktitle = {AAAI Conference on Artificial Intelligence},
url = {https://www.semanticscholar.org/paper/13c7b29a100f67d285eb3625c160d06882d4c092},
}
The ability to extract high-quality translation dictionaries from monolingual word embedding spaces depends critically on the geometric similarity of the spaces{–-}their degree of {“}isomorphism.{”} We address the root-cause of faulty cross-lingual mapping: that word embedding training resulted in the underlying spaces being non-isomorphic. We incorporate global measures of isomorphism directly into the skipgram loss function, successfully increasing the relative isomorphism of trained word embedding spaces and improving their ability to be mapped to a shared cross-lingual space. The result is improved bilingual lexicon induction in general data conditions, under domain mismatch, and with training algorithm dissimilarities. We release IsoVec at https://github.com/kellymarchisio/isovec.
@inproceedings{marchisio-etal-2022-isovec,
title = "{I}so{V}ec: Controlling the Relative Isomorphism of Word Embedding Spaces",
author = "Marchisio, Kelly and
Verma, Neha and
Duh, Kevin and
Koehn, Philipp",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.404",
doi = "10.18653/v1/2022.emnlp-main.404",
pages = "6019--6033",
abstract = "The ability to extract high-quality translation dictionaries from monolingual word embedding spaces depends critically on the geometric similarity of the spaces{---}their degree of {``}isomorphism.{''} We address the root-cause of faulty cross-lingual mapping: that word embedding training resulted in the underlying spaces being non-isomorphic. We incorporate global measures of isomorphism directly into the skipgram loss function, successfully increasing the relative isomorphism of trained word embedding spaces and improving their ability to be mapped to a shared cross-lingual space. The result is improved bilingual lexicon induction in general data conditions, under domain mismatch, and with training algorithm dissimilarities. We release IsoVec at https://github.com/kellymarchisio/isovec.",
}
This paper presents the results of the General Machine Translation Task organised as part of the Conference on Machine Translation (WMT) 2022. In the general MT task, participants were asked to build machine translation systems for any of 11 language pairs, to be evaluated on test sets consisting of four different domains. We evaluate system outputs with human annotators using two different techniques: reference-based direct assessment and (DA) and a combination of DA and scalar quality metric (DA+SQM).
@inproceedings{kocmi-etal-2022-findings,
title = "Findings of the 2022 Conference on Machine Translation ({WMT}22)",
author = "Kocmi, Tom and
Bawden, Rachel and
Bojar, Ond{\v{r}}ej and
Dvorkovich, Anton and
Federmann, Christian and
Fishel, Mark and
Gowda, Thamme and
Graham, Yvette and
Grundkiewicz, Roman and
Haddow, Barry and
Knowles, Rebecca and
Koehn, Philipp and
Monz, Christof and
Morishita, Makoto and
Nagata, Masaaki and
Nakazawa, Toshiaki and
Nov{\'a}k, Michal and
Popel, Martin and
Popovi{\'c}, Maja",
editor = {Koehn, Philipp and
Barrault, Lo{\"\i}c and
Bojar, Ond{\v{r}}ej and
Bougares, Fethi and
Chatterjee, Rajen and
Costa-juss{\`a}, Marta R. and
Federmann, Christian and
Fishel, Mark and
Fraser, Alexander and
Freitag, Markus and
Graham, Yvette and
Grundkiewicz, Roman and
Guzman, Paco and
Haddow, Barry and
Huck, Matthias and
Jimeno Yepes, Antonio and
Kocmi, Tom and
Martins, Andr{\'e} and
Morishita, Makoto and
Monz, Christof and
Nagata, Masaaki and
Nakazawa, Toshiaki and
Negri, Matteo and
N{\'e}v{\'e}ol, Aur{\'e}lie and
Neves, Mariana and
Popel, Martin and
Turchi, Marco and
Zampieri, Marcos},
booktitle = "Proceedings of the Seventh Conference on Machine Translation (WMT)",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates (Hybrid)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.wmt-1.1",
pages = "1--45",
abstract = "This paper presents the results of the General Machine Translation Task organised as part of the Conference on Machine Translation (WMT) 2022. In the general MT task, participants were asked to build machine translation systems for any of 11 language pairs, to be evaluated on test sets consisting of four different domains. We evaluate system outputs with human annotators using two different techniques: reference-based direct assessment and (DA) and a combination of DA and scalar quality metric (DA+SQM).",
}
@inproceedings{262383173,
title = {A prospective birth cohort study of maternal prenatal cigarette smoking assessed by self-report and biomarkers on childhood risk of overweight or obesity.},
author = {{Wenpin Hou} and {Mingyu Zhang} and {Yuelong Ji} and {X. Hong} and {Guoying Wang} and {Richard Xu} and {Liming Liang} and {S. Saria} and {Hongkai Ji}},
year = 2022,
month = {12},
booktitle = {Precision Nutrition},
url = {https://www.semanticscholar.org/paper/e898ce790bbb170c93ff44e139e83c3448b590ab},
}
In contexts where debate and deliberation are the norm, the participants are regularly presented with new information that conflicts with their original beliefs. When required to update their beliefs (belief alignment), they may choose arguments that align with their worldview (confirmation bias). We test this and competing hypotheses in a constraint-based modeling approach to predict the winning arguments in multi-party interactions in the Reddit Change My View and Intelligence Squared debates datasets. We adopt a hierarchical generative Variational Autoencoder as our model and impose structural constraints that reflect competing hypotheses about the nature of argumentation. Our findings suggest that in most settings, predictive models that anticipate winning arguments to be further from the initial argument of the opinion holder are more likely to succeed.
@inproceedings{sia-etal-2022-offer,
title = "Offer a Different Perspective: Modeling the Belief Alignment of Arguments in Multi-party Debates",
author = "Sia, Suzanna and
Jaidka, Kokil and
Ahuja, Hansin and
Chhaya, Niyati and
Duh, Kevin",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.818",
doi = "10.18653/v1/2022.emnlp-main.818",
pages = "11939--11950",
abstract = "In contexts where debate and deliberation are the norm, the participants are regularly presented with new information that conflicts with their original beliefs. When required to update their beliefs (belief alignment), they may choose arguments that align with their worldview (confirmation bias). We test this and competing hypotheses in a constraint-based modeling approach to predict the winning arguments in multi-party interactions in the Reddit Change My View and Intelligence Squared debates datasets. We adopt a hierarchical generative Variational Autoencoder as our model and impose structural constraints that reflect competing hypotheses about the nature of argumentation. Our findings suggest that in most settings, predictive models that anticipate winning arguments to be further from the initial argument of the opinion holder are more likely to succeed.",
}
We investigate model calibration in the setting of zero-shot cross-lingual transfer with large-scale pre-trained language models. The level of model calibration is an important metric for evaluating the trustworthiness of predictive models. There exists an essential need for model calibration when natural language models are deployed in critical tasks. We study different post-training calibration methods in structured and unstructured prediction tasks. We find that models trained with data from the source language become less calibrated when applied to the target language and that calibration errors increase with intrinsic task difficulty and relative sparsity of training data. Moreover, we observe a potential connection between the level of calibration error and an earlier proposed measure of the distance from English to other languages. Finally, our comparison demonstrates that among other methods Temperature Scaling (TS) generalizes well to distant languages, but TS fails to calibrate more complex confidence estimation in structured predictions compared to more expressive alternatives like Gaussian Process Calibration.
@inproceedings{jiang-etal-2022-calibrating,
title = "Calibrating Zero-shot Cross-lingual (Un-)structured Predictions",
author = "Jiang, Zhengping and
Liu, Anqi and
Van Durme, Benjamin",
editor = "Goldberg, Yoav and
Kozareva, Zornitsa and
Zhang, Yue",
booktitle = "Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.emnlp-main.170",
doi = "10.18653/v1/2022.emnlp-main.170",
pages = "2648--2674",
abstract = "We investigate model calibration in the setting of zero-shot cross-lingual transfer with large-scale pre-trained language models. The level of model calibration is an important metric for evaluating the trustworthiness of predictive models. There exists an essential need for model calibration when natural language models are deployed in critical tasks. We study different post-training calibration methods in structured and unstructured prediction tasks. We find that models trained with data from the source language become less calibrated when applied to the target language and that calibration errors increase with intrinsic task difficulty and relative sparsity of training data. Moreover, we observe a potential connection between the level of calibration error and an earlier proposed measure of the distance from English to other languages. Finally, our comparison demonstrates that among other methods Temperature Scaling (TS) generalizes well to distant languages, but TS fails to calibrate more complex confidence estimation in structured predictions compared to more expressive alternatives like Gaussian Process Calibration.",
}
@inproceedings{256034700,
title = {Analysis of Interpretable Handwriting Features to Evaluate Motoric Patterns in Different Neurodegenerative Diseases},
author = {{D. D. Kairamkonda} and {P. S. Mandaleeka} and {A. Favaro} and {C. Motley} and {A. Butala} and {E. Oh} and {R. Stevens} and {N. Dehak} and {L. Moro-Velázquez}},
year = 2022,
month = {12},
booktitle = {IEEE Signal Processing in Medicine and Biology Symposium},
url = {https://www.semanticscholar.org/paper/d10f7b6ab049a92c19e1d9c7792063e85ce60d22},
}
Expressing natural language descriptions of structured facts or relations {–} data-to-text generation (D2T) {–} increases the accessibility of structured knowledge repositories. Previous work shows that pre-trained language models (PLMs) perform remarkably well on this task after fine-tuning on a significant amount of task-specific training data. On the other hand, while auto-regressive PLMs can generalize from a few task examples, their efficacy at D2T is largely unexplored. Furthermore, we have an incomplete understanding of the limits of PLMs on D2T. In this work, we conduct an empirical study of both fine-tuned and auto-regressive PLMs on the DART multi-domain D2T dataset. We consider their performance as a function of the amount of task-specific data and how the data is incorporated into the models: zero and few-shot learning, and fine-tuning of model weights. In addition, we probe the limits of PLMs by measuring performance on subsets of the evaluation data: novel predicates and abstractive test examples. To improve the performance on these subsets, we investigate two techniques: providing predicate descriptions in the context and re-ranking generated candidates by information reflected in the source. Finally, we conduct a human evaluation of model errors and show that D2T generation tasks would benefit from datasets with more careful manual curation.
@inproceedings{keymanesh-etal-2022-makes,
title = "What Makes Data-to-Text Generation Hard for Pretrained Language Models?",
author = "Keymanesh, Moniba and
Benton, Adrian and
Dredze, Mark",
editor = "Bosselut, Antoine and
Chandu, Khyathi and
Dhole, Kaustubh and
Gangal, Varun and
Gehrmann, Sebastian and
Jernite, Yacine and
Novikova, Jekaterina and
Perez-Beltrachini, Laura",
booktitle = "Proceedings of the 2nd Workshop on Natural Language Generation, Evaluation, and Metrics (GEM)",
month = dec,
year = "2022",
address = "Abu Dhabi, United Arab Emirates (Hybrid)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.gem-1.50",
doi = "10.18653/v1/2022.gem-1.50",
pages = "539--554",
abstract = "Expressing natural language descriptions of structured facts or relations {--} data-to-text generation (D2T) {--} increases the accessibility of structured knowledge repositories. Previous work shows that pre-trained language models (PLMs) perform remarkably well on this task after fine-tuning on a significant amount of task-specific training data. On the other hand, while auto-regressive PLMs can generalize from a few task examples, their efficacy at D2T is largely unexplored. Furthermore, we have an incomplete understanding of the limits of PLMs on D2T. In this work, we conduct an empirical study of both fine-tuned and auto-regressive PLMs on the DART multi-domain D2T dataset. We consider their performance as a function of the amount of task-specific data and how the data is incorporated into the models: zero and few-shot learning, and fine-tuning of model weights. In addition, we probe the limits of PLMs by measuring performance on subsets of the evaluation data: novel predicates and abstractive test examples. To improve the performance on these subsets, we investigate two techniques: providing predicate descriptions in the context and re-ranking generated candidates by information reflected in the source. Finally, we conduct a human evaluation of model errors and show that D2T generation tasks would benefit from datasets with more careful manual curation.",
}
@inproceedings{254591386,
title = {Do Text-to-Text Multi-Task Learners Suffer from Task Conflict?},
author = {{David Mueller} and {Nicholas Andrews} and {Mark Dredze}},
year = 2022,
month = {12},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/2843661ee0d5fa159165beba50c345566cc44c57},
}
@InProceedings{svete-et-al-2022,
aclid = "2022.emnlp-main.567",
author = "Anej Svete and Benjamin Dayan and Ryan Cotterell and
Tim Vieira and Jason Eisner",
title = "Acyclic Weighted Finite-State Automata with Failure
Transitions",
booktitle = "Proceedings of the 2022 Conference on Empirical
Methods in Natural Language Processing",
pages = "8289--8305",
year = "2022",
month = dec,
address = "Abu Dhabi",
URL = "http://cs.jhu.edu/~jason/papers/#svete-et-al-2022",
}
@InProceedings{stengeleskin-et-al-2022,
aclid = "2022.emnlp-main.789",
author = "Elias Stengel-Eskin and Emmanouil Antonios Platanios
and Adam Pauls and Sam Thomson and Hao Fang and
Benjamin Van Durme and Jason Eisner and Yu Su",
title = "When More Data Hurts: {A} Troubling Quirk in
Developing Broad-Coverage Natural Language
Understanding Systems",
booktitle = "Proceedings of the 2022 Conference on Empirical
Methods in Natural Language Processing",
pages = "11473--11487",
year = "2022",
month = dec,
address = "Abu Dhabi",
URL = "http://cs.jhu.edu/~jason/papers/#stengeleskin-et-al-2022",
}
@inproceedings{253903852,
title = {Optimized Acoustic Phantom Design for Characterizing Body Sound Sensors},
author = {{V. Rennoll} and {Ian McLane} and {Mounya Elhilali} and {James E. West}},
year = 2022,
month = {11},
booktitle = {Italian National Conference on Sensors},
url = {https://www.semanticscholar.org/paper/0d7b6b5a15b47c1cd1d688f043fd06ff6822d5a1},
}
@inproceedings{253553494,
title = {AdaMAE: Adaptive Masking for Efficient Spatiotemporal Learning with Masked Autoencoders},
author = {{W. G. C. Bandara} and {Naman Patel} and {A. Gholami} and {Mehdi Nikkhah} and {M. Agrawal} and {Vishal M. Patel}},
year = 2022,
month = {11},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/a135632a05cc1f3311859fdebcd1350b4e9e1ee7},
}
@inproceedings{254069733,
title = {LUMix: Improving Mixup by Better Modelling Label Uncertainty},
author = {{Shuyang Sun} and {Jieneng Chen} and {Ruifei He} and {A. Yuille} and {Philip H. S. Torr} and {Song Bai}},
year = 2022,
month = {11},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/62ce349a6dbc58f64ae02d7203c2f9a06cf6f6d4},
}
@inproceedings{253383773,
title = {Bridging Speech and Textual Pre-Trained Models With Unsupervised ASR},
author = {{Jiatong Shi} and {Chan-Jan Hsu} and {Ho-Lam Chung} and {Dongji Gao} and {Leibny Paola García-Perera} and {Shinji Watanabe} and {Ann Lee} and {Hung-yi Lee}},
year = 2022,
month = {11},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/92302ab168429c7c3a8f699b35ba8302916c6e7c},
}
@inproceedings{253735003,
title = {SMAUG: Sparse Masked Autoencoder for Efficient Video-Language Pre-training},
author = {{Yuanze Lin} and {Chen Wei} and {Huiyu Wang} and {A. Yuille} and {Cihang Xie}},
year = 2022,
month = {11},
booktitle = {IEEE International Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/210f6ffbed4bf3a0f020cfcb48dab9d6a9939cdb},
}
Machine translation traditionally refers to translating from a single source language into a single target language. In recent years, the field has moved towards large neural models either translating from or into many languages. The model must be correctly cued to translate into the correct target language. This is typically done by prefixing language tokens onto the source or target sequence. The location and content of the prefix can vary and many use different approaches without much justification towards one approach or another. As a guidance to future researchers and directions for future work, we present a series of experiments that show how the positioning and type of a target language prefix token effects translation performance. We show that source side prefixes improve performance. Further, we find that the best language information to denote via tokens depends on the supported language set.
@inproceedings{wicks-duh-2022-effects,
title = "The Effects of Language Token Prefixing for Multilingual Machine Translation",
author = "Wicks, Rachel and
Duh, Kevin",
editor = "He, Yulan and
Ji, Heng and
Li, Sujian and
Liu, Yang and
Chang, Chua-Hui",
booktitle = "Proceedings of the 2nd Conference of the Asia-Pacific Chapter of the Association for Computational Linguistics and the 12th International Joint Conference on Natural Language Processing (Volume 2: Short Papers)",
month = nov,
year = "2022",
address = "Online only",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.aacl-short.19",
doi = "10.18653/v1/2022.aacl-short.19",
pages = "148--153",
abstract = "Machine translation traditionally refers to translating from a single source language into a single target language. In recent years, the field has moved towards large neural models either translating from or into many languages. The model must be correctly cued to translate into the correct target language. This is typically done by prefixing language tokens onto the source or target sequence. The location and content of the prefix can vary and many use different approaches without much justification towards one approach or another. As a guidance to future researchers and directions for future work, we present a series of experiments that show how the positioning and type of a target language prefix token effects translation performance. We show that source side prefixes improve performance. Further, we find that the best language information to denote via tokens depends on the supported language set.",
}
@inproceedings{253801674,
title = {On Instance-Dependent Bounds for Offline Reinforcement Learning with Linear Function Approximation},
author = {{Thanh Nguyen-Tang} and {Ming Yin} and {Sunil Gupta} and {S. Venkatesh} and {R. Arora}},
year = 2022,
month = {11},
booktitle = {AAAI Conference on Artificial Intelligence},
url = {https://www.semanticscholar.org/paper/b61a3d718a192e39a437d32a6ed4037b8c29cc41},
}
@inproceedings{253499210,
title = {Open-Set Automatic Target Recognition},
author = {{Bardia Safaei} and {VS Vibashan} and {Celso M. de Melo} and {Shuowen Hu} and {Vishal M. Patel}},
year = 2022,
month = {11},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/878d61661e35c80c0b981fe4512fbad6c55ab037},
}
@inproceedings{253244355,
title = {Adapting Self-Supervised Models to Multi-Talker Speech Recognition Using Speaker Embeddings},
author = {{Zili Huang} and {Desh Raj} and {Leibny Paola García-Perera} and {S. Khudanpur}},
year = 2022,
month = {11},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/2226b25c6656e1d7c99667b4e685cd01348e8577},
}
@inproceedings{253734941,
title = {SceneComposer: Any-Level Semantic Image Synthesis},
author = {{Yu Zeng} and {Zhe Lin} and {Jianming Zhang} and {Qing Liu} and {J. Collomosse} and {Jason Kuen} and {Vishal M. Patel}},
year = 2022,
month = {11},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/4cc5266166478592ec8539a2b940740b8d380cdd},
}
@inproceedings{253510101,
title = {Calibrated Interpretation: Confidence Estimation in Semantic Parsing},
author = {{Elias Stengel-Eskin} and {Benjamin Van Durme}},
year = 2022,
month = {11},
booktitle = {Transactions of the Association for Computational Linguistics},
url = {https://www.semanticscholar.org/paper/c428f1621f79925311082d8d7425dd4d50cd64ed},
}
@inproceedings{254125113,
title = {Operationalizing Specifications, In Addition to Test Sets for Evaluating Constrained Generative Models},
author = {{Vikas Raunak} and {Matt Post} and {Arul Menezes}},
year = 2022,
month = {11},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/ad2149957cd288a5626adcce48f9981a2ab59184},
}
@inproceedings{253510862,
title = {Language Agnostic Code-Mixing Data Augmentation by Predicting Linguistic Patterns},
author = {{Shuyue Stella Li} and {Kenton Murray}},
year = 2022,
month = {11},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/96fdfc1ba9588d1fab990d504aa590233216326a},
}
@inproceedings{254095971,
title = {Euro: Espnet Unsupervised ASR Open-Source Toolkit},
author = {{Dongji Gao} and {Jiatong Shi} and {Shun-Po Chuang} and {Leibny Paola García-Perera} and {Hung-yi Lee} and {Shinji Watanabe} and {S. Khudanpur}},
year = 2022,
month = {11},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/012771aa3a8d59401d22fade9416dbaad22f42b1},
}
@inproceedings{252735237,
title = {Ambiguous Images With Human Judgments for Robust Visual Event Classification},
author = {{Kate Sanders} and {Reno Kriz} and {Anqi Liu} and {Benjamin Van Durme}},
year = 2022,
month = {10},
booktitle = {Neural Information Processing Systems},
url = {https://www.semanticscholar.org/paper/2a55f57716576fdd5840252d673aabe9a676fced},
}
@inproceedings{253098673,
title = {1st Place Solution of The Robust Vision Challenge (RVC) 2022 Semantic Segmentation Track},
author = {{Junfei Xiao} and {Zhichao Xu} and {Shiyi Lan} and {Zhiding Yu} and {A. Yuille} and {Anima Anandkumar}},
year = 2022,
month = {10},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/17a6bee0ef616822d8a883f6bc373dd676242793},
}
@inproceedings{253117124,
title = {Synthetic Tumors Make AI Segment Tumors Better},
author = {{Qixing Hu} and {Junfei Xiao} and {Yixiong Chen} and {Shuwen Sun} and {Jieneng Chen} and {A. Yuille} and {Zongwei Zhou}},
year = 2022,
month = {10},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/0077f46c9cf3de56319aad65e419131e2466b848},
}
@inproceedings{253347117,
title = {Mixture of Teacher Experts for Source-Free Domain Adaptive Object Detection},
author = {{VS Vibashan} and {Poojan Oza} and {Vishwanath A. Sindagi} and {Vishal M. Patel}},
year = 2022,
month = {10},
booktitle = {International Conference on Information Photonics},
url = {https://www.semanticscholar.org/paper/96a609d83a2aaf739fedc4cbfa3f96b14ae234cb},
}
@inproceedings{252715598,
title = {MOAT: Alternating Mobile Convolution and Attention Brings Strong Vision Models},
author = {{Chenglin Yang} and {Siyuan Qiao} and {Qihang Yu} and {Xiaoding Yuan} and {Yukun Zhu} and {A. Yuille} and {Hartwig Adam} and {Liang-Chieh Chen}},
year = 2022,
month = {10},
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/a8a2a8229f99c291bf71ec92b801a073854c52e2},
}
@inproceedings{252726978,
title = {Imbalanced regression for intensity series of pain expression from videos by regularizing spatio-temporal face nets},
author = {{Xiang Xiang} and {Feng Wang} and {Yuwen Tan} and {A. Yuille}},
year = 2022,
month = {10},
booktitle = {Pattern Recognition Letters},
url = {https://www.semanticscholar.org/paper/e9eab79d381d7799e74afd9917e91d47953aa69d},
}
@inproceedings{252780362,
title = {Multi-Modal Human Authentication Using Silhouettes, Gait and RGB},
author = {{Yuxiang Guo} and {Cheng Peng} and {Chun Pong Lau} and {R. Chellappa}},
year = 2022,
month = {10},
booktitle = {IEEE International Conference on Automatic Face & Gesture Recognition},
url = {https://www.semanticscholar.org/paper/e89d9b5c7b5d9c4b490ba1d5fdbbca423920c3e1},
}
@inproceedings{253244506,
title = {Generating Sequences by Learning to Self-Correct},
author = {{S. Welleck} and {Ximing Lu} and {Peter West} and {Faeze Brahman} and {T. Shen} and {Daniel Khashabi} and {Yejin Choi}},
year = 2022,
month = {10},
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/538288d24bdad73d831dfed44b706958287ed318},
}
@inproceedings{253080413,
title = {Context-Enhanced Stereo Transformer},
author = {{Weiyu Guo} and {Zhaoshuo Li} and {Yongkui Yang} and {Z. Wang} and {Russell H. Taylor} and {M. Unberath} and {A. Yuille} and {Yingwei Li}},
year = 2022,
month = {10},
booktitle = {European Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/3fe123f4777bcb86d796de230b3767c15f28ed7d},
}
@inproceedings{253116576,
title = {Reducing Language Confusion for Code-Switching Speech Recognition with Token-Level Language Diarization},
author = {{Hexin Liu} and {Haihua Xu} and {Leibny Paola García} and {Andy W. H. Khong} and {Yi He} and {S. Khudanpur}},
year = 2022,
month = {10},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/1fab5a425ad712bb8245741c5abec00aa80fc123},
}
This paper presents a detailed foundational empirical case study of the nature of out-of-vocabulary words encountered in modern text in a moderate-resource language such as Bulgarian, and a multi-faceted distributional analysis of the underlying word-formation processes that can aid in their compositional translation, tagging, parsing, language modeling, and other NLP tasks. Given that out-of-vocabulary (OOV) words generally present a key open challenge to NLP and machine translation systems, especially toward the lower limit of resource availability, there are useful practical insights, as well as corpus-linguistic insights, from both a detailed manual and automatic taxonomic analysis of the types, multidimensional properties, and processing potential for multiple representative OOV data samples.
@inproceedings{botev-etal-2022-deciphering,
title = "Deciphering and Characterizing Out-of-Vocabulary Words for Morphologically Rich Languages",
author = "Botev, Georgie and
McCarthy, Arya D. and
Wu, Winston and
Yarowsky, David",
editor = "Calzolari, Nicoletta and
Huang, Chu-Ren and
Kim, Hansaem and
Pustejovsky, James and
Wanner, Leo and
Choi, Key-Sun and
Ryu, Pum-Mo and
Chen, Hsin-Hsi and
Donatelli, Lucia and
Ji, Heng and
Kurohashi, Sadao and
Paggio, Patrizia and
Xue, Nianwen and
Kim, Seokhwan and
Hahm, Younggyun and
He, Zhong and
Lee, Tony Kyungil and
Santus, Enrico and
Bond, Francis and
Na, Seung-Hoon",
booktitle = "Proceedings of the 29th International Conference on Computational Linguistics",
month = oct,
year = "2022",
address = "Gyeongju, Republic of Korea",
publisher = "International Committee on Computational Linguistics",
url = "https://aclanthology.org/2022.coling-1.472",
pages = "5309--5326",
abstract = "This paper presents a detailed foundational empirical case study of the nature of out-of-vocabulary words encountered in modern text in a moderate-resource language such as Bulgarian, and a multi-faceted distributional analysis of the underlying word-formation processes that can aid in their compositional translation, tagging, parsing, language modeling, and other NLP tasks. Given that out-of-vocabulary (OOV) words generally present a key open challenge to NLP and machine translation systems, especially toward the lower limit of resource availability, there are useful practical insights, as well as corpus-linguistic insights, from both a detailed manual and automatic taxonomic analysis of the types, multidimensional properties, and processing potential for multiple representative OOV data samples.",
}
Translating into low-resource languages is challenging due to the scarcity of training data. In this paper, we propose a probabilistic lexical translation method that bridges through lexical relations including synonyms, hypernyms, hyponyms, and co-hyponyms. This method, which only requires a dictionary like Wiktionary and a lexical database like WordNet, enables the translation of unknown vocabulary into low-resource languages for which we may only know the translation of a related concept. Experiments on translating a core vocabulary set into 472 languages, most of them low-resource, show the effectiveness of our approach.
@inproceedings{wu-yarowsky-2022-known,
title = "Known Words Will Do: Unknown Concept Translation via Lexical Relations",
author = "Wu, Winston and
Yarowsky, David",
editor = "Ojha, Atul Kr. and
Liu, Chao-Hong and
Vylomova, Ekaterina and
Abbott, Jade and
Washington, Jonathan and
Oco, Nathaniel and
Pirinen, Tommi A and
Malykh, Valentin and
Logacheva, Varvara and
Zhao, Xiaobing",
booktitle = "Proceedings of the Fifth Workshop on Technologies for Machine Translation of Low-Resource Languages (LoResMT 2022)",
month = oct,
year = "2022",
address = "Gyeongju, Republic of Korea",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.loresmt-1.3",
pages = "15--22",
abstract = "Translating into low-resource languages is challenging due to the scarcity of training data. In this paper, we propose a probabilistic lexical translation method that bridges through lexical relations including synonyms, hypernyms, hyponyms, and co-hyponyms. This method, which only requires a dictionary like Wiktionary and a lexical database like WordNet, enables the translation of unknown vocabulary into low-resource languages for which we may only know the translation of a related concept. Experiments on translating a core vocabulary set into 472 languages, most of them low-resource, show the effectiveness of our approach.",
}
Researchers across disciplines use Twitter geolocation tools to filter data for desired locations. These tools have largely been trained and tested on English tweets, often originating in the United States from almost a decade ago. Despite the importance of these tools for data curation, the impact of tweet language, country of origin, and creation date on tool performance remains largely unknown. We explore these issues with Carmen, a popular tool for Twitter geolocation. To support this study we introduce Carmen 2.0, a major update which includes the incorporation of GeoNames, a gazetteer that provides much broader coverage of locations. We evaluate using two new Twitter datasets, one for multilingual, multiyear geolocation evaluation, and another for usage trends over time. We found that language, country origin, and time does impact geolocation tool performance.
@inproceedings{zhang-etal-2022-changes,
title = "Changes in Tweet Geolocation over Time: A Study with Carmen 2.0",
author = "Zhang, Jingyu and
DeLucia, Alexandra and
Dredze, Mark",
booktitle = "Proceedings of the Eighth Workshop on Noisy User-generated Text (W-NUT 2022)",
month = oct,
year = "2022",
address = "Gyeongju, Republic of Korea",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.wnut-1.1",
pages = "1--14",
abstract = "Researchers across disciplines use Twitter geolocation tools to filter data for desired locations. These tools have largely been trained and tested on English tweets, often originating in the United States from almost a decade ago. Despite the importance of these tools for data curation, the impact of tweet language, country of origin, and creation date on tool performance remains largely unknown. We explore these issues with Carmen, a popular tool for Twitter geolocation. To support this study we introduce Carmen 2.0, a major update which includes the incorporation of GeoNames, a gazetteer that provides much broader coverage of locations. We evaluate using two new Twitter datasets, one for multilingual, multiyear geolocation evaluation, and another for usage trends over time. We found that language, country origin, and time does impact geolocation tool performance.",
}
@inproceedings{252715847,
title = {Making Your First Choice: To Address Cold Start Problem in Vision Active Learning},
author = {{Liangyu Chen} and {Yutong Bai} and {Siyu Huang} and {Yongyi Lu} and {B. Wen} and {A. Yuille} and {Zongwei Zhou}},
year = 2022,
month = {10},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/a4af00f50f0b397b14ae5dc22e0e766c31adaaa8},
}
@inproceedings{253098023,
title = {Delving into Masked Autoencoders for Multi-Label Thorax Disease Classification},
author = {{Junfei Xiao} and {Yutong Bai} and {A. Yuille} and {Zongwei Zhou}},
year = 2022,
month = {10},
booktitle = {IEEE Workshop/Winter Conference on Applications of Computer Vision},
url = {https://www.semanticscholar.org/paper/249e00445585586214e27d1f4ade032533132d0a},
}
@inproceedings{254853697,
title = {A Brief Survey on Person Recognition at a Distance},
author = {{Chris Nalty} and {Neehar Peri} and {Joshua Gleason} and {C. Castillo} and {Shuowen Hu} and {T. Bourlai} and {R. Chellappa}},
year = 2022,
month = {10},
booktitle = {Asilomar Conference on Signals, Systems and Computers},
url = {https://www.semanticscholar.org/paper/6934bd40d21e3bddce5328d29a7e1083e21d0aad},
}
@inproceedings{251829168,
title = {Efficient Self-Supervised Learning Representations for Spoken Language Identification},
author = {{Hexin Liu} and {Leibny Paola García-Perera} and {Andy W. H. Khong} and {E. Chng} and {S. Styles} and {S. Khudanpur}},
year = 2022,
month = {10},
booktitle = {IEEE Journal on Selected Topics in Signal Processing},
url = {https://www.semanticscholar.org/paper/130693386f2f7b7c1a98c4298c4ed27b9a56f79e},
}
@inproceedings{252762304,
title = {Mutual Learning of Single- and Multi-Channel End-to-End Neural Diarization},
author = {{Shota Horiguchi} and {Yuki Takashima} and {Shinji Watanabe} and {Leibny Paola García-Perera}},
year = 2022,
month = {10},
booktitle = {Spoken Language Technology Workshop},
url = {https://www.semanticscholar.org/paper/30472f3386177fb929a8454cbbb70462e30d9c61},
}
Very large language models have been shown to translate with few-shot in-context examples. However, they have not achieved state-of-art results for translating out of English. In this work, we investigate an extremely lightweight fixed-parameter method for conditioning a large language model to better translate into the target language. Our method introduces additional embeddings, known as prefix embeddings which do not interfere with the existing weights of the model. Using unsupervised and weakly semi-supervised methods that train only 0.0001{\%} of the model parameters, the simple method improves {\textasciitilde}0.2-1.3 BLEU points across 3 domains and 3 languages. We analyze the resulting embeddings{‘} training dynamics, and where they lie in the embedding space, and show that our trained embeddings can be used for both in-context translation, and diverse generation of the target sentence.
@inproceedings{sia-duh-2022-prefix,
title = "Prefix Embeddings for In-context Machine Translation",
author = "Sia, Suzanna and
Duh, Kevin",
editor = "Duh, Kevin and
Guzm{\'a}n, Francisco",
booktitle = "Proceedings of the 15th biennial conference of the Association for Machine Translation in the Americas (Volume 1: Research Track)",
month = sep,
year = "2022",
address = "Orlando, USA",
publisher = "Association for Machine Translation in the Americas",
url = "https://aclanthology.org/2022.amta-research.4",
pages = "45--57",
abstract = "Very large language models have been shown to translate with few-shot in-context examples. However, they have not achieved state-of-art results for translating out of English. In this work, we investigate an extremely lightweight fixed-parameter method for conditioning a large language model to better translate into the target language. Our method introduces additional embeddings, known as prefix embeddings which do not interfere with the existing weights of the model. Using unsupervised and weakly semi-supervised methods that train only 0.0001{\%} of the model parameters, the simple method improves {\textasciitilde}0.2-1.3 BLEU points across 3 domains and 3 languages. We analyze the resulting embeddings{'} training dynamics, and where they lie in the embedding space, and show that our trained embeddings can be used for both in-context translation, and diverse generation of the target sentence.",
}
Obtaining meaningful quality scores for machine translation systems through human evaluation remains a challenge given the high variability between human evaluators, partly due to subjective expectations for translation quality for different language pairs. We propose a new metric called XSTS that is more focused on semantic equivalence and a cross-lingual calibration method that enables more consistent assessment. We demonstrate the effectiveness of these novel contributions in large scale evaluation studies across up to 14 language pairs, with translation both into and out of English.
@inproceedings{licht-etal-2022-consistent,
title = "Consistent Human Evaluation of Machine Translation across Language Pairs",
author = "Licht, Daniel and
Gao, Cynthia and
Lam, Janice and
Guzman, Francisco and
Diab, Mona and
Koehn, Philipp",
editor = "Duh, Kevin and
Guzm{\'a}n, Francisco",
booktitle = "Proceedings of the 15th biennial conference of the Association for Machine Translation in the Americas (Volume 1: Research Track)",
month = sep,
year = "2022",
address = "Orlando, USA",
publisher = "Association for Machine Translation in the Americas",
url = "https://aclanthology.org/2022.amta-research.24",
pages = "309--321",
abstract = "Obtaining meaningful quality scores for machine translation systems through human evaluation remains a challenge given the high variability between human evaluators, partly due to subjective expectations for translation quality for different language pairs. We propose a new metric called XSTS that is more focused on semantic equivalence and a cross-lingual calibration method that enables more consistent assessment. We demonstrate the effectiveness of these novel contributions in large scale evaluation studies across up to 14 language pairs, with translation both into and out of English.",
}
Pretrained multilingual sequence-to-sequence models have been successful in improving translation performance for mid- and lower-resourced languages. However, it is unclear if these models are helpful in the domain adaptation setting, and if so, how to best adapt them to both the domain and translation language pair. Therefore, in this work, we propose two major fine-tuning strategies: our language-first approach first learns the translation language pair via general bitext, followed by the domain via in-domain bitext, and our domain-first approach first learns the domain via multilingual in-domain bitext, followed by the language pair via language pair-specific in-domain bitext. We test our approach on 3 domains at different levels of data availability, and 5 language pairs. We find that models using an mBART initialization generally outperform those using a random Transformer initialization. This holds for languages even outside of mBART{‘}s pretraining set, and can result in improvements of over +10 BLEU. Additionally, we find that via our domain-first approach, fine-tuning across multilingual in-domain corpora can lead to stark improvements in domain adaptation without sourcing additional out-of-domain bitext. In larger domain availability settings, our domain-first approach can be competitive with our language-first approach, even when using over 50X less data.
@inproceedings{verma-etal-2022-strategies,
title = "Strategies for Adapting Multilingual Pre-training for Domain-Specific Machine Translation",
author = "Verma, Neha and
Murray, Kenton and
Duh, Kevin",
editor = "Duh, Kevin and
Guzm{\'a}n, Francisco",
booktitle = "Proceedings of the 15th biennial conference of the Association for Machine Translation in the Americas (Volume 1: Research Track)",
month = sep,
year = "2022",
address = "Orlando, USA",
publisher = "Association for Machine Translation in the Americas",
url = "https://aclanthology.org/2022.amta-research.3",
pages = "31--44",
abstract = "Pretrained multilingual sequence-to-sequence models have been successful in improving translation performance for mid- and lower-resourced languages. However, it is unclear if these models are helpful in the domain adaptation setting, and if so, how to best adapt them to both the domain and translation language pair. Therefore, in this work, we propose two major fine-tuning strategies: our language-first approach first learns the translation language pair via general bitext, followed by the domain via in-domain bitext, and our domain-first approach first learns the domain via multilingual in-domain bitext, followed by the language pair via language pair-specific in-domain bitext. We test our approach on 3 domains at different levels of data availability, and 5 language pairs. We find that models using an mBART initialization generally outperform those using a random Transformer initialization. This holds for languages even outside of mBART{'}s pretraining set, and can result in improvements of over +10 BLEU. Additionally, we find that via our domain-first approach, fine-tuning across multilingual in-domain corpora can lead to stark improvements in domain adaptation without sourcing additional out-of-domain bitext. In larger domain availability settings, our domain-first approach can be competitive with our language-first approach, even when using over 50X less data.",
}
Neural Machine Translation (NMT) models are known to suffer from noisy inputs. To make models robust, we generate adversarial augmentation samples that attack the model and preserve the source-side meaning at the same time. To generate such samples, we propose a doubly-trained architecture that pairs two NMT models of opposite translation directions with a joint loss function, which combines the target-side attack and the source-side semantic similarity constraint. The results from our experiments across three different language pairs and two evaluation metrics show that these adversarial samples improve model robustness.
@inproceedings{tan-etal-2022-doubly,
title = "Doubly-Trained Adversarial Data Augmentation for Neural Machine Translation",
author = "Tan, Weiting and
Ding, Shuoyang and
Khayrallah, Huda and
Koehn, Philipp",
editor = "Duh, Kevin and
Guzm{\'a}n, Francisco",
booktitle = "Proceedings of the 15th biennial conference of the Association for Machine Translation in the Americas (Volume 1: Research Track)",
month = sep,
year = "2022",
address = "Orlando, USA",
publisher = "Association for Machine Translation in the Americas",
url = "https://aclanthology.org/2022.amta-research.12",
pages = "157--174",
abstract = "Neural Machine Translation (NMT) models are known to suffer from noisy inputs. To make models robust, we generate adversarial augmentation samples that attack the model and preserve the source-side meaning at the same time. To generate such samples, we propose a doubly-trained architecture that pairs two NMT models of opposite translation directions with a joint loss function, which combines the target-side attack and the source-side semantic similarity constraint. The results from our experiments across three different language pairs and two evaluation metrics show that these adversarial samples improve model robustness.",
}
The standard approach for inducing narrative chains considers statistics gathered per individual document. We consider whether statistics gathered using cross-document relations can lead to improved chain induction. Our study is motivated by legal narratives, where cases typically cite thematically similar cases. We consider four novel variations on pointwise mutual information (PMI), each accounting for cross-document relations in a different way. One proposed PMI variation performs 58{\%} better relative to standard PMI on recall@50 and induces qualitatively better narrative chains.
@inproceedings{blair-stanek-van-durme-2022-improved,
title = "Improved Induction of Narrative Chains via Cross-Document Relations",
author = "Blair-stanek, Andrew and
Van Durme, Benjamin",
editor = "Nastase, Vivi and
Pavlick, Ellie and
Pilehvar, Mohammad Taher and
Camacho-Collados, Jose and
Raganato, Alessandro",
booktitle = "Proceedings of the 11th Joint Conference on Lexical and Computational Semantics",
month = jul,
year = "2022",
address = "Seattle, Washington",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.starsem-1.18",
doi = "10.18653/v1/2022.starsem-1.18",
pages = "208--212",
abstract = "The standard approach for inducing narrative chains considers statistics gathered per individual document. We consider whether statistics gathered using cross-document relations can lead to improved chain induction. Our study is motivated by legal narratives, where cases typically cite thematically similar cases. We consider four novel variations on pointwise mutual information (PMI), each accounting for cross-document relations in a different way. One proposed PMI variation performs 58{\%} better relative to standard PMI on recall@50 and induces qualitatively better narrative chains.",
}
Since the advent of Federated Learning (FL), research has applied these methods to natural language processing (NLP) tasks. Despite a plethora of papers in FL for NLP, no previous works have studied how multilingual text impacts FL algorithms. Furthermore, multilingual text provides an interesting avenue to examine the impact of non-IID text (e.g. different languages) on FL in naturally occurring data. We explore three multilingual language tasks, language modeling, machine translation, and text classification using differing federated and non-federated learning algorithms. Our results show that using pretrained models reduces the negative effects of FL, helping them to perform near or better than centralized (no privacy) learning, even when using non-IID partitioning.
@inproceedings{weller-etal-2022-pretrained,
title = "Pretrained Models for Multilingual Federated Learning",
author = "Weller, Orion and
Marone, Marc and
Braverman, Vladimir and
Lawrie, Dawn and
Van Durme, Benjamin",
editor = "Carpuat, Marine and
de Marneffe, Marie-Catherine and
Meza Ruiz, Ivan Vladimir",
booktitle = "Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies",
month = jul,
year = "2022",
address = "Seattle, United States",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.naacl-main.101",
doi = "10.18653/v1/2022.naacl-main.101",
pages = "1413--1421",
abstract = "Since the advent of Federated Learning (FL), research has applied these methods to natural language processing (NLP) tasks. Despite a plethora of papers in FL for NLP, no previous works have studied how multilingual text impacts FL algorithms. Furthermore, multilingual text provides an interesting avenue to examine the impact of non-IID text (e.g. different languages) on FL in naturally occurring data. We explore three multilingual language tasks, language modeling, machine translation, and text classification using differing federated and non-federated learning algorithms. Our results show that using pretrained models reduces the negative effects of FL, helping them to perform near or better than centralized (no privacy) learning, even when using non-IID partitioning.",
}
Models of mental health based on natural language processing can uncover latent signals of mental health from language. Models that indicate whether an individual is depressed, or has other mental health conditions, can aid in diagnosis and treatment. A critical aspect of integration of these models into the clinical setting relies on explaining their behavior to domain experts. In the case of mental health diagnosis, clinicians already rely on an assessment framework to make these decisions; that framework can help a model generate meaningful explanations. In this work we propose to use PHQ-9 categories as an auxiliary task to explaining a social media based model of depression. We develop a multi-task learning framework that predicts both depression and PHQ-9 categories as auxiliary tasks. We compare the quality of explanations generated based on the depression task only, versus those that use the predicted PHQ-9 categories. We find that by relying on clinically meaningful auxiliary tasks, we produce more meaningful explanations.
@inproceedings{zirikly-dredze-2022-explaining,
title = "Explaining Models of Mental Health via Clinically Grounded Auxiliary Tasks",
author = "Zirikly, Ayah and
Dredze, Mark",
editor = "Zirikly, Ayah and
Atzil-Slonim, Dana and
Liakata, Maria and
Bedrick, Steven and
Desmet, Bart and
Ireland, Molly and
Lee, Andrew and
MacAvaney, Sean and
Purver, Matthew and
Resnik, Rebecca and
Yates, Andrew",
booktitle = "Proceedings of the Eighth Workshop on Computational Linguistics and Clinical Psychology",
month = jul,
year = "2022",
address = "Seattle, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.clpsych-1.3",
doi = "10.18653/v1/2022.clpsych-1.3",
pages = "30--39",
abstract = "Models of mental health based on natural language processing can uncover latent signals of mental health from language. Models that indicate whether an individual is depressed, or has other mental health conditions, can aid in diagnosis and treatment. A critical aspect of integration of these models into the clinical setting relies on explaining their behavior to domain experts. In the case of mental health diagnosis, clinicians already rely on an assessment framework to make these decisions; that framework can help a model generate meaningful explanations. In this work we propose to use PHQ-9 categories as an auxiliary task to explaining a social media based model of depression. We develop a multi-task learning framework that predicts both depression and PHQ-9 categories as auxiliary tasks. We compare the quality of explanations generated based on the depression task only, versus those that use the predicted PHQ-9 categories. We find that by relying on clinically meaningful auxiliary tasks, we produce more meaningful explanations.",
}
We provide an overview of the CLPsych 2022 Shared Task, which focusses on the automatic identification of {`}Moments of Change{‘} in lon- gitudinal posts by individuals on social media and its connection with information regarding mental health . This year{‘}s task introduced the notion of longitudinal modelling of the text generated by an individual online over time, along with appropriate temporally sen- sitive evaluation metrics. The Shared Task con- sisted of two subtasks: (a) the main task of cap- turing changes in an individual{‘}s mood (dras- tic changes-{`}Switches{‘}- and gradual changes -{`}Escalations{‘}- on the basis of textual content shared online; and subsequently (b) the sub- task of identifying the suicide risk level of an individual {–} a continuation of the CLPsych 2019 Shared Task{–} where participants were encouraged to explore how the identification of changes in mood in task (a) can help with assessing suicidality risk in task (b).
@inproceedings{tsakalidis-etal-2022-overview,
title = "Overview of the {CLP}sych 2022 Shared Task: Capturing Moments of Change in Longitudinal User Posts",
author = "Tsakalidis, Adam and
Chim, Jenny and
Bilal, Iman Munire and
Zirikly, Ayah and
Atzil-Slonim, Dana and
Nanni, Federico and
Resnik, Philip and
Gaur, Manas and
Roy, Kaushik and
Inkster, Becky and
Leintz, Jeff and
Liakata, Maria",
editor = "Zirikly, Ayah and
Atzil-Slonim, Dana and
Liakata, Maria and
Bedrick, Steven and
Desmet, Bart and
Ireland, Molly and
Lee, Andrew and
MacAvaney, Sean and
Purver, Matthew and
Resnik, Rebecca and
Yates, Andrew",
booktitle = "Proceedings of the Eighth Workshop on Computational Linguistics and Clinical Psychology",
month = jul,
year = "2022",
address = "Seattle, USA",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.clpsych-1.16",
doi = "10.18653/v1/2022.clpsych-1.16",
pages = "184--198",
abstract = "We provide an overview of the CLPsych 2022 Shared Task, which focusses on the automatic identification of {`}Moments of Change{'} in lon- gitudinal posts by individuals on social media and its connection with information regarding mental health . This year{'}s task introduced the notion of longitudinal modelling of the text generated by an individual online over time, along with appropriate temporally sen- sitive evaluation metrics. The Shared Task con- sisted of two subtasks: (a) the main task of cap- turing changes in an individual{'}s mood (dras- tic changes-{`}Switches{'}- and gradual changes -{`}Escalations{'}- on the basis of textual content shared online; and subsequently (b) the sub- task of identifying the suicide risk level of an individual {--} a continuation of the CLPsych 2019 Shared Task{--} where participants were encouraged to explore how the identification of changes in mood in task (a) can help with assessing suicidality risk in task (b).",
}
Non-Player Characters (NPCs) significantly enhance the player experience in many games. Historically, players{‘} interactions with NPCs have tended to be highly scripted, to be limited to natural language responses to be selected by the player, and to not involve dynamic change in game state. In this work, we demonstrate that use of a few example conversational prompts can power a conversational agent to generate both natural language and novel code. This approach can permit development of NPCs with which players can have grounded conversations that are free-form and less repetitive. We demonstrate our approach using OpenAI Codex (GPT-3 finetuned on GitHub), with Minecraft game development as our test bed. We show that with a few example prompts, a Codex-based agent can generate novel code, hold multi-turn conversations and answer questions about structured data. We evaluate this application using experienced gamers in a Minecraft realm and provide analysis of failure cases and suggest possible directions for solutions.
@inproceedings{volum-etal-2022-craft,
title = "Craft an Iron Sword: Dynamically Generating Interactive Game Characters by Prompting Large Language Models Tuned on Code",
author = "Volum, Ryan and
Rao, Sudha and
Xu, Michael and
DesGarennes, Gabriel and
Brockett, Chris and
Van Durme, Benjamin and
Deng, Olivia and
Malhotra, Akanksha and
Dolan, Bill",
editor = "C{\^o}t{\'e}, Marc-Alexandre and
Yuan, Xingdi and
Ammanabrolu, Prithviraj",
booktitle = "Proceedings of the 3rd Wordplay: When Language Meets Games Workshop (Wordplay 2022)",
month = jul,
year = "2022",
address = "Seattle, United States",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.wordplay-1.3",
doi = "10.18653/v1/2022.wordplay-1.3",
pages = "25--43",
abstract = "Non-Player Characters (NPCs) significantly enhance the player experience in many games. Historically, players{'} interactions with NPCs have tended to be highly scripted, to be limited to natural language responses to be selected by the player, and to not involve dynamic change in game state. In this work, we demonstrate that use of a few example conversational prompts can power a conversational agent to generate both natural language and novel code. This approach can permit development of NPCs with which players can have grounded conversations that are free-form and less repetitive. We demonstrate our approach using OpenAI Codex (GPT-3 finetuned on GitHub), with Minecraft game development as our test bed. We show that with a few example prompts, a Codex-based agent can generate novel code, hold multi-turn conversations and answer questions about structured data. We evaluate this application using experienced gamers in a Minecraft realm and provide analysis of failure cases and suggest possible directions for solutions.",
}
Our commonsense knowledge about objects includes their typical visual attributes; we know that bananas are typically yellow or green, and not purple. Text and image corpora, being subject to reporting bias, represent this world-knowledge to varying degrees of faithfulness. In this paper, we investigate to what degree unimodal (language-only) and multimodal (image and language) models capture a broad range of visually salient attributes. To that end, we create the Visual Commonsense Tests (ViComTe) dataset covering 5 property types (color, shape, material, size, and visual co-occurrence) for over 5000 subjects. We validate this dataset by showing that our grounded color data correlates much better than ungrounded text-only data with crowdsourced color judgments provided by Paik et al. (2021). We then use our dataset to evaluate pretrained unimodal models and multimodal models. Our results indicate that multimodal models better reconstruct attribute distributions, but are still subject to reporting bias. Moreover, increasing model size does not enhance performance, suggesting that the key to visual commonsense lies in the data.
@inproceedings{zhang-etal-2022-visual,
title = "Visual Commonsense in Pretrained Unimodal and Multimodal Models",
author = "Zhang, Chenyu and
Van Durme, Benjamin and
Li, Zhuowan and
Stengel-Eskin, Elias",
editor = "Carpuat, Marine and
de Marneffe, Marie-Catherine and
Meza Ruiz, Ivan Vladimir",
booktitle = "Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies",
month = jul,
year = "2022",
address = "Seattle, United States",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.naacl-main.390",
doi = "10.18653/v1/2022.naacl-main.390",
pages = "5321--5335",
abstract = "Our commonsense knowledge about objects includes their typical visual attributes; we know that bananas are typically yellow or green, and not purple. Text and image corpora, being subject to reporting bias, represent this world-knowledge to varying degrees of faithfulness. In this paper, we investigate to what degree unimodal (language-only) and multimodal (image and language) models capture a broad range of visually salient attributes. To that end, we create the Visual Commonsense Tests (ViComTe) dataset covering 5 property types (color, shape, material, size, and visual co-occurrence) for over 5000 subjects. We validate this dataset by showing that our grounded color data correlates much better than ungrounded text-only data with crowdsourced color judgments provided by Paik et al. (2021). We then use our dataset to evaluate pretrained unimodal models and multimodal models. Our results indicate that multimodal models better reconstruct attribute distributions, but are still subject to reporting bias. Moreover, increasing model size does not enhance performance, suggesting that the key to visual commonsense lies in the data.",
}
Large language models can perform semantic parsing with little training data, when prompted with in-context examples. It has been shown that this can be improved by formulating the problem as paraphrasing into canonical utterances, which casts the underlying meaning representation into a controlled natural language-like representation. Intuitively, such models can more easily output canonical utterances as they are closer to the natural language used for pre-training. Recently, models also pre-trained on code, like OpenAI Codex, have risen in prominence. For semantic parsing tasks where we map natural language into code, such models may prove more adept at it. In this paper, we test this hypothesis and find that Codex performs better on such tasks than equivalent GPT-3 models. We evaluate on Overnight and SMCalFlow and find that unlike GPT-3, Codex performs similarly when targeting meaning representations directly, perhaps because meaning representations are structured similar to code in these datasets.
@inproceedings{shin-van-durme-2022-shot,
title = "Few-Shot Semantic Parsing with Language Models Trained on Code",
author = "Shin, Richard and
Van Durme, Benjamin",
editor = "Carpuat, Marine and
de Marneffe, Marie-Catherine and
Meza Ruiz, Ivan Vladimir",
booktitle = "Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies",
month = jul,
year = "2022",
address = "Seattle, United States",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.naacl-main.396",
doi = "10.18653/v1/2022.naacl-main.396",
pages = "5417--5425",
abstract = "Large language models can perform semantic parsing with little training data, when prompted with in-context examples. It has been shown that this can be improved by formulating the problem as paraphrasing into canonical utterances, which casts the underlying meaning representation into a controlled natural language-like representation. Intuitively, such models can more easily output canonical utterances as they are closer to the natural language used for pre-training. Recently, models also pre-trained on code, like OpenAI Codex, have risen in prominence. For semantic parsing tasks where we map natural language into code, such models may prove more adept at it. In this paper, we test this hypothesis and find that Codex performs better on such tasks than equivalent GPT-3 models. We evaluate on Overnight and SMCalFlow and find that unlike GPT-3, Codex performs similarly when targeting meaning representations directly, perhaps because meaning representations are structured similar to code in these datasets.",
}
Translation of the noisy, informal language found in social media has been an understudied problem, with a principal factor being the limited availability of translation corpora in many languages. To address this need we have developed a new corpus containing over 200,000 translations of microblog posts that supports translation of thirteen languages into English. The languages are: Arabic, Chinese, Farsi, French, German, Hindi, Korean, Pashto, Portuguese, Russian, Spanish, Tagalog, and Urdu. We are releasing these data as the Multilingual Microblog Translation Corpus to support futher research in translation of informal language. We establish baselines using this new resource, and we further demonstrate the utility of the corpus by conducting experiments with fine-tuning to improve translation quality from a high performing neural machine translation (NMT) system. Fine-tuning provided substantial gains, ranging from +3.4 to +11.1 BLEU. On average, a relative gain of 21{\%} was observed, demonstrating the utility of the corpus.
@inproceedings{mcnamee-duh-2022-multilingual,
title = "The Multilingual Microblog Translation Corpus: Improving and Evaluating Translation of User-Generated Text",
author = "McNamee, Paul and
Duh, Kevin",
editor = "Calzolari, Nicoletta and
B{\'e}chet, Fr{\'e}d{\'e}ric and
Blache, Philippe and
Choukri, Khalid and
Cieri, Christopher and
Declerck, Thierry and
Goggi, Sara and
Isahara, Hitoshi and
Maegaard, Bente and
Mariani, Joseph and
Mazo, H{\'e}l{\`e}ne and
Odijk, Jan and
Piperidis, Stelios",
booktitle = "Proceedings of the Thirteenth Language Resources and Evaluation Conference",
month = jun,
year = "2022",
address = "Marseille, France",
publisher = "European Language Resources Association",
url = "https://aclanthology.org/2022.lrec-1.96",
pages = "910--918",
abstract = "Translation of the noisy, informal language found in social media has been an understudied problem, with a principal factor being the limited availability of translation corpora in many languages. To address this need we have developed a new corpus containing over 200,000 translations of microblog posts that supports translation of thirteen languages into English. The languages are: Arabic, Chinese, Farsi, French, German, Hindi, Korean, Pashto, Portuguese, Russian, Spanish, Tagalog, and Urdu. We are releasing these data as the Multilingual Microblog Translation Corpus to support futher research in translation of informal language. We establish baselines using this new resource, and we further demonstrate the utility of the corpus by conducting experiments with fine-tuning to improve translation quality from a high performing neural machine translation (NMT) system. Fine-tuning provided substantial gains, ranging from +3.4 to +11.1 BLEU. On average, a relative gain of 21{\%} was observed, demonstrating the utility of the corpus.",
}
We evaluate two popular neural cognate generation models{‘} robustness to several types of human-plausible noise (deletion, duplication, swapping, and keyboard errors, as well as a new type of error, phonological errors). We find that duplication and phonological substitution is least harmful, while the other types of errors are harmful. We present an in-depth analysis of the models{‘} results with respect to each error type to explain how and why these models perform as they do.
@inproceedings{wu-yarowsky-2022-robustness,
title = "On the Robustness of Cognate Generation Models",
author = "Wu, Winston and
Yarowsky, David",
editor = "Calzolari, Nicoletta and
B{\'e}chet, Fr{\'e}d{\'e}ric and
Blache, Philippe and
Choukri, Khalid and
Cieri, Christopher and
Declerck, Thierry and
Goggi, Sara and
Isahara, Hitoshi and
Maegaard, Bente and
Mariani, Joseph and
Mazo, H{\'e}l{\`e}ne and
Odijk, Jan and
Piperidis, Stelios",
booktitle = "Proceedings of the Thirteenth Language Resources and Evaluation Conference",
month = jun,
year = "2022",
address = "Marseille, France",
publisher = "European Language Resources Association",
url = "https://aclanthology.org/2022.lrec-1.458",
pages = "4299--4305",
abstract = "We evaluate two popular neural cognate generation models{'} robustness to several types of human-plausible noise (deletion, duplication, swapping, and keyboard errors, as well as a new type of error, phonological errors). We find that duplication and phonological substitution is least harmful, while the other types of errors are harmful. We present an in-depth analysis of the models{'} results with respect to each error type to explain how and why these models perform as they do.",
}
The Universal Morphology (UniMorph) project is a collaborative effort providing broad-coverage instantiated normalized morphological inflection tables for hundreds of diverse world languages. The project comprises two major thrusts: a language-independent feature schema for rich morphological annotation, and a type-level resource of annotated data in diverse languages realizing that schema. This paper presents the expansions and improvements on several fronts that were made in the last couple of years (since McCarthy et al. (2020)). Collaborative efforts by numerous linguists have added 66 new languages, including 24 endangered languages. We have implemented several improvements to the extraction pipeline to tackle some issues, e.g., missing gender and macrons information. We have amended the schema to use a hierarchical structure that is needed for morphological phenomena like multiple-argument agreement and case stacking, while adding some missing morphological features to make the schema more inclusive. In light of the last UniMorph release, we also augmented the database with morpheme segmentation for 16 languages. Lastly, this new release makes a push towards inclusion of derivational morphology in UniMorph by enriching the data and annotation schema with instances representing derivational processes from MorphyNet.
@inproceedings{batsuren-etal-2022-unimorph,
title = "{U}ni{M}orph 4.0: {U}niversal {M}orphology",
author = "Batsuren, Khuyagbaatar and
Goldman, Omer and
Khalifa, Salam and
Habash, Nizar and
Kiera{\'s}, Witold and
Bella, G{\'a}bor and
Leonard, Brian and
Nicolai, Garrett and
Gorman, Kyle and
Ate, Yustinus Ghanggo and
Ryskina, Maria and
Mielke, Sabrina and
Budianskaya, Elena and
El-Khaissi, Charbel and
Pimentel, Tiago and
Gasser, Michael and
Lane, William Abbott and
Raj, Mohit and
Coler, Matt and
Samame, Jaime Rafael Montoya and
Camaiteri, Delio Siticonatzi and
Rojas, Esa{\'u} Zumaeta and
L{\'o}pez Francis, Didier and
Oncevay, Arturo and
L{\'o}pez Bautista, Juan and
Villegas, Gema Celeste Silva and
Hennigen, Lucas Torroba and
Ek, Adam and
Guriel, David and
Dirix, Peter and
Bernardy, Jean-Philippe and
Scherbakov, Andrey and
Bayyr-ool, Aziyana and
Anastasopoulos, Antonios and
Zariquiey, Roberto and
Sheifer, Karina and
Ganieva, Sofya and
Cruz, Hilaria and
Karah{\'o}{\v{g}}a, Ritv{\'a}n and
Markantonatou, Stella and
Pavlidis, George and
Plugaryov, Matvey and
Klyachko, Elena and
Salehi, Ali and
Angulo, Candy and
Baxi, Jatayu and
Krizhanovsky, Andrew and
Krizhanovskaya, Natalia and
Salesky, Elizabeth and
Vania, Clara and
Ivanova, Sardana and
White, Jennifer and
Maudslay, Rowan Hall and
Valvoda, Josef and
Zmigrod, Ran and
Czarnowska, Paula and
Nikkarinen, Irene and
Salchak, Aelita and
Bhatt, Brijesh and
Straughn, Christopher and
Liu, Zoey and
Washington, Jonathan North and
Pinter, Yuval and
Ataman, Duygu and
Wolinski, Marcin and
Suhardijanto, Totok and
Yablonskaya, Anna and
Stoehr, Niklas and
Dolatian, Hossep and
Nuriah, Zahroh and
Ratan, Shyam and
Tyers, Francis M. and
Ponti, Edoardo M. and
Aiton, Grant and
Arora, Aryaman and
Hatcher, Richard J. and
Kumar, Ritesh and
Young, Jeremiah and
Rodionova, Daria and
Yemelina, Anastasia and
Andrushko, Taras and
Marchenko, Igor and
Mashkovtseva, Polina and
Serova, Alexandra and
Prud{'}hommeaux, Emily and
Nepomniashchaya, Maria and
Giunchiglia, Fausto and
Chodroff, Eleanor and
Hulden, Mans and
Silfverberg, Miikka and
McCarthy, Arya D. and
Yarowsky, David and
Cotterell, Ryan and
Tsarfaty, Reut and
Vylomova, Ekaterina",
editor = "Calzolari, Nicoletta and
B{\'e}chet, Fr{\'e}d{\'e}ric and
Blache, Philippe and
Choukri, Khalid and
Cieri, Christopher and
Declerck, Thierry and
Goggi, Sara and
Isahara, Hitoshi and
Maegaard, Bente and
Mariani, Joseph and
Mazo, H{\'e}l{\`e}ne and
Odijk, Jan and
Piperidis, Stelios",
booktitle = "Proceedings of the Thirteenth Language Resources and Evaluation Conference",
month = jun,
year = "2022",
address = "Marseille, France",
publisher = "European Language Resources Association",
url = "https://aclanthology.org/2022.lrec-1.89",
pages = "840--855",
abstract = "The Universal Morphology (UniMorph) project is a collaborative effort providing broad-coverage instantiated normalized morphological inflection tables for hundreds of diverse world languages. The project comprises two major thrusts: a language-independent feature schema for rich morphological annotation, and a type-level resource of annotated data in diverse languages realizing that schema. This paper presents the expansions and improvements on several fronts that were made in the last couple of years (since McCarthy et al. (2020)). Collaborative efforts by numerous linguists have added 66 new languages, including 24 endangered languages. We have implemented several improvements to the extraction pipeline to tackle some issues, e.g., missing gender and macrons information. We have amended the schema to use a hierarchical structure that is needed for morphological phenomena like multiple-argument agreement and case stacking, while adding some missing morphological features to make the schema more inclusive. In light of the last UniMorph release, we also augmented the database with morpheme segmentation for 16 languages. Lastly, this new release makes a push towards inclusion of derivational morphology in UniMorph by enriching the data and annotation schema with instances representing derivational processes from MorphyNet.",
}
Whole-person functional limitations in the areas of mobility, self-care and domestic life affect a majority of individuals with disabilities. Detecting, recording and monitoring such limitations would benefit those individuals, as well as research on whole-person functioning and general public health. Dictionaries of terms related to whole-person function would enable automated identification and extraction of relevant information. However, no such terminologies currently exist, due in part to a lack of standardized coding and their availability mainly in free text clinical notes. In this paper, we introduce terminologies of whole-person function in the domains of mobility, self-care and domestic life, built and evaluated using a small set of manually annotated clinical notes, which provided a seedset that was expanded using a mix of lexical and deep learning approaches.
@inproceedings{zirikly-etal-2022-whole,
title = "A Whole-Person Function Dictionary for the Mobility, Self-Care and Domestic Life Domains: a Seedset Expansion Approach",
author = "Zirikly, Ayah and
Desmet, Bart and
Porcino, Julia and
Camacho Maldonado, Jonathan and
Ho, Pei-Shu and
Jimenez Silva, Rafael and
Sacco, Maryanne",
editor = "Calzolari, Nicoletta and
B{\'e}chet, Fr{\'e}d{\'e}ric and
Blache, Philippe and
Choukri, Khalid and
Cieri, Christopher and
Declerck, Thierry and
Goggi, Sara and
Isahara, Hitoshi and
Maegaard, Bente and
Mariani, Joseph and
Mazo, H{\'e}l{\`e}ne and
Odijk, Jan and
Piperidis, Stelios",
booktitle = "Proceedings of the Thirteenth Language Resources and Evaluation Conference",
month = jun,
year = "2022",
address = "Marseille, France",
publisher = "European Language Resources Association",
url = "https://aclanthology.org/2022.lrec-1.305",
pages = "2850--2855",
abstract = "Whole-person functional limitations in the areas of mobility, self-care and domestic life affect a majority of individuals with disabilities. Detecting, recording and monitoring such limitations would benefit those individuals, as well as research on whole-person functioning and general public health. Dictionaries of terms related to whole-person function would enable automated identification and extraction of relevant information. However, no such terminologies currently exist, due in part to a lack of standardized coding and their availability mainly in free text clinical notes. In this paper, we introduce terminologies of whole-person function in the domains of mobility, self-care and domestic life, built and evaluated using a small set of manually annotated clinical notes, which provided a seedset that was expanded using a mix of lexical and deep learning approaches.",
}
We propose an enhanced adversarial training algorithm for fine-tuning transformer-based language models (i.e., RoBERTa) and apply it to the temporal reasoning task. Current adversarial training approaches for NLP add the adversarial perturbation only to the embedding layer, ignoring the other layers of the model, which might limit the generalization power of adversarial training. Instead, our algorithm searches for the best combination of layers to add the adversarial perturbation. We add the adversarial perturbation to multiple hidden states or attention representations of the model layers. Adding the perturbation to the attention representations performed best in our experiments. Our model can improve performance on several temporal reasoning benchmarks, and establishes new state-of-the-art results.
@inproceedings{kanashiro-pereira-2022-attention,
title = "Attention-Focused Adversarial Training for Robust Temporal Reasoning",
author = "Kanashiro Pereira, Lis",
editor = "Calzolari, Nicoletta and
B{\'e}chet, Fr{\'e}d{\'e}ric and
Blache, Philippe and
Choukri, Khalid and
Cieri, Christopher and
Declerck, Thierry and
Goggi, Sara and
Isahara, Hitoshi and
Maegaard, Bente and
Mariani, Joseph and
Mazo, H{\'e}l{\`e}ne and
Odijk, Jan and
Piperidis, Stelios",
booktitle = "Proceedings of the Thirteenth Language Resources and Evaluation Conference",
month = jun,
year = "2022",
address = "Marseille, France",
publisher = "European Language Resources Association",
url = "https://aclanthology.org/2022.lrec-1.800",
pages = "7352--7359",
abstract = "We propose an enhanced adversarial training algorithm for fine-tuning transformer-based language models (i.e., RoBERTa) and apply it to the temporal reasoning task. Current adversarial training approaches for NLP add the adversarial perturbation only to the embedding layer, ignoring the other layers of the model, which might limit the generalization power of adversarial training. Instead, our algorithm searches for the best combination of layers to add the adversarial perturbation. We add the adversarial perturbation to multiple hidden states or attention representations of the model layers. Adding the perturbation to the attention representations performed best in our experiments. Our model can improve performance on several temporal reasoning benchmarks, and establishes new state-of-the-art results.",
}
Event schemas are structured knowledge sources defining typical real-world scenarios (e.g., going to an airport). We present a framework for efficient human-in-the-loop construction of a schema library, based on a novel script induction system and a well-crafted interface that allows non-experts to {“}program{”} complex event structures. Associated with this work we release a schema library: a machine readable resource of 232 detailed event schemas, each of which describe a distinct typical scenario in terms of its relevant sub-event structure (what happens in the scenario), participants (who plays a role in the scenario), fine-grained typing of each participant, and the implied relational constraints between them. We make our schema library and the SchemaBlocks interface available online.
@inproceedings{weber-etal-2022-human,
title = "Human Schema Curation via Causal Association Rule Mining",
author = "Weber, Noah and
Belyy, Anton and
Holzenberger, Nils and
Rudinger, Rachel and
Van Durme, Benjamin",
editor = "Pradhan, Sameer and
Kuebler, Sandra",
booktitle = "Proceedings of the 16th Linguistic Annotation Workshop (LAW-XVI) within LREC2022",
month = jun,
year = "2022",
address = "Marseille, France",
publisher = "European Language Resources Association",
url = "https://aclanthology.org/2022.law-1.17",
pages = "139--150",
abstract = "Event schemas are structured knowledge sources defining typical real-world scenarios (e.g., going to an airport). We present a framework for efficient human-in-the-loop construction of a schema library, based on a novel script induction system and a well-crafted interface that allows non-experts to {``}program{''} complex event structures. Associated with this work we release a schema library: a machine readable resource of 232 detailed event schemas, each of which describe a distinct typical scenario in terms of its relevant sub-event structure (what happens in the scenario), participants (who plays a role in the scenario), fine-grained typing of each participant, and the implied relational constraints between them. We make our schema library and the SchemaBlocks interface available online.",
}
Pretrained multilingual encoders enable zero-shot cross-lingual transfer, but often produce unreliable models that exhibit high performance variance on the target language. We postulate that this high variance results from zero-shot cross-lingual transfer solving an under-specified optimization problem. We show that any linear-interpolated model between the source language monolingual model and source + target bilingual model has equally low source language generalization error, yet the target language generalization error reduces smoothly and linearly as we move from the monolingual to bilingual model, suggesting that the model struggles to identify good solutions for both source and target languages using the source language alone. Additionally, we show that zero-shot solution lies in non-flat region of target language error generalization surface, causing the high variance.
@inproceedings{wu-etal-2022-zero,
title = "Zero-shot Cross-lingual Transfer is Under-specified Optimization",
author = "Wu, Shijie and
Van Durme, Benjamin and
Dredze, Mark",
editor = "Gella, Spandana and
He, He and
Majumder, Bodhisattwa Prasad and
Can, Burcu and
Giunchiglia, Eleonora and
Cahyawijaya, Samuel and
Min, Sewon and
Mozes, Maximilian and
Li, Xiang Lorraine and
Augenstein, Isabelle and
Rogers, Anna and
Cho, Kyunghyun and
Grefenstette, Edward and
Rimell, Laura and
Dyer, Chris",
booktitle = "Proceedings of the 7th Workshop on Representation Learning for NLP",
month = may,
year = "2022",
address = "Dublin, Ireland",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.repl4nlp-1.25",
doi = "10.18653/v1/2022.repl4nlp-1.25",
pages = "236--248",
abstract = "Pretrained multilingual encoders enable zero-shot cross-lingual transfer, but often produce unreliable models that exhibit high performance variance on the target language. We postulate that this high variance results from zero-shot cross-lingual transfer solving an under-specified optimization problem. We show that any linear-interpolated model between the source language monolingual model and source + target bilingual model has equally low source language generalization error, yet the target language generalization error reduces smoothly and linearly as we move from the monolingual to bilingual model, suggesting that the model struggles to identify good solutions for both source and target languages using the source language alone. Additionally, we show that zero-shot solution lies in non-flat region of target language error generalization surface, causing the high variance.",
}
We propose the task of updated headline generation, in which a system generates a headline for an updated article, considering both the previous article and headline. The system must identify the novel information in the article update, and modify the existing headline accordingly. We create data for this task using the NewsEdits corpus by automatically identifying contiguous article versions that are likely to require a substantive headline update. We find that models conditioned on the prior headline and body revisions produce headlines judged by humans to be as factual as gold headlines while making fewer unnecessary edits compared to a standard headline generation model. Our experiments establish benchmarks for this new contextual summarization task.
@inproceedings{panthaplackel-etal-2022-updated,
title = "Updated Headline Generation: Creating Updated Summaries for Evolving News Stories",
author = "Panthaplackel, Sheena and
Benton, Adrian and
Dredze, Mark",
editor = "Muresan, Smaranda and
Nakov, Preslav and
Villavicencio, Aline",
booktitle = "Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = may,
year = "2022",
address = "Dublin, Ireland",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.acl-long.446",
doi = "10.18653/v1/2022.acl-long.446",
pages = "6438--6461",
abstract = "We propose the task of updated headline generation, in which a system generates a headline for an updated article, considering both the previous article and headline. The system must identify the novel information in the article update, and modify the existing headline accordingly. We create data for this task using the NewsEdits corpus by automatically identifying contiguous article versions that are likely to require a substantive headline update. We find that models conditioned on the prior headline and body revisions produce headlines judged by humans to be as factual as gold headlines while making fewer unnecessary edits compared to a standard headline generation model. Our experiments establish benchmarks for this new contextual summarization task.",
}
Collecting data for conversational semantic parsing is a time-consuming and demanding process. In this paper we consider, given an incomplete dataset with only a small amount of data, how to build an AI-powered human-in-the-loop process to enable efficient data collection. A guided K-best selection process is proposed, which (i) generates a set of possible valid candidates; (ii) allows users to quickly traverse the set and filter incorrect parses; and (iii) asks users to select the correct parse, with minimal modification when necessary. We investigate how to best support users in efficiently traversing the candidate set and locating the correct parse, in terms of speed and accuracy. In our user study, consisting of five annotators labeling 300 instances each, we find that combining keyword searching, where keywords can be used to query relevant candidates, and keyword suggestion, where representative keywords are automatically generated, enables fast and accurate annotation.
@inproceedings{belyy-etal-2022-guided,
title = "Guided K-best Selection for Semantic Parsing Annotation",
author = "Belyy, Anton and
Huang, Chieh-yang and
Andreas, Jacob and
Platanios, Emmanouil Antonios and
Thomson, Sam and
Shin, Richard and
Roy, Subhro and
Nisnevich, Aleksandr and
Chen, Charles and
Van Durme, Benjamin",
editor = "Basile, Valerio and
Kozareva, Zornitsa and
Stajner, Sanja",
booktitle = "Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics: System Demonstrations",
month = may,
year = "2022",
address = "Dublin, Ireland",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.acl-demo.11",
doi = "10.18653/v1/2022.acl-demo.11",
pages = "114--126",
abstract = "Collecting data for conversational semantic parsing is a time-consuming and demanding process. In this paper we consider, given an incomplete dataset with only a small amount of data, how to build an AI-powered human-in-the-loop process to enable efficient data collection. A guided K-best selection process is proposed, which (i) generates a set of possible valid candidates; (ii) allows users to quickly traverse the set and filter incorrect parses; and (iii) asks users to select the correct parse, with minimal modification when necessary. We investigate how to best support users in efficiently traversing the candidate set and locating the correct parse, in terms of speed and accuracy. In our user study, consisting of five annotators labeling 300 instances each, we find that combining keyword searching, where keywords can be used to query relevant candidates, and keyword suggestion, where representative keywords are automatically generated, enables fast and accurate annotation.",
}
We introduce a novel setup for low-resource task-oriented semantic parsing which incorporates several constraints that may arise in real-world scenarios: (1) lack of similar datasets/models from a related domain, (2) inability to sample useful logical forms directly from a grammar, and (3) privacy requirements for unlabeled natural utterances. Our goal is to improve a low-resource semantic parser using utterances collected through user interactions. In this highly challenging but realistic setting, we investigate data augmentation approaches involving generating a set of structured canonical utterances corresponding to logical forms, before simulating corresponding natural language and filtering the resulting pairs. We find that such approaches are effective despite our restrictive setup: in a low-resource setting on the complex SMCalFlow calendaring dataset (Andreas et al. 2020), we observe 33{\%} relative improvement over a non-data-augmented baseline in top-1 match.
@inproceedings{yang-etal-2022-addressing,
title = "Addressing Resource and Privacy Constraints in Semantic Parsing Through Data Augmentation",
author = "Yang, Kevin and
Deng, Olivia and
Chen, Charles and
Shin, Richard and
Roy, Subhro and
Van Durme, Benjamin",
editor = "Muresan, Smaranda and
Nakov, Preslav and
Villavicencio, Aline",
booktitle = "Findings of the Association for Computational Linguistics: ACL 2022",
month = may,
year = "2022",
address = "Dublin, Ireland",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.findings-acl.291",
doi = "10.18653/v1/2022.findings-acl.291",
pages = "3685--3695",
abstract = "We introduce a novel setup for low-resource task-oriented semantic parsing which incorporates several constraints that may arise in real-world scenarios: (1) lack of similar datasets/models from a related domain, (2) inability to sample useful logical forms directly from a grammar, and (3) privacy requirements for unlabeled natural utterances. Our goal is to improve a low-resource semantic parser using utterances collected through user interactions. In this highly challenging but realistic setting, we investigate data augmentation approaches involving generating a set of structured canonical utterances corresponding to logical forms, before simulating corresponding natural language and filtering the resulting pairs. We find that such approaches are effective despite our restrictive setup: in a low-resource setting on the complex SMCalFlow calendaring dataset (Andreas et al. 2020), we observe 33{\%} relative improvement over a non-data-augmented baseline in top-1 match.",
}
The evaluation campaign of the 19th International Conference on Spoken Language Translation featured eight shared tasks: (i) Simultaneous speech translation, (ii) Offline speech translation, (iii) Speech to speech translation, (iv) Low-resource speech translation, (v) Multilingual speech translation, (vi) Dialect speech translation, (vii) Formality control for speech translation, (viii) Isometric speech translation. A total of 27 teams participated in at least one of the shared tasks. This paper details, for each shared task, the purpose of the task, the data that were released, the evaluation metrics that were applied, the submissions that were received and the results that were achieved.
@inproceedings{anastasopoulos-etal-2022-findings,
title = "Findings of the {IWSLT} 2022 Evaluation Campaign",
author = {Anastasopoulos, Antonios and
Barrault, Lo{\"\i}c and
Bentivogli, Luisa and
Zanon Boito, Marcely and
Bojar, Ond{\v{r}}ej and
Cattoni, Roldano and
Currey, Anna and
Dinu, Georgiana and
Duh, Kevin and
Elbayad, Maha and
Emmanuel, Clara and
Est{\`e}ve, Yannick and
Federico, Marcello and
Federmann, Christian and
Gahbiche, Souhir and
Gong, Hongyu and
Grundkiewicz, Roman and
Haddow, Barry and
Hsu, Benjamin and
Javorsk{\'y}, D{\'a}vid and
Kloudov{\'a}, V{\u{e}}ra and
Lakew, Surafel and
Ma, Xutai and
Mathur, Prashant and
McNamee, Paul and
Murray, Kenton and
N{\v{a}}dejde, Maria and
Nakamura, Satoshi and
Negri, Matteo and
Niehues, Jan and
Niu, Xing and
Ortega, John and
Pino, Juan and
Salesky, Elizabeth and
Shi, Jiatong and
Sperber, Matthias and
St{\"u}ker, Sebastian and
Sudoh, Katsuhito and
Turchi, Marco and
Virkar, Yogesh and
Waibel, Alexander and
Wang, Changhan and
Watanabe, Shinji},
editor = "Salesky, Elizabeth and
Federico, Marcello and
Costa-juss{\`a}, Marta",
booktitle = "Proceedings of the 19th International Conference on Spoken Language Translation (IWSLT 2022)",
month = may,
year = "2022",
address = "Dublin, Ireland (in-person and online)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.iwslt-1.10",
doi = "10.18653/v1/2022.iwslt-1.10",
pages = "98--157",
abstract = "The evaluation campaign of the 19th International Conference on Spoken Language Translation featured eight shared tasks: (i) Simultaneous speech translation, (ii) Offline speech translation, (iii) Speech to speech translation, (iv) Low-resource speech translation, (v) Multilingual speech translation, (vi) Dialect speech translation, (vii) Formality control for speech translation, (viii) Isometric speech translation. A total of 27 teams participated in at least one of the shared tasks. This paper details, for each shared task, the purpose of the task, the data that were released, the evaluation metrics that were applied, the submissions that were received and the results that were achieved.",
}
Automated methods have been widely used to identify and analyze mental health conditions (e.g., depression) from various sources of information, including social media. Yet, deployment of such models in real-world healthcare applications faces challenges including poor out-of-domain generalization and lack of trust in black box models. In this work, we propose approaches for depression detection that are constrained to different degrees by the presence of symptoms described in PHQ9, a questionnaire used by clinicians in the depression screening process. In dataset-transfer experiments on three social media datasets, we find that grounding the model in PHQ9{‘}s symptoms substantially improves its ability to generalize to out-of-distribution data compared to a standard BERT-based approach. Furthermore, this approach can still perform competitively on in-domain data. These results and our qualitative analyses suggest that grounding model predictions in clinically-relevant symptoms can improve generalizability while producing a model that is easier to inspect.
@inproceedings{nguyen-etal-2022-improving,
title = "Improving the Generalizability of Depression Detection by Leveraging Clinical Questionnaires",
author = "Nguyen, Thong and
Yates, Andrew and
Zirikly, Ayah and
Desmet, Bart and
Cohan, Arman",
editor = "Muresan, Smaranda and
Nakov, Preslav and
Villavicencio, Aline",
booktitle = "Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = may,
year = "2022",
address = "Dublin, Ireland",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.acl-long.578",
doi = "10.18653/v1/2022.acl-long.578",
pages = "8446--8459",
abstract = "Automated methods have been widely used to identify and analyze mental health conditions (e.g., depression) from various sources of information, including social media. Yet, deployment of such models in real-world healthcare applications faces challenges including poor out-of-domain generalization and lack of trust in black box models. In this work, we propose approaches for depression detection that are constrained to different degrees by the presence of symptoms described in PHQ9, a questionnaire used by clinicians in the depression screening process. In dataset-transfer experiments on three social media datasets, we find that grounding the model in PHQ9{'}s symptoms substantially improves its ability to generalize to out-of-distribution data compared to a standard BERT-based approach. Furthermore, this approach can still perform competitively on in-domain data. These results and our qualitative analyses suggest that grounding model predictions in clinically-relevant symptoms can improve generalizability while producing a model that is easier to inspect.",
}
This paper details the Johns Hopkins speech translation (ST) system used in the IWLST2022 dialect speech translation task. Our system uses a cascade of automatic speech recognition (ASR) and machine translation (MT). We use a Conformer model for ASR systems and a Transformer model for machine translation. Surprisingly, we found that while using additional ASR training data resulted in only a negligible change in performance as measured by BLEU or word error rate (WER), aggressive text normalization improved BLEU more significantly. We also describe an approach, similar to back-translation, for improving performance using synthetic dialectal source text produced from source sentences in mismatched dialects.
@inproceedings{yang-etal-2022-jhu,
title = "{JHU} {IWSLT} 2022 Dialect Speech Translation System Description",
author = "Yang, Jinyi and
Hussein, Amir and
Wiesner, Matthew and
Khudanpur, Sanjeev",
editor = "Salesky, Elizabeth and
Federico, Marcello and
Costa-juss{\`a}, Marta",
booktitle = "Proceedings of the 19th International Conference on Spoken Language Translation (IWSLT 2022)",
month = may,
year = "2022",
address = "Dublin, Ireland (in-person and online)",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.iwslt-1.29",
doi = "10.18653/v1/2022.iwslt-1.29",
pages = "319--326",
abstract = "This paper details the Johns Hopkins speech translation (ST) system used in the IWLST2022 dialect speech translation task. Our system uses a cascade of automatic speech recognition (ASR) and machine translation (MT). We use a Conformer model for ASR systems and a Transformer model for machine translation. Surprisingly, we found that while using additional ASR training data resulted in only a negligible change in performance as measured by BLEU or word error rate (WER), aggressive text normalization improved BLEU more significantly. We also describe an approach, similar to back-translation, for improving performance using synthetic dialectal source text produced from source sentences in mismatched dialects.",
}
Recent work in multilingual machine translation (MMT) has focused on the potential of positive transfer between languages, particularly cases where higher-resourced languages can benefit lower-resourced ones. While training an MMT model, the supervision signals learned from one language pair can be transferred to the other via the tokens shared by multiple source languages. However, the transfer is inhibited when the token overlap among source languages is small, which manifests naturally when languages use different writing systems. In this paper, we tackle inhibited transfer by augmenting the training data with alternative signals that unify different writing systems, such as phonetic, romanized, and transliterated input. We test these signals on Indic and Turkic languages, two language families where the writing systems differ but languages still share common features. Our results indicate that a straightforward multi-source self-ensemble {–} training a model on a mixture of various signals and ensembling the outputs of the same model fed with different signals during inference, outperforms strong ensemble baselines by 1.3 BLEU points on both language families. Further, we find that incorporating alternative inputs via self-ensemble can be particularly effective when training set is small, leading to +5 BLEU when only 5{\%} of the total training data is accessible. Finally, our analysis demonstrates that including alternative signals yields more consistency and translates named entities more accurately, which is crucial for increased factuality of automated systems.
@inproceedings{sun-etal-2022-alternative,
title = "Alternative Input Signals Ease Transfer in Multilingual Machine Translation",
author = "Sun, Simeng and
Fan, Angela and
Cross, James and
Chaudhary, Vishrav and
Tran, Chau and
Koehn, Philipp and
Guzm{\'a}n, Francisco",
editor = "Muresan, Smaranda and
Nakov, Preslav and
Villavicencio, Aline",
booktitle = "Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = may,
year = "2022",
address = "Dublin, Ireland",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.acl-long.363",
doi = "10.18653/v1/2022.acl-long.363",
pages = "5291--5305",
abstract = "Recent work in multilingual machine translation (MMT) has focused on the potential of positive transfer between languages, particularly cases where higher-resourced languages can benefit lower-resourced ones. While training an MMT model, the supervision signals learned from one language pair can be transferred to the other via the tokens shared by multiple source languages. However, the transfer is inhibited when the token overlap among source languages is small, which manifests naturally when languages use different writing systems. In this paper, we tackle inhibited transfer by augmenting the training data with alternative signals that unify different writing systems, such as phonetic, romanized, and transliterated input. We test these signals on Indic and Turkic languages, two language families where the writing systems differ but languages still share common features. Our results indicate that a straightforward multi-source self-ensemble {--} training a model on a mixture of various signals and ensembling the outputs of the same model fed with different signals during inference, outperforms strong ensemble baselines by 1.3 BLEU points on both language families. Further, we find that incorporating alternative inputs via self-ensemble can be particularly effective when training set is small, leading to +5 BLEU when only 5{\%} of the total training data is accessible. Finally, our analysis demonstrates that including alternative signals yields more consistency and translates named entities more accurately, which is crucial for increased factuality of automated systems.",
}
Neural coreference resolution models trained on one dataset may not transfer to new, low-resource domains. Active learning mitigates this problem by sampling a small subset of data for annotators to label. While active learning is well-defined for classification tasks, its application to coreference resolution is neither well-defined nor fully understood. This paper explores how to actively label coreference, examining sources of model uncertainty and document reading costs. We compare uncertainty sampling strategies and their advantages through thorough error analysis. In both synthetic and human experiments, labeling spans within the same document is more effective than annotating spans across documents. The findings contribute to a more realistic development of coreference resolution models.
@inproceedings{yuan-etal-2022-adapting,
title = "Adapting Coreference Resolution Models through Active Learning",
author = "Yuan, Michelle and
Xia, Patrick and
May, Chandler and
Van Durme, Benjamin and
Boyd-Graber, Jordan",
editor = "Muresan, Smaranda and
Nakov, Preslav and
Villavicencio, Aline",
booktitle = "Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)",
month = may,
year = "2022",
address = "Dublin, Ireland",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.acl-long.519",
doi = "10.18653/v1/2022.acl-long.519",
pages = "7533--7549",
abstract = "Neural coreference resolution models trained on one dataset may not transfer to new, low-resource domains. Active learning mitigates this problem by sampling a small subset of data for annotators to label. While active learning is well-defined for classification tasks, its application to coreference resolution is neither well-defined nor fully understood. This paper explores how to actively label coreference, examining sources of model uncertainty and document reading costs. We compare uncertainty sampling strategies and their advantages through thorough error analysis. In both synthetic and human experiments, labeling spans within the same document is more effective than annotating spans across documents. The findings contribute to a more realistic development of coreference resolution models.",
}
@InProceedings{zhou-et-al-2022,
aclid = "2022.acl-long.110",
doi = "10.18653/v1/2022.acl-long.110",
author = "Jiawei Zhou and Jason Eisner and Michael Newman and
Emmanouil Anthony Platanios and Sam Thomson",
title = "Online Semantic Parsing for Latency Reduction in
Task-Oriented Dialogue",
booktitle = "Proceedings of the Association for Computational
Linguistics (ACL)",
pages = "1554--1576",
year = "2022",
month = may,
address = "Dublin",
URL = "http://cs.jhu.edu/~jason/papers/#zhou-et-al-2022",
}
@InProceedings{cotterell-eisner-2022,
author = "Ryan Cotterell and Jason Eisner",
title = "A Functionalist Account of Vowel System Typology",
booktitle = "Proceedings of the Association for Computational
Linguistics (ACL)",
year = "2022",
month = may,
address = "Dublin",
note = "Paper was accepted, but we withdrew it in order to add
more experiments and analysis before publication.",
URL = "http://cs.jhu.edu/~jason/papers/#cotterell-eisner-2022",
}
@InProceedings{yang-et-al-2022-iclr,
author = "Chenghao Yang and Hongyuan Mei and Jason Eisner",
title = "Transformer Embeddings of Irregularly Spaced Events
and Their Participants",
booktitle = "Proceedings of the Tenth International Conference on
Learning Representations (ICLR)",
year = "2022",
month = apr,
note = "9 pages plus appendices",
URL = "http://cs.jhu.edu/~jason/papers/#yang-et-al-2022-iclr",
}
@inproceedings{248965209,
title = {SALTED: A Framework for SAlient Long-Tail Translation Error Detection},
author = {{Vikas Raunak} and {Matt Post} and {Arul Menezes}},
year = 2022,
month = {5},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/a349bcb86ba80ef543e5deaadbb7e0ff5daef5e7},
}
@inproceedings{249437588,
title = {Temporal Contrastive-Loss for Audio Event Detection},
author = {{Sandeep Reddy Kothinti} and {Mounya Elhilali}},
year = 2022,
month = {5},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/34fe9aa0f5e26768d196087ed146e2b3a576d73e},
}
@inproceedings{251253396,
title = {Multilingual Coreference Resolution in Multiparty Dialogue},
author = {{Boyuan Zheng} and {Patrick Xia} and {M. Yarmohammadi} and {Benjamin Van Durme}},
year = 2022,
month = {8},
booktitle = {Transactions of the Association for Computational Linguistics},
url = {https://www.semanticscholar.org/paper/ced26dee12fe5fa2f666bcc2ba5b0a1969240887},
}
@inproceedings{247362702,
title = {UNeXt: MLP-based Rapid Medical Image Segmentation Network},
author = {{Jeya Maria Jose Valanarasu} and {Vishal M. Patel}},
year = 2022,
month = {3},
booktitle = {International Conference on Medical Image Computing and Computer-Assisted Intervention},
url = {https://www.semanticscholar.org/paper/ccb5a70f8a6f7b7fc923b9d4c18488b2837daa6f},
}
@inproceedings{249926634,
title = {BenchCLAMP: A Benchmark for Evaluating Language Models on Semantic Parsing},
author = {{Subhro Roy} and {Sam Thomson} and {Tongfei Chen} and {Richard Shin} and {Adam Pauls} and {J. Eisner} and {Benjamin Van Durme}},
year = 2022,
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/132751a80632e80a90d7c3d3cd8a361f48fdb9b4},
}
@inproceedings{246805990,
title = {Trade-Offs in Sensor Systems Design: A Tutorial},
author = {{Christos Sapsanis} and {M. Sophocleous} and {A. Andreou} and {J. Georgiou}},
year = 2022,
month = {6},
booktitle = {IEEE Sensors Journal},
url = {https://www.semanticscholar.org/paper/07cfa0c80e6ef73a2aa5fab377c2f698ed476341},
}
Humans process natural language online, whether reading a document or participating in multiparty dialogue. Recent advances in neural coreference resolution have focused on offline approaches that assume the full communication history as input. This is neither realistic nor sufficient if we wish to support dialogue understanding in real-time. We benchmark two existing, offline, models and highlight their shortcomings in the online setting. We then modify these models to perform online inference and introduce rollback: a short-term mechanism to correct mistakes. We demonstrate across five English datasets the effectiveness of this approach against an offline and a naive online model in terms of latency, final document-level coreference F1, and average running F1.
@inproceedings{xia-van-durme-2022-online,
title = "Online Neural Coreference Resolution with Rollback",
author = "Xia, Patrick and
Van Durme, Benjamin",
editor = "Ogrodniczuk, Maciej and
Pradhan, Sameer and
Nedoluzhko, Anna and
Ng, Vincent and
Poesio, Massimo",
booktitle = "Proceedings of the Fifth Workshop on Computational Models of Reference, Anaphora and Coreference",
month = oct,
year = "2022",
address = "Gyeongju, Republic of Korea",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2022.crac-1.2",
pages = "13--21",
abstract = "Humans process natural language online, whether reading a document or participating in multiparty dialogue. Recent advances in neural coreference resolution have focused on offline approaches that assume the full communication history as input. This is neither realistic nor sufficient if we wish to support dialogue understanding in real-time. We benchmark two existing, offline, models and highlight their shortcomings in the online setting. We then modify these models to perform online inference and introduce rollback: a short-term mechanism to correct mistakes. We demonstrate across five English datasets the effectiveness of this approach against an offline and a naive online model in terms of latency, final document-level coreference F1, and average running F1.",
}
@inproceedings{250105551,
title = {Spatial speech detection for binaural hearing aids using deep phoneme classifiers},
author = {{H. Kayser} and {H. Hermansky} and {B. Meyer}},
year = 2022,
month = {6},
booktitle = {Acta acustica. European Acoustics Association},
url = {https://www.semanticscholar.org/paper/5bf8888705bfa1cdbf08784606d5ebf6e6a0e2f8},
}
@inproceedings{245668909,
title = {A Transformer-Based Siamese Network for Change Detection},
author = {{W. G. C. Bandara} and {Vishal M. Patel}},
year = 2022,
month = {1},
booktitle = {IEEE International Geoscience and Remote Sensing Symposium},
url = {https://www.semanticscholar.org/paper/ef3b15260a610473c95662f5df2c195ac19f64d6},
}
@inproceedings{248228101,
title = {Shape-guided Object Inpainting},
author = {{Yu Zeng} and {Zhe Lin} and {Vishal M. Patel}},
year = 2022,
month = {4},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/69286603f2dd6037634921e1247543e30fe1756d},
}
@inproceedings{253253453,
title = {Microsoft Word-nqac237.docx},
author = {{Bruce Y Lee} and {J. Ordovás} and {E. J. Parks} and {Cheryl AM Anderson} and {A. Barabási} and {S. Clinton} and {K. Haye} and {V. Duffy} and {P. Franks} and {Elizabeth M Ginexi} and {K. Hammond} and {Erin C. Hanlon} and {Michael Hittle} and {Emily Ho} and {A. Horn} and {R. Isaacson} and {P. Mabry} and {Susan E. Malone} and {Corby K. Martin} and {J. Mattei} and {S. Meydani} and {Lorene M. Nelson} and {M. Neuhouser} and {N. Pronk} and {S. Saria} and {Frank Ajl Scheer} and {E. Segal} and {M. Sevick} and {T. Spector} and {Linda B Van Horn} and {K. Varady} and {V. S. Voruganti} and {Marie F Martinez}},
year = 2022,
booktitle = {},
url = {https://www.semanticscholar.org/paper/ae27ca3ffeb8273f258fb6a41a1cc4803adb716b},
}
@inproceedings{252383306,
title = {NBD-GAP: Non-Blind Image Deblurring without Clean Target Images},
author = {{Nithin Gopalakrishnan Nair} and {R. Yasarla} and {Vishal M. Patel}},
year = 2022,
month = {9},
booktitle = {International Conference on Information Photonics},
url = {https://www.semanticscholar.org/paper/28a43c5d52c421b1ccc24d15f39b2cdb82ed84de},
}
@inproceedings{251462729,
title = {Non-Contrastive Self-Supervised Learning for Utterance-Level Information Extraction From Speech},
author = {{Jaejin Cho} and {J. Villalba} and {L. Moro-Velázquez} and {N. Dehak}},
year = 2022,
month = {8},
booktitle = {IEEE Journal on Selected Topics in Signal Processing},
url = {https://www.semanticscholar.org/paper/7504aeee4c344c4cf9c6fc071dcc4b4b34d124cc},
}
@inproceedings{251647228,
title = {Image BERT Pre-training with Online Tokenizer},
author = {{Jinghao Zhou} and {Chen Wei} and {Huiyu Wang} and {Wei Shen} and {Cihang Xie} and {A. Yuille} and {Tao Kong}},
year = 2022,
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/ff169d09a933756e8798021dbf9e24a0bbfd9b38},
}
@inproceedings{249830266,
title = {Advances in Speaker Recognition for Multilingual Conversational Telephone Speech: The JHU-MIT System for NIST SRE20 CTS Challenge},
author = {{J. Villalba} and {B. J. Borgstrom} and {Saurabh Kataria} and {Jaejin Cho} and {P. Torres-Carrasquillo} and {N. Dehak}},
year = 2022,
month = {6},
booktitle = {The Speaker and Language Recognition Workshop},
url = {https://www.semanticscholar.org/paper/042e35459f6dfd8ad8be0dad72ae27f8e73cd4a8},
}
@inproceedings{249282662,
title = {Faster Rates of Convergence to Stationary Points in Differentially Private Optimization},
author = {{R. Arora} and {Raef Bassily} and {Tom'as Gonz'alez} and {Crist'obal Guzm'an} and {Michael Menart} and {Enayat Ullah}},
year = 2022,
month = {6},
booktitle = {International Conference on Machine Learning},
url = {https://www.semanticscholar.org/paper/6f85ad4e04fc157ed5b499e348972f188a39cd10},
}
@inproceedings{250243820,
title = {Adversarial Robustness is at Odds with Lazy Training},
author = {{Yunjuan Wang} and {Enayat Ullah} and {Poorya Mianjy} and {R. Arora}},
year = 2022,
month = {6},
booktitle = {Neural Information Processing Systems},
url = {https://www.semanticscholar.org/paper/e2100da66c556f6ce3fbe904696fb0cec2aca2bf},
}
@inproceedings{248512944,
title = {In Defense of Image Pre-Training for Spatiotemporal Recognition},
author = {{Xianhang Li} and {Huiyu Wang} and {Chen Wei} and {Jieru Mei} and {A. Yuille} and {Yuyin Zhou} and {Cihang Xie}},
year = 2022,
month = {5},
booktitle = {European Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/c0c0139333b9c642fe7789f4fe8f27bc647c280d},
}
@inproceedings{248832550,
title = {Digitally recorded and remotely classified lung auscultation compared with conventional stethoscope classifications among children aged 1–59 months enrolled in the Pneumonia Etiology Research for Child Health (PERCH) case–control study},
author = {{Daniel E Park} and {Nora L. Watson} and {Christopher Focht} and {D. Feikin} and {Laura L Hammit} and {W. A. Brooks} and {S. Howie} and {K. Kotloff} and {O. Levine} and {S. Madhi} and {D. Murdoch} and {K. O'Brien} and {J. Scott} and {D. Thea} and {Tussanee Amorninthapichet} and {J. Awori} and {C. Bunthi} and {B. Ebruke} and {Mounya Elhilali} and {Melissa M. Higdon} and {L. Hossain} and {Y. Jahan} and {D. Moore} and {J. Mulindwa} and {L. Mwananyanda} and {Sathapana Naorat} and {Christine Prosperi} and {S. Thamthitiwat} and {C. Verwey} and {K. Jablonski} and {M. Power} and {H. Young} and {M. Deloria Knoll} and {E. McCollum}},
year = 2022,
month = {5},
booktitle = {BMJ Open Respiratory Research},
url = {https://www.semanticscholar.org/paper/dfedb313d8718de8aa162813060af3e24e8cbe28},
}
@inproceedings{252341100,
title = {Chunking Defense for Adversarial Attacks on ASR},
author = {{Yiwen Shao} and {J. Villalba} and {Sonal Joshi} and {Saurabh Kataria} and {S. Khudanpur} and {N. Dehak}},
year = 2022,
month = {9},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/ace27d0f6e93765439e19203e69570cf00f09e63},
}
@inproceedings{250425961,
title = {No Language Left Behind: Scaling Human-Centered Machine Translation},
author = {{Nllb team} and {M. Costa-jussà} and {James Cross} and {Onur cCelebi} and {Maha Elbayad} and {Kenneth Heafield} and {Kevin Heffernan} and {Elahe Kalbassi} and {Janice Lam} and {Daniel Licht} and {Jean Maillard} and {Anna Sun} and {Skyler Wang} and {Guillaume Wenzek} and {Alison Youngblood} and {Bapi Akula} and {Loïc Barrault} and {Gabriel Mejia Gonzalez} and {Prangthip Hansanti} and {John Hoffman} and {Semarley Jarrett} and {Kaushik Ram Sadagopan} and {Dirk Rowe} and {Shannon L. Spruit} and {C. Tran} and {Pierre Yves Andrews} and {Necip Fazil Ayan} and {Shruti Bhosale} and {Sergey Edunov} and {Angela Fan} and {Cynthia Gao} and {Vedanuj Goswami} and {Francisco Guzm'an} and {Philipp Koehn} and {Alexandre Mourachko} and {C. Ropers} and {Safiyyah Saleem} and {Holger Schwenk} and {Jeff Wang}},
year = 2022,
month = {7},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/e19b54ad4c1c8af045069e9cac350ffc2ce60e1a},
}
@inproceedings{248476325,
title = {Where in the World is this Image? Transformer-based Geo-localization in the Wild},
author = {{Shraman Pramanick} and {E. Nowara} and {Joshua Gleason} and {C. Castillo} and {R. Chellappa}},
year = 2022,
month = {4},
booktitle = {European Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/1889dfb7c30f2b9f8e9d4026ca71ec10caa449af},
}
@inproceedings{246210468,
title = {Transfer Learning Approaches for Building Cross-Language Dense Retrieval Models},
author = {{Suraj Nair} and {Eugene Yang} and {Dawn J Lawrie} and {Kevin Duh} and {Paul McNamee} and {Kenton Murray} and {J. Mayfield} and {Douglas W. Oard}},
year = 2022,
month = {1},
booktitle = {European Conference on Information Retrieval},
url = {https://www.semanticscholar.org/paper/d1ccffb8eb1b7a99cd586723074b82fa5399bdd2},
}
@inproceedings{255595965,
title = {Textual Data Augmentation for Arabic-English Code-Switching Speech Recognition},
author = {{A. Hussein} and {S. A. Chowdhury} and {Ahmed Abdelali} and {N. Dehak} and {Ahmed M. Ali} and {S. Khudanpur}},
year = 2022,
month = {1},
booktitle = {Spoken Language Technology Workshop},
url = {https://www.semanticscholar.org/paper/3c00e6cc82b49f046b5f36e5d5f8aa4af68cad5a},
}
@inproceedings{247628260,
title = {Complex Frequency Domain Linear Prediction: A Tool to Compute Modulation Spectrum of Speech},
author = {{Samik Sadhu} and {H. Hermansky}},
year = 2022,
month = {3},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/35a36559a133981c17759aa573afea646abe40f6},
}
@inproceedings{250298720,
title = {Modeling Constraints Can Identify Winning Arguments in Multi-Party Interactions (Student Abstract)},
author = {{Suzanna Sia} and {Kokil Jaidka} and {Niyati Chayya} and {Kevin Duh}},
year = 2022,
month = {6},
booktitle = {AAAI Conference on Artificial Intelligence},
url = {https://www.semanticscholar.org/paper/da88a7e2b2187fc230b61f36752dbf396be9ce32},
}
@inproceedings{251800257,
title = {Masked Autoencoders Enable Efficient Knowledge Distillers},
author = {{Yutong Bai} and {Zeyu Wang} and {Junfei Xiao} and {Chen Wei} and {Huiyu Wang} and {A. Yuille} and {Yuyin Zhou} and {Cihang Xie}},
year = 2022,
month = {8},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/a7cd547c539d69f99f17855242cb07bd80047f9a},
}
@inproceedings{249063004,
title = {VoynaSlov: A Data Set of Russian Social Media Activity during the 2022 Ukraine-Russia War},
author = {{Chan Young Park} and {Julia Mendelsohn} and {Anjalie Field} and {Yulia Tsvetkov}},
year = 2022,
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/215a6f2b4c206975f59d81c0c9f45cfe935a85e9},
}
@inproceedings{246680149,
title = {Point-Level Region Contrast for Object Detection Pre-Training},
author = {{Yutong Bai} and {Xinlei Chen} and {Alexander Kirillov} and {A. Yuille} and {A. Berg}},
year = 2022,
month = {2},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/7d692139562f9679a3694e1d408b00bd8259b6f1},
}
@inproceedings{247839270,
title = {Supplementary File: Escaping Data Scarcity for High-Resolution Heterogeneous Face Hallucination},
author = {{Yiqun Mei} and {Pengfei Guo} and {Vishal M. Patel}},
year = 2022,
booktitle = {},
url = {https://www.semanticscholar.org/paper/33e69c1a173789d721185c07510af20013a509bf},
}
@inproceedings{258762900,
title = {NELLIE: A Neuro-Symbolic Inference Engine for Grounded, Compositional, and Explainable Reasoning},
author = {{Nathaniel Weir} and {Benjamin Van Durme}},
year = 2022,
month = {9},
booktitle = {International Joint Conference on Artificial Intelligence},
url = {https://www.semanticscholar.org/paper/52aa0f1347459ab9dec1655fc8fa29866919f624},
}
@inproceedings{251765426,
title = {Bitext Mining for Low-Resource Languages via Contrastive Learning},
author = {{Weiting Tan} and {Philipp Koehn}},
year = 2022,
month = {8},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/767853fdd964e043c485ebb92afdcdf3ee8457e8},
}
@inproceedings{250408015,
title = {k-means Mask Transformer},
author = {{Qihang Yu} and {Huiyu Wang} and {Siyuan Qiao} and {Maxwell D. Collins} and {Yukun Zhu} and {Hatwig Adam} and {A. Yuille} and {Liang-Chieh Chen}},
year = 2022,
booktitle = {European Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/f3b1dd33a2a8b533a0c08382b2a2bbf721beac21},
}
@inproceedings{247476162,
title = {DeepFusion: Lidar-Camera Deep Fusion for Multi-Modal 3D Object Detection},
author = {{Yingwei Li} and {Adams Wei Yu} and {Tianjian Meng} and {Benjamin Caine} and {Jiquan Ngiam} and {Daiyi Peng} and {Junyang Shen} and {Bo-Xun Wu} and {Yifeng Lu} and {Denny Zhou} and {Quoc V. Le} and {A. Yuille} and {Mingxing Tan}},
year = 2022,
month = {3},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/5ffca96f4becdab649f085699594caa7c5c03e86},
}
@inproceedings{247154787,
title = {UnifiedQA-v2: Stronger Generalization via Broader Cross-Format Training},
author = {{Daniel Khashabi} and {Yeganeh Kordi} and {Hannaneh Hajishirzi}},
year = 2022,
month = {2},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/5b44101b2372a33ec06e15ce4d20ad9a15518325},
}
@inproceedings{246239741,
title = {Characterizing the Details of Spatial Construction: Cognitive Constraints and Variability},
author = {{A. Shelton} and {E. Davis} and {Cathryn S. Cortesa} and {Jonathan D. Jones} and {Gregory Hager} and {S. Khudanpur} and {B. Landau}},
year = 2022,
month = {1},
booktitle = {Cognitive Sciences},
url = {https://www.semanticscholar.org/paper/6482f52977f167c6db734f766b0b59e8c92d7e52},
}
@inproceedings{248300043,
title = {Fast AdvProp},
author = {{Jieru Mei} and {Yucheng Han} and {Yutong Bai} and {Yixiao Zhang} and {Yingwei Li} and {Xianhang Li} and {A. Yuille} and {Cihang Xie}},
year = 2022,
month = {4},
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/f2eaaf8afc89a86035fd7127305f2bb9d2169495},
}
@inproceedings{246872267,
title = {Learning from Synthetic Vehicles},
author = {{Tae Soo Kim} and {Bohoon Shim} and {Michael Peven} and {Weichao Qiu} and {A. Yuille} and {Gregory Hager}},
year = 2022,
month = {1},
booktitle = {2022 IEEE/CVF Winter Conference on Applications of Computer Vision Workshops (WACVW)},
url = {https://www.semanticscholar.org/paper/b5ac4931672397df6d9135e0d5b615351f490a44},
}
@inproceedings{249386629,
title = {A dilemma of ground truth in noisy speech separation and an approach to lessen the impact of imperfect training data},
author = {{Matthew Maciejewski} and {Jing Shi} and {Shinji Watanabe} and {S. Khudanpur}},
year = 2022,
month = {6},
booktitle = {Computer Speech and Language},
url = {https://www.semanticscholar.org/paper/e3b6ab2d2e1a0e734bf505fbb34dc6fe723ab37e},
}
@inproceedings{254125621,
title = {Localization vs. Semantics: How Can Language Benefit Visual Representation Learning?},
author = {{Zhuowan Li} and {Cihang Xie} and {Benjamin Van Durme} and {Alan Yuille Johns Hopkins University} and {U. California} and {Santa Cruz}},
year = 2022,
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/970a8ed9de244b080aa69dbf5996a37057909ca6},
}
@inproceedings{248562546,
title = {Differentially Private Generalized Linear Models Revisited},
author = {{R. Arora} and {Raef Bassily} and {Crist'obal Guzm'an} and {Michael Menart} and {Enayat Ullah}},
year = 2022,
month = {5},
booktitle = {Neural Information Processing Systems},
url = {https://www.semanticscholar.org/paper/7c8634be409d59c15b717cc1dc8f696289617e89},
}
@inproceedings{254017908,
title = {JAWS: Auditing Predictive Uncertainty Under Covariate Shift},
author = {{Drew Prinster} and {Anqi Liu} and {S. Saria}},
year = 2022,
month = {7},
booktitle = {Neural Information Processing Systems},
url = {https://www.semanticscholar.org/paper/4fb13897dad166844ca020e3cef1563b8dc81775},
}
@inproceedings{252337895,
title = {Dealing with Unknowns in Continual Learning for End-to-end Automatic Speech Recognition},
author = {{Martin Sustek} and {Samik Sadhu} and {H. Hermansky}},
year = 2022,
month = {9},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/dea2103e2b666413670b3f5c81a2e3ca318ea2d4},
}
@inproceedings{247958394,
title = {SwapMix: Diagnosing and Regularizing the Over-Reliance on Visual Context in Visual Question Answering},
author = {{Vipul Gupta} and {Zhuowan Li} and {Adam Kortylewski} and {Chenyu Zhang} and {Yingwei Li} and {A. Yuille}},
year = 2022,
month = {4},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/0d2f848fff121133b3b77c7e691c6a2ba502be47},
}
@inproceedings{251622408,
title = {PDRF: Progressively Deblurring Radiance Field for Fast and Robust Scene Reconstruction from Blurry Images},
author = {{Cheng Peng} and {R. Chellappa}},
year = 2022,
month = {8},
booktitle = {AAAI Conference on Artificial Intelligence},
url = {https://www.semanticscholar.org/paper/c900f690fdab5d17b0253d4362e7f1a7d9d2d495},
}
@inproceedings{260444131,
title = {Mention Annotations Alone Enable Efficient Domain Adaptation for Coreference Resolution},
author = {{Nupoor Gandhi} and {Anjalie Field} and {Emma Strubell}},
year = 2022,
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/43f09be116b87046334d395a71919ab423b204a1},
}
@inproceedings{250463643,
title = {Real Number Modeling of a SAR ADC behavior using SystemVerilog},
author = {{Christos Sapsanis} and {M. Villemur} and {A. Andreou}},
year = 2022,
month = {6},
booktitle = {International Conference on Synthesis, Modeling, Analysis and Simulation Methods and Applications to Circuit Design},
url = {https://www.semanticscholar.org/paper/528b50e00ed3efece80bbc4557ecf4f8df98094a},
}
@inproceedings{248069457,
title = {AdvEst: Adversarial Perturbation Estimation to Classify and Detect Adversarial Attacks against Speaker Identification},
author = {{Sonal Joshi} and {Saurabh Kataria} and {J. Villalba} and {N. Dehak}},
year = 2022,
month = {4},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/a8144dbb8481cb78e08fc34e452603984bb5aa01},
}
@inproceedings{263625818,
title = {Beyond the Imitation Game: Quantifying and extrapolating the capabilities of language models},
author = {{Aarohi Srivastava} and {Abhinav Rastogi} and {Abhishek Rao} and {Abu Awal Md Shoeb} and {Abubakar Abid} and {Adam Fisch} and {Adam R. Brown} and {Adam Santoro} and {Aditya Gupta} and {Adrià Garriga-Alonso} and {Agnieszka Kluska} and {Aitor Lewkowycz} and {Akshat Agarwal} and {Alethea Power} and {Alex Ray} and {Alex Warstadt} and {Alexander W. Kocurek} and {Ali Safaya} and {Ali Tazarv} and {Alice Xiang} and {Alicia Parrish} and {Allen Nie} and {Aman Hussain} and {Amanda Askell} and {Amanda Dsouza} and {Ambrose Slone} and {Ameet Rahane} and {Anantharaman S. Iyer} and {Anders Andreassen} and {Andrea Madotto} and {Andrea Santilli} and {Andreas Stuhlmuller} and {Andrew M. Dai} and {Andrew La} and {Andrew Kyle Lampinen} and {Andy Zou} and {Angela Jiang} and {Angelica Chen} and {Anh Vuong} and {Animesh Gupta} and {Anna Gottardi} and {Antonio Norelli} and {Anu Venkatesh} and {Arash Gholamidavoodi} and {Arfa Tabassum} and {Arul Menezes} and {Arun Kirubarajan} and {A. Mullokandov} and {Ashish Sabharwal} and {Austin Herrick} and {Avia Efrat} and {Aykut Erdem} and {Ayla Karakacs} and {B. R. Roberts} and {B. S. Loe} and {Barret Zoph} and {Bartlomiej Bojanowski} and {Batuhan Ozyurt} and {Behnam Hedayatnia} and {Behnam Neyshabur} and {Benjamin Inden} and {Benno Stein} and {Berk Ekmekci} and {Bill Yuchen Lin} and {B. Howald} and {Bryan Orinion} and {Cameron Diao} and {Cameron Dour} and {Catherine Stinson} and {Cedrick Argueta} and {C'esar Ferri Ram'irez} and {Chandan Singh} and {Charles Rathkopf} and {Chenlin Meng} and {Chitta Baral} and {Chiyu Wu} and {Chris Callison-Burch} and {Chris Waites} and {Christian Voigt} and {Christopher D. Manning} and {Christopher Potts} and {Cindy Ramirez} and {Clara E. Rivera} and {Clemencia Siro} and {Colin Raffel} and {Courtney Ashcraft} and {Cristina Garbacea} and {Damien Sileo} and {Daniel H Garrette} and {Dan Hendrycks} and {D. Kilman} and {Dan Roth} and {Daniel Freeman} and {Daniel Khashabi} and {Daniel Levy} and {D. Gonz'alez} and {Danielle R. Perszyk} and {Danny Hernandez} and {Danqi Chen} and {Daphne Ippolito} and {D. Gilboa} and {David Dohan} and {D. Drakard} and {David Jurgens} and {Debajyoti Datta} and {Deep Ganguli} and {Denis Emelin} and {Denis Kleyko} and {Deniz Yuret} and {Derek Chen} and {Derek Tam} and {Dieuwke Hupkes} and {Diganta Misra} and {Dilyar Buzan} and {Dimitri Coelho Mollo} and {Diyi Yang} and {Dong-Ho Lee} and {Dylan Schrader} and {Ekaterina Shutova} and {E. D. Cubuk} and {Elad Segal} and {Eleanor Hagerman} and {Elizabeth Barnes} and {E. Donoway} and {Ellie Pavlick} and {E. Rodolà} and {Emma Lam} and {Eric Chu} and {Eric Tang} and {Erkut Erdem} and {Ernie Chang} and {Ethan A. Chi} and {Ethan Dyer} and {E. Jerzak} and {Ethan Kim} and {Eunice Engefu Manyasi} and {Evgenii Zheltonozhskii} and {Fanyue Xia} and {F. Siar} and {Fernando Mart'inez-Plumed} and {Francesca Happ'e} and {François Chollet} and {Frieda Rong} and {Gaurav Mishra} and {Genta Indra Winata} and {Gerard de Melo} and {Germán Kruszewski} and {Giambattista Parascandolo} and {Giorgio Mariani} and {Gloria Xinyue Wang} and {Gonzalo Jaimovitch-L'opez} and {Gregor Betz} and {Guy Gur-Ari} and {Hana Galijasevic} and {Hannah Kim} and {Hannah Rashkin} and {Hannaneh Hajishirzi} and {Harsh Mehta} and {H. Bogar} and {Henry Shevlin} and {Hinrich Schutze} and {H. Yakura} and {Hongming Zhang} and {Hugh Mee Wong} and {Ian Ng} and {Isaac Noble} and {Jaap Jumelet} and {Jack Geissinger} and {John Kernion} and {Jacob Hilton} and {Jaehoon Lee} and {J. Fisac} and {James B. Simon} and {James Koppel} and {James Zheng} and {James Zou} and {Jan Koco'n} and {Jana Thompson} and {Janelle Wingfield} and {Jared Kaplan} and {Jarema Radom} and {Jascha Narain Sohl-Dickstein} and {Jason Phang} and {Jason Wei} and {J. Yosinski} and {Jekaterina Novikova} and {Jelle Bosscher} and {Jennifer Marsh} and {Jeremy Kim} and {Jeroen Taal} and {Jesse Engel} and {Jesujoba Oluwadara Alabi} and {Jiacheng Xu} and {Jiaming Song} and {Jillian Tang} and {Jane W Waweru} and {John Burden} and {John Miller} and {John U. Balis} and {Jonathan Batchelder} and {Jonathan Berant} and {Jorg Frohberg} and {Jos Rozen} and {J. Hernández-Orallo} and {Joseph Boudeman} and {Joseph Guerr} and {Joseph Jones} and {Joshua B. Tenenbaum} and {Joshua S. Rule} and {Joyce Chua} and {Kamil Kanclerz} and {Karen Livescu} and {K. Krauth} and {Karthik Gopalakrishnan} and {Katerina Ignatyeva} and {K. Markert} and {Kaustubh D. Dhole} and {Kevin Gimpel} and {Kevin Omondi} and {K. Mathewson} and {Kristen Chiafullo} and {Ksenia Shkaruta} and {K. Shridhar} and {Kyle McDonell} and {Kyle Richardson} and {Laria Reynolds} and {Leo Gao} and {Li Zhang} and {Liam Dugan} and {Lianhui Qin} and {Lidia Contreras-Ochando} and {Louis-Philippe Morency} and {Luca Moschella} and {Luca Lam} and {Lucy Noble} and {Ludwig Schmidt} and {Luheng He} and {Luis Oliveros Col'on} and {Luke Metz} and {Lutfi Kerem cSenel} and {Maarten Bosma} and {Maarten Sap} and {Maartje ter Hoeve} and {Maheen Farooqi} and {Manaal Faruqui} and {Mantas Mazeika} and {Marco Baturan} and {Marco Marelli} and {Marco Maru} and {Maria Jose Ram’irez Quintana} and {M. Tolkiehn} and {Mario Giulianelli} and {Martha Lewis} and {Martin Potthast} and {Matthew L. Leavitt} and {Matthias Hagen} and {M. Schubert} and {Medina Baitemirova} and {Melody Arnaud} and {M. McElrath} and {Michael A. Yee} and {Michael Cohen} and {Michael Gu} and {Michael Ivanitskiy} and {Michael Starritt} and {M. Strube} and {Michal Swkedrowski} and {Michele Bevilacqua} and {Michihiro Yasunaga} and {Mihir Kale} and {Mike Cain} and {Mimee Xu} and {Mirac Suzgun} and {Mitch Walker} and {Monica Tiwari} and {Mohit Bansal} and {Moin Aminnaseri} and {Mor Geva} and {Mozhdeh Gheini} and {T. MukundVarma} and {Nanyun Peng} and {Nathan A. Chi} and {Nayeon Lee} and {Neta Gur-Ari Krakover} and {Nicholas Cameron} and {Nicholas Roberts} and {Nick Doiron} and {Nicole Martinez} and {Nikita Nangia} and {Niklas Deckers} and {Niklas Muennighoff} and {N. Keskar} and {Niveditha Iyer} and {Noah Constant} and {Noah Fiedel} and {Nuan Wen} and {Oliver Zhang} and {Omar Agha} and {Omar Elbaghdadi} and {Omer Levy} and {Owain Evans} and {Pablo Antonio Moreno Casares} and {P. Doshi} and {Pascale Fung} and {P. Liang} and {Paul Vicol} and {Pegah Alipoormolabashi} and {Peiyuan Liao} and {Percy Liang} and {Peter Chang} and {P. Eckersley} and {Phu Mon Htut} and {P. Hwang} and {P. Milkowski} and {P. Patil} and {Pouya Pezeshkpour} and {Priti Oli} and {Qiaozhu Mei} and {Qing Lyu} and {Qinlang Chen} and {Rabin Banjade} and {Rachel Etta Rudolph} and {Raefer Gabriel} and {Rahel Habacker} and {Ramon Risco} and {Raphael Milliere} and {Rhythm Garg} and {Richard Barnes} and {R. Saurous} and {Riku Arakawa} and {Robbe Raymaekers} and {Robert Frank} and {Rohan Sikand} and {Roman Novak} and {Roman Sitelew} and {Ronan Le Bras} and {Rosanne Liu} and {Rowan Jacobs} and {Rui Zhang} and {R. Salakhutdinov} and {Ryan Chi} and {Ryan Lee} and {Ryan Stovall} and {Ryan Teehan} and {Rylan Yang} and {Sahib Singh} and {Saif Mohammad} and {Sajant Anand} and {Sam Dillavou} and {Sam Shleifer} and {Sam Wiseman} and {Samuel Gruetter} and {Samuel R. Bowman} and {S. Schoenholz} and {Sanghyun Han} and {Sanjeev Kwatra} and {Sarah A. Rous} and {Sarik Ghazarian} and {Sayan Ghosh} and {Sean Casey} and {Sebastian Bischoff} and {Sebastian Gehrmann} and {Sebastian Schuster} and {Sepideh Sadeghi} and {Shadi S. Hamdan} and {Sharon Zhou} and {Shashank Srivastava} and {Sherry Shi} and {Shikhar Singh} and {Shima Asaadi} and {S. Gu} and {Shubh Pachchigar} and {Shubham Toshniwal} and {Shyam Upadhyay} and {Shyamolima Debnath} and {Siamak Shakeri} and {Simon Thormeyer} and {S. Melzi} and {Siva Reddy} and {S. Makini} and {Soo-Hwan Lee} and {Spencer Bradley Torene} and {Sriharsha Hatwar} and {S. Dehaene} and {Stefan Divic} and {Stefano Ermon} and {Stella Biderman} and {Stephanie Lin} and {Stephen Prasad} and {Steven T Piantadosi} and {Stuart M. Shieber} and {Summer Misherghi} and {S. Kiritchenko} and {Swaroop Mishra} and {Tal Linzen} and {Tal Schuster} and {Tao Li} and {Tao Yu} and {Tariq Ali} and {Tatsunori Hashimoto} and {Te-Lin Wu} and {T. Desbordes} and {Theodore Rothschild} and {Thomas Phan} and {Tianle Wang} and {Tiberius Nkinyili} and {Timo Schick} and {T. Kornev} and {T. Tunduny} and {Tobias Gerstenberg} and {T. Chang} and {Trishala Neeraj} and {Tushar Khot} and {Tyler Shultz} and {Uri Shaham} and {Vedant Misra} and {Vera Demberg} and {Victoria Nyamai} and {Vikas Raunak} and {V. Ramasesh} and {Vinay Uday Prabhu} and {Vishakh Padmakumar} and {Vivek Srikumar} and {W. Fedus} and {W. Saunders} and {William Zhang} and {Wout Vossen} and {Xiang Ren} and {Xiaoyu Tong} and {Xinran Zhao} and {Xinyi Wu} and {Xudong Shen} and {Yadollah Yaghoobzadeh} and {Yair Lakretz} and {Yangqiu Song} and {Yasaman Bahri} and {Yejin Choi} and {Yichi Yang} and {Yiding Hao} and {Yifu Chen} and {Yonatan Belinkov} and {Yu Hou} and {Yu Hou} and {Yuntao Bai} and {Zachary Seid} and {Zhuoye Zhao} and {Zijian Wang} and {Zijie J. Wang} and {Zirui Wang} and {Ziyi Wu}},
year = 2022,
month = {6},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/bd1331b233e84bab7eba503abc60b31ac08e7881},
}
@inproceedings{250340438,
title = {Learning to Enrich Query Representation with Pseudo-Relevance Feedback for Cross-lingual Retrieval},
author = {{Ramraj Chandradevan} and {Eugene Yang} and {M. Yarmohammadi} and {Eugene Agichtein}},
year = 2022,
month = {7},
booktitle = {Annual International ACM SIGIR Conference on Research and Development in Information Retrieval},
url = {https://www.semanticscholar.org/paper/f0c4f3cb741548c70a4db105fee227fc4f59dfd2},
}
@inproceedings{247318765,
title = {3SD: Self-Supervised Saliency Detection With No Labels},
author = {{R. Yasarla} and {Renliang Weng} and {Wongun Choi} and {Vishal M. Patel} and {Amir Sadeghian}},
year = 2022,
month = {3},
booktitle = {IEEE Workshop/Winter Conference on Applications of Computer Vision},
url = {https://www.semanticscholar.org/paper/2a78e1c0412cbcc851ba60224c15c501debe2049},
}
@inproceedings{252368348,
title = {T2V-DDPM: Thermal to Visible Face Translation using Denoising Diffusion Probabilistic Models},
author = {{Nithin Gopalakrishnan Nair} and {Vishal M. Patel}},
year = 2022,
month = {9},
booktitle = {IEEE International Conference on Automatic Face & Gesture Recognition},
url = {https://www.semanticscholar.org/paper/fc49634e80ab31929799786a97b7ea63834bbdb1},
}
@inproceedings{252045737,
title = {Research gaps and opportunities in precision nutrition: an NIH workshop report.},
author = {{Bruce Y Lee} and {J. Ordovás} and {E. Parks} and {Cheryl Anderson} and {A. Barabási} and {S. Clinton} and {K. de la Haye} and {V. Duffy} and {P. Franks} and {Elizabeth M Ginexi} and {K. Hammond} and {Erin C. Hanlon} and {Michael Hittle} and {E. Ho} and {A. Horn} and {R. Isaacson} and {P. Mabry} and {S. Malone} and {Corby K. Martin} and {J. Mattei} and {S. Meydani} and {Lorene M. Nelson} and {M. Neuhouser} and {Brendan Parent} and {N. Pronk} and {H. Roche} and {S. Saria} and {F. Scheer} and {E. Segal} and {M. Sevick} and {T. Spector} and {Linda Van Horn} and {K. Varady} and {V. S. Voruganti} and {Marie F Martinez}},
year = 2022,
month = {9},
booktitle = {American Journal of Clinical Nutrition},
url = {https://www.semanticscholar.org/paper/31b65b7ccc0ed5ba975753c8b0ba8da8df28a09c},
}
@inproceedings{252186400,
title = {Embedding-Enhanced GIZA++: Improving Low-Resource Word Alignment Using Embeddings},
author = {{Kelly Marchisio} and {Conghao Xiong} and {Philipp Koehn}},
year = 2022,
booktitle = {Conference of the Association for Machine Translation in the Americas},
url = {https://www.semanticscholar.org/paper/4768c7f83f1c4fbb4fd98d9b4237ab483a8bc4b2},
}
@inproceedings{251762249,
title = {Morphological, Object Detection Framework for Embedded, Event-based Sensing},
author = {{M. Villemur} and {Jonah P. Sengupta} and {P. Julián} and {A. Andreou}},
year = 2022,
month = {6},
booktitle = {International Conference on Event-Based Control, Communication, and Signal Processing},
url = {https://www.semanticscholar.org/paper/dc774c02c8260a15a0098b2a193b7b5db7e3fdb1},
}
@inproceedings{259692914,
title = {kMaX-DeepLab: k-means Mask Transformer},
author = {{Qihang Yu} and {Huiyu Wang} and {Siyuan Qiao} and {Maxwell D. Collins} and {Yukun Zhu} and {Hartwig Adam} and {A. Yuille} and {Liang-Chieh Chen}},
year = 2022,
month = {7},
booktitle = {},
url = {https://www.semanticscholar.org/paper/5f3c2a31fc84d13a72008f70106163bd92f2f9d0},
}
@inproceedings{252346611,
title = {End-to-End Neural Speaker Diarization with an Iterative Refinement of Non-Autoregressive Attention-based Attractors},
author = {{Magdalena Rybicka} and {J. Villalba} and {N. Dehak} and {K. Kowalczyk}},
year = 2022,
month = {9},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/916cfa98c48af9931559fe0d8953bcaf7bdf7f2c},
}
@inproceedings{248227361,
title = {Revisiting Consistency Regularization for Semi-supervised Change Detection in Remote Sensing Images},
author = {{W. G. C. Bandara} and {Vishal M. Patel}},
year = 2022,
month = {4},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/d27fcbf42787d90a8afc76bf0598960fbb58b060},
}
@inproceedings{246823296,
title = {Open-Set Adversarial Defense with Clean-Adversarial Mutual Learning},
author = {{Rui Shao} and {Pramuditha Perera} and {P. Yuen} and {Vishal M. Patel}},
year = 2022,
month = {2},
booktitle = {International Journal of Computer Vision},
url = {https://www.semanticscholar.org/paper/bce77cb22110eaf52438cf03b8668b875c699c46},
}
@inproceedings{249953553,
title = {DDPM-CD: Denoising Diffusion Probabilistic Models as Feature Extractors for Change Detection},
author = {{W. G. C. Bandara} and {Nithin Gopalakrishnan Nair} and {Vishal M. Patel}},
year = 2022,
month = {6},
booktitle = {},
url = {https://www.semanticscholar.org/paper/f278eaffb6ee792858ecdcb7209986542d018269},
}
@inproceedings{249877931,
title = {Supplementary Materials: ”TransMix: Attend to Mix for Vision Transformers”},
author = {{Jieneng Chen} and {Shuyang Sun} and {Ju He} and {Philip H. S. Torr} and {A. Yuille} and {Song Bai}},
year = 2022,
booktitle = {},
url = {https://www.semanticscholar.org/paper/d378dc21ab5cfbde24b295ab759c9947f820bc94},
}
@inproceedings{251766132,
title = {An analysis of emotions and the prominence of positivity in #BlackLivesMatter tweets},
author = {{Anjalie Field} and {Chan Young Park} and {Antônio Theóphilo} and {J. Watson-Daniels} and {Yulia Tsvetkov}},
year = 2022,
month = {8},
booktitle = {Proceedings of the National Academy of Sciences of the United States of America},
url = {https://www.semanticscholar.org/paper/6dadf66d41b5c5bf4ce8f49fce38bc4f44889246},
}
@inproceedings{249209486,
title = {SAR Despeckling Using Overcomplete Convolutional Networks},
author = {{Malsha V. Perera} and {W. G. C. Bandara} and {Jeya Maria Jose Valanarasu} and {Vishal M. Patel}},
year = 2022,
month = {5},
booktitle = {IEEE International Geoscience and Remote Sensing Symposium},
url = {https://www.semanticscholar.org/paper/c4911e20fb50f6da552c812bda9ef4fdb525b939},
}
@inproceedings{253513495,
title = {Appendix for k -means Mask Transformer},
author = {{Qihang Yu} and {Huiyu Wang} and {Siyuan Qiao} and {Maxwell D. Collins} and {Yukun Zhu} and {Hartwig Adam} and {A. Yuille} and {Liang-Chieh Chen}},
year = 2022,
booktitle = {},
url = {https://www.semanticscholar.org/paper/46bfaa37e8b95f6bff810e5563d67e3404e78225},
}
@inproceedings{252165718,
title = {Implications of clinical variability on computer-aided lung auscultation classification},
author = {{A. Kala} and {E. McCollum} and {Mounya Elhilali}},
year = 2022,
month = {7},
booktitle = {Annual International Conference of the IEEE Engineering in Medicine and Biology Society},
url = {https://www.semanticscholar.org/paper/f97aa46f0602e85f4254933ad709f8fd1a4ab35f},
}
@inproceedings{248377080,
title = {Unsupervised Restoration of Weather-affected Images using Deep Gaussian Process-based CycleGAN},
author = {{R. Yasarla} and {Vishwanath A. Sindagi} and {Vishal M. Patel}},
year = 2022,
month = {4},
booktitle = {International Conference on Pattern Recognition},
url = {https://www.semanticscholar.org/paper/ee48b57139e1d84c60926796195f5f77c2d8b1db},
}
@inproceedings{248476149,
title = {Por Qué Não Utiliser Alla Språk? Mixed Training with Gradient Optimization in Few-Shot Cross-Lingual Transfer},
author = {{Haoran Xu} and {Kenton Murray}},
year = 2022,
month = {4},
booktitle = {NAACL-HLT},
url = {https://www.semanticscholar.org/paper/811a5c79d8c0f6f5b57697e7be0e84b5f9a94ce8},
}
@inproceedings{248832471,
title = {A bias evaluation checklist for predictive models and its pilot application for 30-day hospital readmission models},
author = {{H. E. Echo Wang} and {M. Landers} and {R. Adams} and {Adarsh Subbaswamy} and {Hadi Kharrazi} and {D. Gaskin} and {S. Saria}},
year = 2022,
month = {5},
booktitle = {J. Am. Medical Informatics Assoc.},
url = {https://www.semanticscholar.org/paper/cdb65bc7700f365cf5ff152b6f3cb7434d9ad7e8},
}
@inproceedings{253833423,
title = {A Random Forest Genomic Classifier for Tumor Agnostic Prediction of Response to Anti-PD1 Immunotherapy},
author = {{Emma Bigelow} and {S. Saria} and {B. Piening} and {B. Curti} and {A. Dowdell} and {R. Weerasinghe} and {C. Bifulco} and {W. Urba} and {N. Finkelstein} and {E. Fertig} and {A. Baras} and {N. Zaidi} and {E. Jaffee} and {M. Yarchoan}},
year = 2022,
month = {1},
booktitle = {Cancer Informatics},
url = {https://www.semanticscholar.org/paper/a407bd6bae19371a8d3c92da0981aaf1e80b382e},
}
@inproceedings{250918749,
title = {In Defense of Online Models for Video Instance Segmentation},
author = {{Junfeng Wu} and {Qihao Liu} and {Yi Jiang} and {S. Bai} and {A. Yuille} and {Xiang Bai}},
year = 2022,
month = {7},
booktitle = {European Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/65edfa85e5e665d51540a2c7ae1bcb6381793f68},
}
@inproceedings{251018520,
title = {JAWS: Predictive Inference Under Covariate Shift},
author = {{Drew Prinster} and {Anqi Liu} and {S. Saria}},
year = 2022,
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/e9b0db3dae9050413e3eda2861acf82bff41624b},
}
@inproceedings{247922750,
title = {Importance of Different Temporal Modulations of Speech: a Tale of two Perspectives},
author = {{Samik Sadhu} and {H. Hermansky}},
year = 2022,
month = {3},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/3ce501d4d81d9a78c2e506df7f6de0d79ca91a5b},
}
@inproceedings{247594586,
title = {Enriching Unsupervised User Embedding via Medical Concepts},
author = {{Xiaolei Huang} and {Franck Dernoncourt} and {Mark Dredze}},
year = 2022,
month = {3},
booktitle = {ACM Conference on Health, Inference, and Learning},
url = {https://www.semanticscholar.org/paper/78a4f90b348f5401e8fb6b84bca0e539142b2530},
}
@inproceedings{258588228,
title = {Representation Projection Invariance Mitigates Representation Collapse},
author = {{Anastasia Razdaibiedina} and {A. Khetan} and {Zohar S. Karnin} and {Daniel Khashabi} and {Vishaal Kapoor} and {V. Madan}},
year = 2022,
month = {5},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/3746b0e7370784d5242dc9d3fc3fd3853a34409b},
}
@inproceedings{216914509,
title = {The 6th AI City Challenge},
author = {{M. Naphade} and {Shuo Wang} and {D. Anastasiu} and {Zheng Tang} and {Ming-Ching Chang} and {Xiaodong Yang} and {Liang Zheng} and {Anuj Sharma} and {R. Chellappa} and {Pranamesh Chakraborty}},
year = 2022,
month = {4},
booktitle = {2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)},
url = {https://www.semanticscholar.org/paper/7f489232a16a54fa2b11d5758101f078f9db797c},
}
@inproceedings{251223772,
title = {Explicit Occlusion Reasoning for Multi-person 3D Human Pose Estimation},
author = {{Qihao Liu} and {Yi Zhang} and {S. Bai} and {A. Yuille}},
year = 2022,
month = {7},
booktitle = {European Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/79743618fd9bc1e249e8b9df6ddde77b5e29e84f},
}
@inproceedings{266876125,
title = {BenchCLAMP: A Benchmark for Evaluating Language Models on Syntactic and Semantic Parsing},
author = {{Subhro Roy} and {Sam Thomson} and {Tongfei Chen} and {Richard Shin} and {Adam Pauls} and {Jason Eisner} and {Benjamin Van Durme} and {Microsoft Semantic Machines} and {Scaled Cognition}},
year = 2022,
month = {6},
booktitle = {Neural Information Processing Systems},
url = {https://www.semanticscholar.org/paper/95e2f656017f9ec5d9cd411b1f744b278131ce6c},
}
@inproceedings{248239720,
title = {A Comparison of Different Atmospheric Turbulence Simulation Methods for Image Restoration},
author = {{Nithin Gopalakrishnan Nair} and {Kangfu Mei} and {Vishal M. Patel}},
year = 2022,
month = {4},
booktitle = {International Conference on Information Photonics},
url = {https://www.semanticscholar.org/paper/be3eb6827c645f176e204dffb5d740e5281dd67c},
}
@inproceedings{247318941,
title = {Towards performant and reliable undersampled MR reconstruction via diffusion model sampling},
author = {{Cheng Peng} and {Pengfei Guo} and {S. K. Zhou} and {Vishal M. Patel} and {Ramalingam Chellappa}},
year = 2022,
month = {3},
booktitle = {International Conference on Medical Image Computing and Computer-Assisted Intervention},
url = {https://www.semanticscholar.org/paper/be60e95fabbe3469d1ec3556c8a8c3efca56b7c8},
}
@inproceedings{245877805,
title = {SparseDet: Improving Sparsely Annotated Object Detection with Pseudo-positive Mining},
author = {{Sai Saketh Rambhatla} and {Saksham Suri} and {R. Chellappa} and {Abhinav Shrivastava}},
year = 2022,
month = {1},
booktitle = {IEEE International Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/7f71d5804fe434168643babc616a76eb65d5882e},
}
@inproceedings{249827199,
title = {Advances in Cross-Lingual and Cross-Source Audio-Visual Speaker Recognition: The JHU-MIT System for NIST SRE21},
author = {{J. Villalba} and {B. J. Borgstrom} and {Saurabh Kataria} and {Magdalena Rybicka} and {C. Castillo} and {Jaejin Cho} and {Leibny Paola García-Perera} and {P. Torres-Carrasquillo} and {N. Dehak}},
year = 2022,
month = {6},
booktitle = {The Speaker and Language Recognition Workshop},
url = {https://www.semanticscholar.org/paper/9d9b5b782cbaf98bfb198b120c343d813c99ecf5},
}
@inproceedings{249538421,
title = {SAR Despeckling Using a Denoising Diffusion Probabilistic Model},
author = {{Malsha V. Perera} and {Nithin Gopalakrishnan Nair} and {W. G. C. Bandara} and {Vishal M. Patel}},
year = 2022,
month = {6},
booktitle = {IEEE Geoscience and Remote Sensing Letters},
url = {https://www.semanticscholar.org/paper/946e217f0e734561ac0acd8b58063ca882c963df},
}
@inproceedings{252547478,
title = {A Study of Pre-trained Language Models for Analogy Generation},
author = {{Tom B. Brown} and {Benjamin Mann} and {Nick Ryder} and {Jared D Subbiah} and {Prafulla Kaplan} and {A. Dhariwal} and {Chris Callison-Burch} and {Miles Osborne} and {J. Devlin} and {Ming-Wei Chang} and {Kenton Lee} and {Daniel Khashabi} and {Sewon Min} and {Tushar Khot}},
year = 2022,
booktitle = {},
url = {https://www.semanticscholar.org/paper/d7a5b73532635b6fa429c634519c70935887cf26},
}
@inproceedings{253461961,
title = {Embedded Processing Pipeline Exploration For Neuromorphic Event Based Perceptual Systems},
author = {{Jonah P. Sengupta} and {M. Villemur} and {P. Pouliquen} and {P. Julián} and {A. Andreou}},
year = 2022,
month = {5},
booktitle = {International Symposium on Circuits and Systems},
url = {https://www.semanticscholar.org/paper/42845a69a8efd8e8dc7b697c3ce0a4a8f6dfae86},
}
@inproceedings{248505905,
title = {Learn To Remember: Transformer with Recurrent Memory for Document-Level Machine Translation},
author = {{Yukun Feng} and {Feng Li} and {Ziang Song} and {Boyuan Zheng} and {Philipp Koehn}},
year = 2022,
month = {5},
booktitle = {NAACL-HLT},
url = {https://www.semanticscholar.org/paper/4293121e2bef84aa8db5aab6634cfcd2d06947d4},
}
@inproceedings{245827791,
title = {Code-Switching Text Augmentation for Multilingual Speech Processing},
author = {{A. Hussein} and {S. A. Chowdhury} and {Ahmed Abdelali} and {N. Dehak} and {Ahmed M. Ali}},
year = 2022,
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/be5074a85ef8166fc173cb51971a2e3f79685134},
}
@inproceedings{252519938,
title = {The FELIX Project: Deep Networks To Detect Pancreatic Neoplasms},
author = {{Y. Xia} and {Q. Yu} and {L. Chu} and {S. Kawamoto} and {S. Park} and {F. Liu} and {J. Chen} and {Z. Zhu} and {B. Li} and {Z. Zhou} and {Y. Lu} and {Y. Wang} and {W. Shen} and {L. Xie} and {Y. Zhou} and {elliot k fishman} and {A. Javed} and {D. Fouladi} and {S. Shayesteh} and {J. Graves} and {A. Blanco} and {E. Zinreich} and {B. Kinny-Koster} and {K. Kinzler} and {R. Hruban} and {B. Vogelstein} and {A. Yuille} and {E. Fishman}},
year = 2022,
month = {9},
booktitle = {medRxiv},
url = {https://www.semanticscholar.org/paper/3167cedfe031711fa832f5ba48519357923ac0c7},
}
@inproceedings{249437208,
title = {Time-Balanced Focal Loss for Audio Event Detection},
author = {{Sangwook Park} and {Mounya Elhilali}},
year = 2022,
month = {5},
booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing},
url = {https://www.semanticscholar.org/paper/62b7aa0300a9ebc3d494629579a4a051874b82a8},
}
@inproceedings{249062873,
title = {Asking the Right Questions in Low Resource Template Extraction},
author = {{Nils Holzenberger} and {Yunmo Chen} and {Benjamin Van Durme}},
year = 2022,
month = {5},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/196b71b4e8465dd632954cf499f0467754cbd9d4},
}
@inproceedings{248227391,
title = {Benchmarking Generalization via In-Context Instructions on 1, 600+ Language Tasks},
author = {{Yizhong Wang} and {Swaroop Mishra} and {Pegah Alipoormolabashi} and {Yeganeh Kordi} and {Amirreza Mirzaei} and {Anjana Arunkumar} and {Arjun Ashok} and {Arut Selvan Dhanasekaran} and {Atharva Naik} and {David Stap} and {Eshaan Pathak} and {Giannis Karamanolakis} and {H. Lai} and {I. Purohit} and {Ishani Mondal} and {Jacob Anderson} and {Kirby Kuznia} and {Krima Doshi} and {Maitreya Patel} and {Kuntal Kumar Pal} and {M. Moradshahi} and {Mihir Parmar} and {Mirali Purohit} and {Neeraj Varshney} and {Phani Rohitha Kaza} and {Pulkit Verma} and {Ravsehaj Singh Puri} and {Rushang Karia} and {Shailaja Keyur Sampat} and {Savan Doshi} and {Siddhartha Mishra} and {Sujan Reddy} and {Sumanta Patro} and {Tanay Dixit} and {Xudong Shen} and {Chitta Baral} and {Yejin Choi} and {Hannaneh Hajishirzi} and {Noah A. Smith} and {Daniel Khashabi}},
year = 2022,
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/ec64e324ce1210fe5245dfd0fb5a92058732e5b9},
}
@inproceedings{255750913,
title = {R-SSL: Region based Semi-Supervised Learning for Sparsely Annotated Object Detection},
author = {{Saksham Suri} and {Saketh Rambhatla} and {R. Chellappa} and {Abhinav Shrivastava}},
year = 2022,
booktitle = {},
url = {https://www.semanticscholar.org/paper/e2e159205030b9d3e3d742b4bdbebd7e94201d3f},
}
@inproceedings{246595318,
title = {Multiuser Scheduling in Centralized Cognitive Radio Networks: A Multi-Armed Bandit Approach},
author = {{Amir Alipour-Fanid} and {Monireh Dabaghchian} and {R. Arora} and {K. Zeng}},
year = 2022,
month = {6},
booktitle = {IEEE Transactions on Cognitive Communications and Networking},
url = {https://www.semanticscholar.org/paper/ad0c8cc0a80c5873591e62ca9f47fa21b631c35f},
}
@inproceedings{249795778,
title = {A Novel Dual-band filtenna for 2.4 and 5.8 GHz Wireless Local Area for Network Applications},
author = {{Harminder Singh} and {R. Sharma} and {R. Arora}},
year = 2022,
month = {2},
booktitle = {2022 Interdisciplinary Research in Technology and Management (IRTM)},
url = {https://www.semanticscholar.org/paper/a773c6edcc796c34a4cd477d6a39043cab45d037},
}
@inproceedings{256665944,
title = {Application of Natural Language Processing to Identify Social Needs from The Electronic Health Record's Free-Text Notes},
author = {{Geoffrey M. Gray} and {L. Ahumada} and {Ayah Zirikly} and {Masoud Rouhizadeh} and {Tom M. Richards} and {E. Hatef}},
year = 2022,
booktitle = {American Medical Informatics Association Annual Symposium},
url = {https://www.semanticscholar.org/paper/9b579eeb9351a75c1c491f22f28ae36bdadded28},
}
@inproceedings{248118691,
title = {Large-Scale Streaming End-to-End Speech Translation with Neural Transducers},
author = {{Jian Xue} and {Peidong Wang} and {Jinyu Li} and {Matt Post} and {Yashesh Gaur}},
year = 2022,
month = {4},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/5a5704382fd8c980937e10618713d641c846b313},
}
@inproceedings{208391943,
title = {Pre-hospital caloric deficits in surgical patients.},
author = {{J. Sadeghi} and {Kevin Duh} and {G. Sugiyama} and {V. Patel} and {G. Coppa} and {R. Barrera}},
year = 2022,
month = {7},
booktitle = {Nutrition and Health},
url = {https://www.semanticscholar.org/paper/cfee21939b8a016ed3d947607940dc9a0ccf8b0c},
}
@inproceedings{249276757,
title = {Informatics Research on Mental Health Functioning: Decision Support for the Social Security Administration Disability Program.},
author = {{H. Goldman} and {Julia Porcino} and {Guy Divita} and {Ayah Zirikly} and {Bart Desmet} and {Maryanne Sacco} and {E. Marfeo} and {Christine M. McDonough} and {E. Rasch} and {L. Chan}},
year = 2022,
month = {6},
booktitle = {Psychiatric Services},
url = {https://www.semanticscholar.org/paper/99410edf5a03b98ff66fa16e86bc39412fefa2e6},
}
@inproceedings{248887310,
title = {On Trace of PGD-Like Adversarial Attacks},
author = {{Mo Zhou} and {Vishal M. Patel}},
year = 2022,
month = {5},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/90d02089aaf88b621880a036a2cc4c5924f7102c},
}
@inproceedings{250953863,
title = {Factors driving provider adoption of the TREWS machine learning-based early warning system and its effects on sepsis treatment timing},
author = {{K. Henry} and {R. Adams} and {Cassandra Parent} and {Hossein Soleimani} and {A. Sridharan} and {Lauren Johnson} and {D. Hager} and {S. Cosgrove} and {Andrew Markowski} and {E. Klein} and {E. Chen} and {M. Saheed} and {Maureen Henley} and {S. Miranda} and {Katrina Houston} and {Robert C. Linton} and {Anushree R Ahluwalia} and {Albert W. Wu} and {S. Saria}},
year = 2022,
month = {7},
booktitle = {Nature Network Boston},
url = {https://www.semanticscholar.org/paper/4cf1afc1e27d26a77aca58d7a5ec7fe3d6b7ffad},
}
@inproceedings{249848080,
title = {Orientation-guided Graph Convolutional Network for Bone Surface Segmentation},
author = {{Aimon Rahman} and {W. G. C. Bandara} and {Jeya Maria Jose Valanarasu} and {I. Hacihaliloglu} and {Vishal M. Patel}},
year = 2022,
month = {6},
booktitle = {International Conference on Medical Image Computing and Computer-Assisted Intervention},
url = {https://www.semanticscholar.org/paper/bdcd82545a729552d83ed920bd117718c9f6948f},
}
@inproceedings{246294754,
title = {Discovering Phonetic Inventories with Crosslingual Automatic Speech Recognition},
author = {{Piotr Żelasko} and {Siyuan Feng} and {Laureano Moro Velázquez} and {A. Abavisani} and {Saurabhchand Bhati} and {O. Scharenborg} and {M. Hasegawa-Johnson} and {N. Dehak}},
year = 2022,
month = {1},
booktitle = {Computer Speech and Language},
url = {https://www.semanticscholar.org/paper/9da09ca7192a7546728575b2c0dfb923a36f110f},
}
@inproceedings{250954558,
title = {Prospective, multi-site study of patient outcomes after implementation of the TREWS machine learning-based early warning system for sepsis},
author = {{R. Adams} and {K. Henry} and {A. Sridharan} and {Hossein Soleimani} and {A. Zhan} and {Nishi Rawat} and {Lauren Johnson} and {D. Hager} and {S. Cosgrove} and {Andrew Markowski} and {E. Klein} and {E. Chen} and {M. Saheed} and {Maureen Henley} and {S. Miranda} and {Katrina Houston} and {Robert C. Linton} and {Anushree R Ahluwalia} and {Albert W. Wu} and {S. Saria}},
year = 2022,
month = {7},
booktitle = {Nature Network Boston},
url = {https://www.semanticscholar.org/paper/9ad55e7b87e1557983bdef0e9fe7eb0f4254dd94},
}
@inproceedings{248085083,
title = {Towards Online Domain Adaptive Object Detection},
author = {{VS Vibashan} and {Poojan Oza} and {Vishal M. Patel}},
year = 2022,
month = {4},
booktitle = {IEEE Workshop/Winter Conference on Applications of Computer Vision},
url = {https://www.semanticscholar.org/paper/ae1a767e40ce43b3cdcc2440a91dfe4a77cad901},
}
@inproceedings{247244749,
title = {HyperTransformer: A Textural and Spectral Feature Fusion Transformer for Pansharpening},
author = {{W. G. C. Bandara} and {Vishal M. Patel}},
year = 2022,
month = {3},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/0477780c61e668c47630ae1cd74cee55c2493b5f},
}
@inproceedings{246996539,
title = {Exploring Adversarially Robust Training for Unsupervised Domain Adaptation},
author = {{Shao-Yuan Lo} and {Vishal M. Patel}},
year = 2022,
month = {2},
booktitle = {Asian Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/1329a9e14f6454227dfb584a57a910ef168f6a7d},
}
@inproceedings{247447734,
title = {Auto-FedRL: Federated Hyperparameter Optimization for Multi-institutional Medical Image Segmentation},
author = {{Pengfei Guo} and {Dong Yang} and {Ali Hatamizadeh} and {An Xu} and {Ziyue Xu} and {Wenqi Li} and {Can Zhao} and {Daguang Xu} and {S. Harmon} and {E. Turkbey} and {B. Turkbey} and {B. Wood} and {F. Patella} and {Elvira Stellato} and {G. Carrafiello} and {Vishal M. Patel} and {H. Roth}},
year = 2022,
month = {3},
booktitle = {European Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/ea8889c3bbca75fcdd71ba60068df014dfb7d861},
}
@inproceedings{249209554,
title = {VoGE: A Differentiable Volume Renderer using Gaussian Ellipsoids for Analysis-by-Synthesis},
author = {{Angtian Wang} and {Peng Wang} and {Jian Sun} and {Adam Kortylewski} and {A. Yuille}},
year = 2022,
month = {5},
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/31e79b62a9483dcdf2575603469e6ff888e7f234},
}
@inproceedings{259840482,
title = {Assembling Existing Labels from Public Datasets to Diagnose Novel Diseases: COVID-19 in Late 2019},
author = {{Zengle Zhu} and {Mintong Kang} and {A. Yuille} and {Zongwei Zhou}},
year = 2022,
booktitle = {},
url = {https://www.semanticscholar.org/paper/5e9e11dbe87d01e44fc3a4e68d151f2a2809f261},
}
@inproceedings{247291930,
title = {Enhance Language Identification using Dual-mode Model with Knowledge Distillation},
author = {{Hexin Liu} and {Leibny Paola García Perera} and {Andy W. H. Khong} and {J. Dauwels} and {S. Styles} and {S. Khudanpur}},
year = 2022,
month = {3},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/b238287cad4bf831f1f7600207e967b95620017d},
}
@inproceedings{252531266,
title = {Investigating self-supervised learning for lyrics recognition},
author = {{Xiangyu Zhang} and {Zhanhong He} and {Shuyu Li} and {R. Togneri} and {Leibny Paola García-Perera}},
year = 2022,
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/6632436fd0a465c7b1399c503396233eb9d88b0e},
}
@inproceedings{253107926,
title = {Challenges and Opportunities in Information Manipulation Detection: An Examination of Wartime Russian Media},
author = {{Chan Young Park} and {Julia Mendelsohn} and {Anjalie Field} and {Yulia Tsvetkov}},
year = 2022,
month = {5},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/b616154578751e156b21561e1a5d5ed833a3506f},
}
@inproceedings{249394670,
title = {Online Neural Diarization of Unlimited Numbers of Speakers Using Global and Local Attractors},
author = {{Shota Horiguchi} and {Shinji Watanabe} and {Leibny Paola García-Perera} and {Yuki Takashima} and {Y. Kawaguchi}},
year = 2022,
month = {6},
booktitle = {IEEE/ACM Transactions on Audio Speech and Language Processing},
url = {https://www.semanticscholar.org/paper/872c99ead3cc2644fbabd7dab37b82d233cc81cb},
}
@inproceedings{247778633,
title = {Instance Relation Graph Guided Source-Free Domain Adaptive Object Detection},
author = {{VS Vibashan} and {Poojan Oza} and {Vishal M. Patel}},
year = 2022,
month = {3},
booktitle = {Computer Vision and Pattern Recognition},
url = {https://www.semanticscholar.org/paper/c850d77f3ce8e8fa989cc4f7b466b63b113fd6db},
}
@inproceedings{260443047,
title = {When Not to Trust Language Models: Investigating Effectiveness and Limitations of Parametric and Non-Parametric Memories},
author = {{Alex Troy Mallen} and {Akari Asai} and {Victor Zhong} and {Rajarshi Das} and {Hannaneh Hajishirzi} and {Daniel Khashabi}},
year = 2022,
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/7b0f98f51040700aae3cd9f0e3432dedcd69fb30},
}
@inproceedings{247762191,
title = {Data Selection Curriculum for Neural Machine Translation},
author = {{Tasnim Mohiuddin} and {Philipp Koehn} and {Vishrav Chaudhary} and {James Cross} and {Shruti Bhosale} and {Shafiq R. Joty}},
year = 2022,
month = {3},
booktitle = {Conference on Empirical Methods in Natural Language Processing},
url = {https://www.semanticscholar.org/paper/d6c4b31958fe9e4ff4f83e049ed5c6881653eb03},
}
@inproceedings{248218560,
title = {Scalable and Real-time Multi-Camera Vehicle Detection, Re-Identification, and Tracking},
author = {{Pirazh Khorramshahi} and {Vineet Shenoy} and {M. Pack} and {R. Chellappa}},
year = 2022,
month = {4},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/0babd241088a1d84dec824c9749c93a3e20fd583},
}
@inproceedings{252533374,
title = {Cross-Lingual Speaker Identification from Weak Local Evidence},
author = {{Thomas Wolf} and {Lysandre Debut} and {Julien Victor Sanh} and {Clement Chaumond} and {Anthony Delangue} and {Pier-339 Moi} and {Clara ric Cistac} and {Yacine Ma} and {Julien Jernite} and {Plu} and {Teven Xu} and {Sylvain Le Scao} and {Gugger} and {Mariama} and {Quentin Drame} and {M. LhoestAlexander} and {Rush} and {Michael Miller Yoder} and {Sopan Khosla} and {Qinlan Shen} and {Ben Zhou} and {Qiang Ning} and {Daniel Khashabi} and {Kyle Richardson} and {Tushar Khot}},
year = 2022,
booktitle = {},
url = {https://www.semanticscholar.org/paper/385b71fb56b54b019b855ff0265bbdbb01ad01ea},
}
@inproceedings{248069341,
title = {Defense against Adversarial Attacks on Hybrid Speech Recognition using Joint Adversarial Fine-tuning with Denoiser},
author = {{Sonal Joshi} and {Saurabh Kataria} and {Yiwen Shao} and {Piotr Żelasko} and {J. Villalba} and {S. Khudanpur} and {N. Dehak}},
year = 2022,
month = {4},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/49011d1b139bbb65fe273fd9e4b2197cee237385},
}
@inproceedings{247058662,
title = {COLD Decoding: Energy-based Constrained Text Generation with Langevin Dynamics},
author = {{Lianhui Qin} and {S. Welleck} and {Daniel Khashabi} and {Yejin Choi}},
year = 2022,
month = {2},
booktitle = {Neural Information Processing Systems},
url = {https://www.semanticscholar.org/paper/4a6a65968a8eb8c09ffb57a7774ddabb596565b1},
}
@inproceedings{261102271,
title = {Conference on Health, Inference, and Learning (CHIL) 2022},
author = {{Gerardo Flores} and {George H. Chen} and {T. Pollard} and {Ayah Zirikly} and {Michael C. Hughes} and {Tasmie Sarker} and {Joyce Ho} and {Tristan Naumann}},
year = 2022,
booktitle = {ACM Conference on Health, Inference, and Learning},
url = {https://www.semanticscholar.org/paper/20d7a0ea43dfc3c086fd41ca90f8885ea892f965},
}
@inproceedings{251710281,
title = {A Risk-Sensitive Approach to Policy Optimization},
author = {{Jared Markowitz} and {Ryan W. Gardner} and {Ashley J. Llorens} and {R. Arora} and {I-J. Wang}},
year = 2022,
month = {8},
booktitle = {AAAI Conference on Artificial Intelligence},
url = {https://www.semanticscholar.org/paper/2a1b41221def527e17eb1ca04f4f32442fa09ba7},
}
@inproceedings{250644264,
title = {Deep Semantic Statistics Matching (D2SM) Denoising Network},
author = {{Kangfu Mei} and {Vishal M. Patel} and {Rui Huang}},
year = 2022,
month = {7},
booktitle = {European Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/19f83c24c56904754be700247b416cee704d5738},
}
@inproceedings{252211999,
title = {Robust Category-Level 6D Pose Estimation with Coarse-to-Fine Rendering of Neural Features},
author = {{Wufei Ma} and {Angtian Wang} and {A. Yuille} and {Adam Kortylewski}},
year = 2022,
month = {9},
booktitle = {European Conference on Computer Vision},
url = {https://www.semanticscholar.org/paper/efa699cba13396c1b6d05a0dea9840020d29ae57},
}
@inproceedings{252683281,
title = {Blind Signal Dereverberation for Machine Speech Recognition},
author = {{Samik Sadhu} and {H. Hermansky}},
year = 2022,
month = {9},
booktitle = {arXiv.org},
url = {https://www.semanticscholar.org/paper/d2fda509740eede59e46892958531088f3f25aed},
}
@inproceedings{251936798,
title = {Medicine 2032: The future of cardiovascular disease prevention with machine learning and digital health technology},
author = {{A. Javaid} and {Fawzi Zghyer} and {Chang H Kim} and {Erin M. Spaulding} and {Nino Isakadze} and {Jie Ding} and {Daniel Kargillis} and {Yumin Gao} and {Faisal Rahman} and {Donald E. Brown} and {S. Saria} and {Seth S. Martin} and {C. Kramer} and {R. Blumenthal} and {F. Marvel}},
year = 2022,
month = {8},
booktitle = {American Journal of Preventive Cardiology},
url = {https://www.semanticscholar.org/paper/fe2f3307cb21f446a2e1272a008b2938cfd3d402},
}
@inproceedings{251539930,
title = {Author Correction: Regenerative and restorative medicine for eye disease},
author = {{B. Vasey} and {M. Nagendran} and {Bruce Campbell} and {D. Clifton} and {Gary S. Collins} and {Spiros C. Denaxas} and {A. Denniston} and {L. Faes} and {B. Geerts} and {Mudathir Ibrahim} and {Xiaoxuan Liu} and {B. Mateen} and {P. Mathur} and {M. Mccradden} and {L. Morgan} and {Johan Ordish} and {Campbell Rogers} and {S. Saria} and {D. Ting} and {P. Watkinson} and {W. Weber} and {P. Wheatstone} and {P. McCulloch}},
year = 2022,
month = {8},
booktitle = {Nature Network Boston},
url = {https://www.semanticscholar.org/paper/a22215acadb4ad4ec04624025021023acf7261d6},
}
@inproceedings{248890002,
title = {Reporting guideline for the early-stage clinical evaluation of decision support systems driven by artificial intelligence: DECIDE-AI},
author = {{B. Vasey} and {M. Nagendran} and {Bruce Campbell} and {D. Clifton} and {Gary S. Collins} and {Spiros C. Denaxas} and {A. Denniston} and {L. Faes} and {B. Geerts} and {Mudathir Ibrahim} and {Xiaoxuan Liu} and {B. Mateen} and {P. Mathur} and {M. Mccradden} and {L. Morgan} and {Johan Ordish} and {Campbell Rogers} and {S. Saria} and {D. Ting} and {P. Watkinson} and {W. Weber} and {P. Wheatstone} and {P. McCulloch}},
year = 2022,
month = {5},
booktitle = {Nature Network Boston},
url = {https://www.semanticscholar.org/paper/83b6a76ba5112d27bdbfca3efd2ed918d8e73db5},
}
@inproceedings{247476364,
title = {Interactive Portrait Harmonization},
author = {{Jeya Maria Jose Valanarasu} and {He Zhang} and {Jianming Zhang} and {Yilin Wang} and {Zhe Lin} and {J. Echevarria} and {Yinglan Ma} and {Zijun Wei} and {Kalyan Sunkavalli} and {Vishal M. Patel}},
year = 2022,
month = {3},
booktitle = {International Conference on Learning Representations},
url = {https://www.semanticscholar.org/paper/c423c8ef2d8101676a4c2ba403ad5970c0364f09},
}
@inproceedings{252346818,
title = {Defense against Adversarial Attacks on Hybrid Speech Recognition System using Adversarial Fine-tuning with Denoiser},
author = {{Sonal Joshi} and {Saurabh Kataria} and {Yiwen Shao} and {Piotr Żelasko} and {J. Villalba} and {S. Khudanpur} and {N. Dehak}},
year = 2022,
month = {9},
booktitle = {Interspeech},
url = {https://www.semanticscholar.org/paper/b8c3c97f239a1048b460d659a14110cc7f7a499e},
}
@inproceedings{248006370,
title = {Thermal to Visible Image Synthesis Under Atmospheric Turbulence},
author = {{Kangfu Mei} and {Yiqun Mei} and {Vishal M. Patel}},
year = 2022,
month = {4},
booktitle = {International Conference on Information Photonics},
url = {https://www.semanticscholar.org/paper/0a123eb1a768cc151ff9ebb004cc2461414a53a3},
}
@inproceedings{251224367,
title = {Learning Feature Decomposition for Domain Adaptive Monocular Depth Estimation},
author = {{Shao-Yuan Lo} and {Wei Wang} and {Jim Thomas} and {Jingjing Zheng} and {Vishal M. Patel} and {Cheng-Hao Kuo}},
year = 2022,
month = {7},
booktitle = {IEEE/RJS International Conference on Intelligent RObots and Systems},
url = {https://www.semanticscholar.org/paper/c28582e042a0bb482517ef844d5a3a6794f994f6},
}
@inproceedings{252333098,
title = {Addressing the 'coin flip model' and the role of 'process of care' variables in the analysis of TREWS},
author = {{R. Adams} and {K. Henry} and {S. Saria}},
year = 2022,
month = {9},
booktitle = {medRxiv},
url = {https://www.semanticscholar.org/paper/39383cc7a62fdd63e05873096d7283d5f1b90d59},
}