← Home Page
Publications
David Chiang.
Transformers in uniform TC\(^0\).
arXiv:2409.13629.
PDF
BibTeX
@misc{chiang:2024,
  author = {Chiang, David},
  title  = {Transformers in Uniform {TC$^0$}},
  year   = {2024},
  url    = {https://arxiv.org/abs/2409.13629},
  note   = {{arXiv}:2409.13629},
}
Andy Yang, David Chiang, and Dana Angluin.
Masked hard-attention transformers recognize exactly the star-free languages.
In
Proc. NeurIPS. 2024.
To appear.
PDF
BibTeX
@inproceedings{angluin+:2024,
  author    = {Yang, Andy and Chiang, David and Angluin, Dana},
  title     = {Masked Hard-Attention Transformers Recognize Exactly the Star-Free Languages},
  booktitle = {Proc. NeurIPS},
  year      = {2024},
  url       = {https://arxiv.org/abs/2310.13897},
  note      = {To appear},
}
Yuhi Matogawa, Yusuke Sakai, Taro Watanabe, and Chihiro Taguchi.
Japanese rule-based grapheme-to-phoneme conversion system and multilingual named entity dataset with international phonetic alphabet.
In Garrett Nicolai, Eleanor Chodroff, Frederic Mailhot, and Çağrı Çöltekin, editors,
Proc. SIGMORPHON workshop on Computational Research in Phonetics, Phonology, and Morphology, 77–86. 2024.
doi:10.18653/v1/2024.sigmorphon-1.9.
PDF
BibTeX
@inproceedings{matogawa-etal-2024-japanese,
  author    = {Matogawa, Yuhi and Sakai, Yusuke and Watanabe, Taro and Taguchi, Chihiro},
  editor    = {Nicolai, Garrett and Chodroff, Eleanor and Mailhot, Frederic and {\c{C}}{\"o}ltekin, {\c{C}}a{\u{g}}r{\i}},
  title     = {{J}apanese Rule-based Grapheme-to-phoneme Conversion System and Multilingual Named Entity Dataset with International Phonetic Alphabet},
  booktitle = {Proc. SIGMORPHON workshop on Computational Research in Phonetics, Phonology, and Morphology},
  pages     = {77--86},
  year      = {2024},
  doi       = {10.18653/v1/2024.sigmorphon-1.9},
  url       = {https://aclanthology.org/2024.sigmorphon-1.9},
}
Ken Sible and David Chiang.
Improving rare word translation with dictionaries and attention masking.
In
Proc. AMTA. 2024.
PDF
BibTeX
@inproceedings{sible-chiang-2024,
  author    = {Sible, Ken and Chiang, David},
  title     = {Improving Rare Word Translation With Dictionaries and Attention Masking},
  booktitle = {Proc. AMTA},
  year      = {2024},
  url       = {https://arxiv.org/abs/2408.09075},
}
Andy Yang and David Chiang.
Counting like transformers: compiling temporal counting logic into softmax transformers.
In
Proc. CoLM. 2024.
PDF
BibTeX
@inproceedings{yang-chiang-2024-counting,
  author    = {Yang, Andy and Chiang, David},
  title     = {Counting Like Transformers: Compiling Temporal Counting Logic Into Softmax Transformers},
  booktitle = {Proc. CoLM},
  year      = {2024},
  url       = {https://openreview.net/forum?id=FmhPg4UJ9K},
}
Aarohi Srivastava and David Chiang.
We're calling an intervention: taking a closer look at language model adaptation to different types of linguistic variation.
2024.
arXiv:2404.07304.
PDF
BibTeX
@misc{srivastava-chiang-2024,
  author = {Srivastava, Aarohi and Chiang, David},
  title  = {We're Calling an Intervention: Taking a Closer Look at Language Model Adaptation to Different Types of Linguistic Variation},
  year   = {2024},
  url    = {https://arxiv.org/abs/2404.07304},
  note   = {arXiv:2404.07304},
}
Lena Strobl, Dana Angluin, David Chiang, Jonathan Rawski, and Ashish Sabharwal.
Transformers as transducers.
Transactions of the Association for Computational Linguistics, 2024.
To appear.
PDF
BibTeX
@article{strobl-etal-2024-transducers,
  author  = {Strobl, Lena and Angluin, Dana and Chiang, David and Rawski, Jonathan and Sabharwal, Ashish},
  title   = {Transformers as Transducers},
  journal = {Transactions of the Association for Computational Linguistics},
  year    = {2024},
  url     = {https://arxiv.org/abs/2404.02040},
  note    = {To appear},
}
Tatsuya Aoyama, Chihiro Taguchi, and Nathan Schneider.
J-SNACS: adposition and case supersenses for Japanese joshi.
In
Proc. LREC-COLING, 9604–9614. 2024.
PDF
BibTeX
@inproceedings{aoyama-etal-2024-j-snacs,
  author    = {Aoyama, Tatsuya and Taguchi, Chihiro and Schneider, Nathan},
  title     = {{J}-{SNACS}: Adposition and Case Supersenses for {J}apanese Joshi},
  booktitle = {Proc. LREC-COLING},
  pages     = {9604--9614},
  year      = {2024},
  url       = {https://aclanthology.org/2024.lrec-main.839},
}
Jonathan Washington, Çağrı Çöltekin, Furkan Akkurt, Bermet Chontaeva, Soudabeh Eslami, Gulnura Jumalieva, Aida Kasieva, Aslı Kuzgun, Büşra Marşan, and Chihiro Taguchi.
Strategies for the annotation of pronominalised locatives in Turkic Universal Dependency treebanks.
In
Proc. Joint Workshop on Multiword Expressions and Universal Dependencies, 207–219. 2024.
PDF
BibTeX
@inproceedings{washington-etal-2024-strategies,
  author    = {Washington, Jonathan and {\c{C}}{\"o}ltekin, {\c{C}}a{\u{g}}r{\i} and Akkurt, Furkan and Chontaeva, Bermet and Eslami, Soudabeh and Jumalieva, Gulnura and Kasieva, Aida and Kuzgun, Asl{\i} and Mar{\c{s}}an, B{\"u}{\c{s}}ra and Taguchi, Chihiro},
  title     = {Strategies for the Annotation of Pronominalised Locatives in {T}urkic {U}niversal {D}ependency Treebanks},
  booktitle = {Proc. Joint Workshop on Multiword Expressions and Universal Dependencies},
  pages     = {207--219},
  year      = {2024},
  url       = {https://aclanthology.org/2024.mwe-1.25},
}
Chihiro Taguchi and Jefferson Saransig.
Non-discourse-configurationality in Imbabura Kichwa.
Proceedings of the Linguistic Society of America, 2024.
doi:10.3765/plsa.v9i1.5687.
DOI
BibTeX
@article{taguchi-saransig-2024,
  author  = {Taguchi, Chihiro and Saransig, Jefferson},
  title   = {Non-discourse-configurationality in {I}mbabura {K}ichwa},
  journal = {Proceedings of the Linguistic Society of America},
  volume  = {9},
  number  = {1},
  year    = {2024},
  doi     = {10.3765/plsa.v9i1.5687},
}
Chihiro Taguchi and David Chiang.
Language complexity and speech recognition accuracy: orthographic complexity hurts, phonological complexity doesn't.
In
Proc. ACL. 2024.
Outstanding Paper Award and Senior Area Chair Award.
PDF
BibTeX
@inproceedings{taguchi-chiang-2024-complexity,
  author    = {Taguchi, Chihiro and Chiang, David},
  title     = {Language Complexity and Speech Recognition Accuracy: Orthographic Complexity Hurts, Phonological Complexity Doesn't},
  booktitle = {Proc. ACL},
  year      = {2024},
  url       = {https://aclanthology.org/2024.acl-long.827/},
}
Fahim Faisal, Orevaoghene Ahia, Aarohi Srivastava, Kabir Ahuja, David Chiang, Yulia Tsvetkov, and Antonios Anastasopoulos.
DIALECTBENCH: a NLP benchmark for dialects, varieties, and closely-related languages.
In
Proc. ACL. 2024.
Social Impact Award.
PDF
BibTeX
@inproceedings{faisal+:2024,
  author    = {Faisal, Fahim and Ahia, Orevaoghene and Srivastava, Aarohi and Ahuja, Kabir and Chiang, David and Tsvetkov, Yulia and Anastasopoulos, Antonios},
  title     = {{DIALECTBENCH}: A {NLP} Benchmark for Dialects, Varieties, and Closely-Related Languages},
  booktitle = {Proc. ACL},
  year      = {2024},
  url       = {https://aclanthology.org/2024.acl-long.777/},
}
Stephen Bothwell, Brian DuSell, David Chiang, and Brian Krostenko.
PILA: a historical-linguistic dataset of Proto-Italic and Latin.
In
Proc. LREC-COLING, 12749–12760. 2024.
PDF
BibTeX
@inproceedings{bothwell+:2024,
  author    = {Bothwell, Stephen and DuSell, Brian and Chiang, David and Krostenko, Brian},
  title     = {{PILA}: A Historical-Linguistic Dataset of {P}roto-{I}talic and {L}atin},
  booktitle = {Proc. LREC-COLING},
  pages     = {12749--12760},
  year      = {2024},
  url       = {https://aclanthology.org/2024.lrec-main.1116/},
}
Chihiro Taguchi, Jefferson Saransig, Dayana Velásquez, and David Chiang.
KILLKAN: the automatic speech recognition dataset for Kichwa with morphosyntactic information.
In
Proc. LREC-COLING, 9753–9763. 2024.
PDF
BibTeX
@inproceedings{taguchi+:2024,
  author    = {Taguchi, Chihiro and Saransig, Jefferson and Vel{\'a}squez, Dayana and Chiang, David},
  title     = {{KILLKAN}: The Automatic Speech Recognition Dataset for {K}ichwa with Morphosyntactic Information},
  booktitle = {Proc. LREC-COLING},
  pages     = {9753--9763},
  year      = {2024},
  url       = {https://aclanthology.org/2024.lrec-main.852/},
}
Stephen Bothwell, Abigail Swenor, and David Chiang.
Nostra Domina at EvaLatin 2024: improving Latin polarity detection through data augmentation.
In
Proc. Workshop on Language Technologies for Historical and Ancient Languages, 215–222. 2024.
PDF
BibTeX
@inproceedings{bothwell-etal-2024-nostra,
  author    = {Bothwell, Stephen and Swenor, Abigail and Chiang, David},
  title     = {{N}ostra {D}omina at {E}va{L}atin 2024: Improving {L}atin Polarity Detection through Data Augmentation},
  booktitle = {Proc. Workshop on Language Technologies for Historical and Ancient Languages},
  pages     = {215--222},
  year      = {2024},
  url       = {https://aclanthology.org/2024.lt4hala-1.25},
}
Lena Strobl, William Merrill, Gail Weiss, David Chiang, and Dana Angluin.
What formal languages can transformers express?
A survey.
Transactions of the Association for Computational Linguistics, 12:543–561, 2024.
doi:10.1162/tacl_a_00663.
DOI
BibTeX
@article{strobl-etal-2024-survey,
  author  = {Strobl, Lena and Merrill, William and Weiss, Gail and Chiang, David and Angluin, Dana},
  title   = {What Formal Languages Can Transformers Express? {A} Survey},
  journal = {Transactions of the Association for Computational Linguistics},
  volume  = {12},
  pages   = {543--561},
  year    = {2024},
  doi     = {10.1162/tacl\_a\_00663},
}
Brian DuSell and David Chiang.
Stack attention: improving the ability of transformers to model hierarchical patterns.
In
Proc. ICLR. 2024.
Spotlight paper.
PDF
BibTeX
@inproceedings{dusell+chiang:2024attention,
  author    = {DuSell, Brian and Chiang, David},
  title     = {Stack Attention: Improving the Ability of Transformers to Model Hierarchical Patterns},
  booktitle = {Proc. ICLR},
  year      = {2024},
  url       = {https://openreview.net/pdf?id=XVhm3X8Fum},
}
Stephen Bothwell, Justin DeBenedetto, Theresa Crnkovich, Hildegund Müller, and David Chiang.
Introducing rhetorical parallelism detection: a new task with datasets, metrics, and baselines.
In
Proc. EMNLP, 5007–5039. 2023.
doi:10.18653/v1/2023.emnlp-main.305.
PDF
BibTeX
@inproceedings{bothwell+:2023,
  author    = {Bothwell, Stephen and DeBenedetto, Justin and Crnkovich, Theresa and M{\"u}ller, Hildegund and Chiang, David},
  title     = {Introducing Rhetorical Parallelism Detection: A New Task with Datasets, Metrics, and Baselines},
  booktitle = {Proc. EMNLP},
  pages     = {5007--5039},
  year      = {2023},
  doi       = {10.18653/v1/2023.emnlp-main.305},
  url       = {https://aclanthology.org/2023.emnlp-main.305},
}
Alexandra Butoi, Tim Vieira, Ryan Cotterell, and David Chiang.
Efficient algorithms for recognizing weighted tree-adjoining languages.
In
Proc. EMNLP. 2023.
PDF
BibTeX
@inproceedings{butoi+:2023efficient,
  author    = {Butoi, Alexandra and Vieira, Tim and Cotterell, Ryan and Chiang, David},
  title     = {Efficient Algorithms for Recognizing Weighted Tree-Adjoining Languages},
  booktitle = {Proc. EMNLP},
  year      = {2023},
  url       = {https://aclanthology.org/2023.emnlp-main.328/},
}
Aarohi Srivastava and David Chiang.
BERTwich: extending BERT's capabilities to model dialectal and noisy text.
In
Findings of ACL: EMNLP. 2023.
PDF
BibTeX
@inproceedings{srivastava+chiang:2023,
  author    = {Srivastava, Aarohi and Chiang, David},
  title     = {{BERTwich}: Extending {BERT}'s Capabilities to Model Dialectal and Noisy Text},
  booktitle = {Findings of ACL: EMNLP},
  year      = {2023},
  url       = {https://aclanthology.org/2023.findings-emnlp.1037/},
}
Chihiro Taguchi.
Japanese gapless relativization: the syntax-prosody interface to semantics.
In
Proc. Lexical-Functional Grammar Conference. 2023.
PDF
BibTeX
@inproceedings{taguchi:2023,
  author    = {Taguchi, Chihiro},
  title     = {{J}apanese Gapless Relativization: The Syntax-Prosody Interface to Semantics},
  booktitle = {Proc. Lexical-Functional Grammar Conference},
  year      = {2023},
  url       = {https://sas.rochester.edu/cls/lfg23/wp-content/uploads/2023/06/CT-LFG23-abstract.pdf},
}
Chihiro Taguchi, Yusuke Sakai, Parisa Haghani, and David Chiang.
Universal automatic phonetic transcription into the International Phonetic Alphabet.
In
Proc. INTERSPEECH. 2023.
doi:10.21437/Interspeech.2023-2584.
PDF
BibTeX
@inproceedings{taguchi+:2023,
  author    = {Taguchi, Chihiro and Sakai, Yusuke and Haghani, Parisa and Chiang, David},
  title     = {Universal Automatic Phonetic Transcription into the {I}nternational {P}honetic {A}lphabet},
  booktitle = {Proc. INTERSPEECH},
  year      = {2023},
  doi       = {10.21437/Interspeech.2023-2584},
  url       = {https://arxiv.org/abs/2308.03917},
}
Alexandra Butoi, Ryan Cotterell, and David Chiang.
Convergence and diversity in the control hierarchy.
In
Proc. ACL. 2023.
PDF
BibTeX
@inproceedings{butoi+:2023convergence,
  author    = {Butoi, Alexandra and Cotterell, Ryan and Chiang, David},
  title     = {Convergence and Diversity in the Control Hierarchy},
  booktitle = {Proc. ACL},
  year      = {2023},
  url       = {https://aclanthology.org/2023.acl-long.420/},
}
David Chiang, Peter Cholak, and Anand Pillay.
Tighter bounds on the expressivity of transformer encoders.
In
Proc. ICML, 5544–5562. 2023.
PDF
BibTeX
@inproceedings{chiang+cholak+pillay:2023,
  author    = {Chiang, David and Cholak, Peter and Pillay, Anand},
  title     = {Tighter Bounds on the Expressivity of Transformer Encoders},
  booktitle = {Proc. ICML},
  pages     = {5544--5562},
  year      = {2023},
  url       = {https://proceedings.mlr.press/v202/chiang23a.html},
}
Aarohi Srivastava and David Chiang.
Fine-tuning BERT with character-level noise for zero-shot transfer to dialects and closely-related languages.
In
Proc. Workshop on NLP for Similar Languages, Varieties and Dialects. 2023.
PDF
BibTeX
@inproceedings{srivastava+chiang:2023fine,
  author    = {Srivastava, Aarohi and Chiang, David},
  title     = {Fine-Tuning {BERT} with Character-Level Noise for Zero-Shot Transfer to Dialects and Closely-Related Languages},
  booktitle = {Proc. Workshop on NLP for Similar Languages, Varieties and Dialects},
  year      = {2023},
  url       = {https://aclanthology.org/2023.vardial-1.16/},
}
Patrick Soga and David Chiang.
Bridging graph position encodings for transformers with weighted graph-walking automata.
Transactions on Machine Learning Research, 2023.
PDF
BibTeX
@article{soga+chiang:2023,
  author  = {Soga, Patrick and Chiang, David},
  title   = {Bridging Graph Position Encodings for Transformers with Weighted Graph-Walking Automata},
  journal = {Transactions on Machine Learning Research},
  year    = {2023},
  url     = {https://openreview.net/pdf?id=tE2NiMGd07},
}
Brian DuSell and David Chiang.
The surprising computational power of nondeterministic stack RNNs.
In
Proc. ICLR. 2023.
PDF
BibTeX
@inproceedings{dusell+chiang:2023surprising,
  author    = {DuSell, Brian and Chiang, David},
  title     = {The Surprising Computational Power of Nondeterministic Stack {RNN}s},
  booktitle = {Proc. ICLR},
  year      = {2023},
  url       = {https://openreview.net/pdf?id=o58JtGDs6y},
}
David Chiang, Colin McDonald, and Chung-chieh Shan.
Exact recursive probabilistic programming.
PACMPL, 2023.
doi:10.1145/3586050.
PDF
BibTeX
@article{chiang+mcdonald+shan:2023,
  author  = {Chiang, David and McDonald, Colin and Shan, Chung-chieh},
  title   = {Exact Recursive Probabilistic Programming},
  journal = {PACMPL},
  volume  = {7},
  number  = {OOPSLA1},
  article = {98},
  year    = {2023},
  xmonth  = {April},
  doi     = {10.1145/3586050},
  url     = {https://dl.acm.org/doi/10.1145/3586050},
}
Chihiro Taguchi and David Chiang.
Introducing morphology in Universal Dependencies Japanese.
In
Proc. Workshop on Universal Dependencies, 65–72. 2023.
PDF
BibTeX
@inproceedings{taguchi+chiang:2023,
  author    = {Taguchi, Chihiro and Chiang, David},
  title     = {Introducing Morphology in {U}niversal {D}ependencies {J}apanese},
  booktitle = {Proc. Workshop on Universal Dependencies},
  pages     = {65--72},
  year      = {2023},
  url       = {https://aclanthology.org/2023.udw-1.8},
}
David Chiang, Alexander M. Rush, and Boaz Barak.
Named tensor notation.
Transactions on Machine Learning Research, January 2023.
PDF
BibTeX
@article{chiang+rush+barak:2023,
  author  = {Chiang, David and Rush, Alexander M. and Barak, Boaz},
  title   = {Named Tensor Notation},
  journal = {Transactions on Machine Learning Research},
  year    = {2023},
  month   = jan,
  url     = {https://openreview.net/pdf?id=hVT7SHlilx},
}
Chihiro Taguchi.
Mermaid constructions in Lexical Functional Grammar.
In
Proc. LFG, 365–384. 2022.
PDF
BibTeX
@inproceedings{taguchi:2022,
  author    = {Taguchi, Chihiro},
  title     = {Mermaid Constructions in {L}exical {F}unctional {G}rammar},
  booktitle = {Proc. LFG},
  pages     = {365--384},
  year      = {2022},
  url       = {https://ojs.ub.uni-konstanz.de/lfg/index.php/main/article/view/19},
}
Darcey Riley and David Chiang.
A continuum of generation tasks for investigating length bias and degenerate repetition.
In
Proc. BlackboxNLP. 2022.
PDF
BibTeX
@inproceedings{riley+chiang:2022,
  author    = {Riley, Darcey and Chiang, David},
  title     = {A Continuum of Generation Tasks for Investigating Length Bias and Degenerate Repetition},
  booktitle = {Proc. BlackboxNLP},
  year      = {2022},
  url       = {https://arxiv.org/abs/2210.10817},
}
Alexandra Butoi, Brian DuSell, Tim Vieira, Ryan Cotterell, and David Chiang.
Algorithms for weighted pushdown automata.
In Yoav Goldberg, Zornitsa Kozareva, and Yue Zhang, editors,
Proc. EMNLP, 9669–9680. 2022.
doi:10.18653/v1/2022.emnlp-main.656.
PDF
BibTeX
@inproceedings{butoi-etal-2022-algorithms,
  author    = {Butoi, Alexandra and DuSell, Brian and Vieira, Tim and Cotterell, Ryan and Chiang, David},
  editor    = {Goldberg, Yoav and Kozareva, Zornitsa and Zhang, Yue},
  title     = {Algorithms for Weighted Pushdown Automata},
  booktitle = {Proc. EMNLP},
  pages     = {9669--9680},
  year      = {2022},
  doi       = {10.18653/v1/2022.emnlp-main.656},
  url       = {https://aclanthology.org/2022.emnlp-main.656},
}
Aarohi Srivastava, Abhinav Rastogi, Abhishek Rao, Abu Awal Md Shoeb, Abubakar Abid, Adam Fisch, Adam R. Brown, Adam Santoro, Aditya Gupta, Adrià Garriga-Alonso, and others.
Beyond the Imitation Game: quantifying and extrapolating the capabilities of language models.
Transactions on Machine Learning Research, 2023.
PDF
BibTeX
@article{srivastava+:2023,
  author  = {Srivastava, Aarohi and Rastogi, Abhinav and Rao, Abhishek and Shoeb, Abu Awal Md and Abid, Abubakar and Fisch, Adam and Brown, Adam R. and Santoro, Adam and Gupta, Aditya and Garriga-Alonso, Adri{\`a} and others},
  title   = {Beyond the {I}mitation {G}ame: Quantifying and Extrapolating the Capabilities of Language Models},
  journal = {Transactions on Machine Learning Research},
  year    = {2023},
  url     = {https://openreview.net/pdf?id=uyTL5Bvosj},
}
David Chiang and Peter Cholak.
Overcoming a theoretical limitation of self-attention.
In Smaranda Muresan, Preslav Nakov, and Aline Villavicencio, editors,
Proc. ACL, volume 1, 7654–7664. 2022.
doi:10.18653/v1/2022.acl-long.527.
PDF
BibTeX
@inproceedings{chiang-cholak-2022-overcoming,
  author    = {Chiang, David and Cholak, Peter},
  editor    = {Muresan, Smaranda and Nakov, Preslav and Villavicencio, Aline},
  title     = {Overcoming a Theoretical Limitation of Self-Attention},
  booktitle = {Proc. ACL},
  volume    = {1},
  pages     = {7654--7664},
  year      = {2022},
  doi       = {10.18653/v1/2022.acl-long.527},
  url       = {https://aclanthology.org/2022.acl-long.527},
}
Brian DuSell and David Chiang.
Learning hierarchical structures with differentiable nondeterministic stacks.
In
Proc. ICLR. 2022.
Spotlight paper.
PDF
BibTeX
@inproceedings{dusell+chiang:iclr2022,
  author    = {DuSell, Brian and Chiang, David},
  title     = {Learning Hierarchical Structures with Differentiable Nondeterministic Stacks},
  booktitle = {Proc. ICLR},
  year      = {2022},
  url       = {https://openreview.net/pdf?id=5LXw\_QplBiF},
}
Isaac Caswell, Julia Kreutzer, Lisa Wang, Ahsan Wahab, Daan van Esch, Nasanbayar Ulzii-Orshikh, Allahsera Tapo, Nishant Subramani, Artem Sokolov, Claytone Sikasote, Monang Setyawan, Supheakmungkol Sarin, Sokhar Samb, Benoît Sagot, Clara Rivera, Annette Rios, Isabel Papadimitriou, Salomey Osei, Pedro Javier Ortiz Suárez, Iroro Orife, Kelechi Ogueji, Rubungo Andre Niyongabo, Toan Q. Nguyen, Mathias Müller, André Müller, Shamsuddeen Hassan Muhammad, Nanda Muhammad, Ayanda Mnyakeni, Jamshidbek Mirzakhalov, Tapiwanashe Matangira, Colin Leong, Nze Lawson, Sneha Kudugunta, Yacine Jernite, Mathias Jenny, Orhan Firat, Bonaventure F. P. Dossou, Sakhile Dlamini, Nisansa de Silva, Sakine Çabuk Ballı, Stella Biderman, Alessia Battisti, Ahmed Baruwa, Ankur Bapna, Pallavi Baljekar, Israel Abebe Azime, Ayodele Awokoya, Duygu Ataman, Orevaoghene Ahia, Oghenefego Ahia, Sweta Agrawal, and Mofetoluwa Adeyemi.
Quality at a glance: an audit of Web-crawled multilingual datasets.
In
Proc. AfricaNLP. 2021.
PDF
BibTeX
@inproceedings{caswell+:2021,
  author    = {Caswell, Isaac and Kreutzer, Julia and Wang, Lisa and Wahab, Ahsan and van Esch, Daan and Ulzii-Orshikh, Nasanbayar and Tapo, Allahsera and Subramani, Nishant and Sokolov, Artem and Sikasote, Claytone and Setyawan, Monang and Sarin, Supheakmungkol and Samb, Sokhar and Sagot, Beno{\^{\i}}t and Rivera, Clara and Rios, Annette and Papadimitriou, Isabel and Osei, Salomey and Su{\'a}rez, Pedro Javier Ortiz and Orife, Iroro and Ogueji, Kelechi and Niyongabo, Rubungo Andre and Nguyen, Toan Q. and M{\"u}ller, Mathias and M{\"u}ller, Andr{\'e} and Muhammad, Shamsuddeen Hassan and Muhammad, Nanda and Mnyakeni, Ayanda and Mirzakhalov, Jamshidbek and Matangira, Tapiwanashe and Leong, Colin and Lawson, Nze and Kudugunta, Sneha and Jernite, Yacine and Jenny, Mathias and Firat, Orhan and Dossou, Bonaventure F. P. and Dlamini, Sakhile and de Silva, Nisansa and Ball{\i}, Sakine {\c C}abuk and Biderman, Stella and Battisti, Alessia and Baruwa, Ahmed and Bapna, Ankur and Baljekar, Pallavi and Azime, Israel Abebe and Awokoya, Ayodele and Ataman, Duygu and Ahia, Orevaoghene and Ahia, Oghenefego and Agrawal, Sweta and Adeyemi, Mofetoluwa},
  title     = {Quality at a Glance: An Audit of {W}eb-Crawled Multilingual Datasets},
  booktitle = {Proc. AfricaNLP},
  year      = {2021},
  url       = {https://arxiv.org/abs/2103.12028},
}
Samuel Grieggs, Bingyu Shen, Greta Rauch, Pei Li, Jiaqi Ma, David Chiang, Brian Price, and Walter Scheirer.
Measuring human perception to improve handwritten document transcription.
IEEE Transactions on Pattern Analysis and Machine Intelligence, 2021.
doi:10.1109/TPAMI.2021.3092688.
DOI
BibTeX
@article{grieggs+:tpami2021,
  author  = {Grieggs, Samuel and Shen, Bingyu and Rauch, Greta and Li, Pei and Ma, Jiaqi and Chiang, David and Price, Brian and Scheirer, Walter},
  title   = {Measuring Human Perception to Improve Handwritten Document Transcription},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2021},
  doi     = {10.1109/TPAMI.2021.3092688},
}
Toan Q. Nguyen, Kenton Murray, and David Chiang.
Data augmentation by concatenation for low-resource translation: a mystery and a solution.
In
Proc. Conference on Spoken Language Translation. 2021.
PDF
BibTeX
@inproceedings{nguyen+:2021,
  author    = {Nguyen, Toan Q. and Murray, Kenton and Chiang, David},
  title     = {Data Augmentation by Concatenation for Low-Resource Translation: A Mystery and a Solution},
  booktitle = {Proc. Conference on Spoken Language Translation},
  year      = {2021},
  url       = {https://aclanthology.org/2021.iwslt-1.33/},
}
Colin McDonald and David Chiang.
Syntax-based attention masking for neural machine translation.
In
Proc. NAACL Student Research Workshop. 2021.
PDF
BibTeX
@inproceedings{mcdonald+chiang:2021,
  author    = {McDonald, Colin and Chiang, David},
  title     = {Syntax-Based Attention Masking for Neural Machine Translation},
  booktitle = {Proc. NAACL Student Research Workshop},
  year      = {2021},
  url       = {https://www.aclweb.org/anthology/2021.naacl-srw.7/},
}
David Chiang and Chung-chieh Shan.
Translating recursive probabilistic programs to factor graph grammars.
2020.
Presented at PROBPROG 2020.
PDF
BibTeX
@misc{chiang+shan:2020,
  author = {Chiang, David and Shan, Chung-chieh},
  title  = {Translating Recursive Probabilistic Programs to Factor Graph Grammars},
  year   = {2020},
  url    = {https://arxiv.org/abs/2010.12071},
  note   = {Presented at PROBPROG 2020},
}
David Chiang and Darcey Riley.
Factor graph grammars.
In
Proc. NeurIPS, 6648–6658. 2020.
Spotlight paper.
PDF
BibTeX
@inproceedings{chiang+riley:2020,
  author    = {Chiang, David and Riley, Darcey},
  title     = {Factor Graph Grammars},
  booktitle = {Proc. NeurIPS},
  pages     = {6648--6658},
  year      = {2020},
  url       = {https://arxiv.org/abs/2010.12048},
}
Brian DuSell and David Chiang.
Learning context-free languages with nondeterministic stack RNNs.
In
Proc. CoNLL, 507–519. 2020.
PDF
BibTeX
@inproceedings{dusell+chiang:2020,
  author    = {DuSell, Brian and Chiang, David},
  title     = {Learning Context-free Languages with Nondeterministic Stack {RNN}s},
  booktitle = {Proc. CoNLL},
  pages     = {507--519},
  year      = {2020},
  url       = {https://www.aclweb.org/anthology/2020.conll-1.41},
}
Julian Salazar, Davis Liang, Toan Q. Nguyen, and Katrin Kirchhoff.
Masked language model scoring.
In
Proc. ACL, 2699–2712. 2020.
doi:10.18653/v1/2020.acl-main.240.
PDF
BibTeX
@inproceedings{salazar+:acl2020,
  author    = {Salazar, Julian and Liang, Davis and Nguyen, Toan Q. and Kirchhoff, Katrin},
  title     = {Masked Language Model Scoring},
  booktitle = {Proc. ACL},
  pages     = {2699--2712},
  year      = {2020},
  doi       = {10.18653/v1/2020.acl-main.240},
  url       = {https://www.aclweb.org/anthology/2020.acl-main.240},
}
Justin DeBenedetto and David Chiang.
Representing unordered data using complex-weighted multiset automata.
In
Proc. ICML, 2412–2420. 2020.
PDF
BibTeX
@inproceedings{debenedetto+chiang:icml2020,
  author    = {DeBenedetto, Justin and Chiang, David},
  title     = {Representing Unordered Data Using Complex-Weighted Multiset Automata},
  booktitle = {Proc. ICML},
  pages     = {2412--2420},
  year      = {2020},
  url       = {http://proceedings.mlr.press/v119/debenedetto20a.html},
  pdf       = {http://proceedings.mlr.press/v119/debenedetto20a/debenedetto20a.pdf},
}
Toan Q. Nguyen and Julian Salazar.
Transformers without tears: improving the normalization of self-attention.
In
Proc. Workshop on Spoken Language Translation. 2019.
doi:10.5281/zenodo.3525484.
DOI
BibTeX
@inproceedings{nguyen+salazar:iwslt2019,
  author    = {Nguyen, Toan Q. and Salazar, Julian},
  title     = {{T}ransformers without Tears: Improving the Normalization of Self-Attention},
  booktitle = {Proc. Workshop on Spoken Language Translation},
  year      = {2019},
  doi       = {10.5281/zenodo.3525484},
}
Kenton Murray, Jeffery Kinnison, Toan Q. Nguyen, Walter Scheirer, and David Chiang.
Auto-sizing the Transformer network: improving speed, efficiency, and performance for low-resource machine translation.
In
Proc. Workshop on Neural Generation and Translation, 231–240. 2019.
PDF
BibTeX
@inproceedings{murray-etal-2019-auto,
  author    = {Murray, Kenton and Kinnison, Jeffery and Nguyen, Toan Q. and Scheirer, Walter and Chiang, David},
  title     = {Auto-Sizing the {T}ransformer Network: Improving Speed, Efficiency, and Performance for Low-Resource Machine Translation},
  booktitle = {Proc. Workshop on Neural Generation and Translation},
  pages     = {231--240},
  year      = {2019},
  url       = {https://www.aclweb.org/anthology/D19-5625},
}
Kenton Murray, Brian DuSell, and David Chiang.
Efficiency through auto-sizing: Notre Dame NLP's submission to the WNGT 2019 efficiency task.
In
Proc. Workshop on Neural Generation and Translation, 297–301. 2019.
doi:10.18653/v1/D19-5634.
PDF
BibTeX
@inproceedings{murray-etal-2019-efficiency,
  author    = {Murray, Kenton and DuSell, Brian and Chiang, David},
  title     = {Efficiency through Auto-Sizing: {N}otre {D}ame {NLP}{'}s Submission to the {WNGT} 2019 Efficiency Task},
  booktitle = {Proc. Workshop on Neural Generation and Translation},
  pages     = {297--301},
  year      = {2019},
  doi       = {10.18653/v1/D19-5634},
  url       = {https://www.aclweb.org/anthology/D19-5634},
}
Arturo Argueta and David Chiang.
Accelerating sparse matrix operations in neural networks on graphics processing units.
In
Proc. ACL, 6215–6224. 2019.
PDF
BibTeX
@inproceedings{argueta+chiang:acl2019,
  author    = {Argueta, Arturo and Chiang, David},
  title     = {Accelerating Sparse Matrix Operations in Neural Networks on Graphics Processing Units},
  booktitle = {Proc. ACL},
  pages     = {6215--6224},
  year      = {2019},
  xdoi      = {10.18653/v1/P19-1626},
  url       = {https://www.aclweb.org/anthology/P19-1626},
}
Antonios Anastasopoulos, Alison Lui, Toan Q. Nguyen, and David Chiang.
Neural machine translation of text from non-native speakers.
In
Proc. NAACL: HLT, volume 1, 3070–3080. 2019.
PDF
BibTeX
@inproceedings{lui+al:naacl2019,
  author    = {Anastasopoulos, Antonios and Lui, Alison and Nguyen, Toan Q. and Chiang, David},
  title     = {Neural Machine Translation of Text from Non-Native Speakers},
  booktitle = {Proc. NAACL: HLT},
  volume    = {1},
  pages     = {3070--3080},
  year      = {2019},
  xdoi      = {10.18653/v1/N19-1311},
  url       = {https://www.aclweb.org/anthology/N19-1311},
}
Xuan Zhang, Gaurav Kumar, Huda Khayrallah, Kenton Murray, Jeremy Gwinnup, Marianna J Martindale, Paul McNamee, Kevin Duh, and Marine Carpuat.
An empirical exploration of curriculum learning for neural machine translation.
2018.
arXiv:1811.00739.
PDF
BibTeX
@misc{zhang+:arxiv2018,
  author = {Zhang, Xuan and Kumar, Gaurav and Khayrallah, Huda and Murray, Kenton and Gwinnup, Jeremy and Martindale, Marianna J and McNamee, Paul and Duh, Kevin and Carpuat, Marine},
  title  = {An Empirical Exploration of Curriculum Learning for Neural Machine Translation},
  year   = {2018},
  url    = {https://arxiv.org/pdf/1811.00739.pdf},
  note   = {arXiv:1811.00739},
}
Kenton Murray and David Chiang.
Correcting length bias in neural machine translation.
In
Proc. WMT, 212–223. 2018.
PDF
BibTeX
@inproceedings{murray+chiang:wmt2018,
  author    = {Murray, Kenton and Chiang, David},
  title     = {Correcting Length Bias in Neural Machine Translation},
  booktitle = {Proc. WMT},
  pages     = {212--223},
  year      = {2018},
  location  = {Brussels, Belgium},
  url       = {http://aclweb.org/anthology/W18-6322},
}
Brian Thompson, Huda Khayrallah, Antonios Anastasopoulos, Arya D. McCarthy, Kevin Duh, Rebecca Marvin, Paul McNamee, Jeremy Gwinnup, Tim Anderson, and Philipp Koehn.
Freezing subnetworks to analyze domain adaptation in neural machine translation.
In
Proc. WMT, 124–132. 2018.
PDF
BibTeX
@inproceedings{thompson+:wmt2018,
  author    = {Thompson, Brian and Khayrallah, Huda and Anastasopoulos, Antonios and McCarthy, Arya D. and Duh, Kevin and Marvin, Rebecca and McNamee, Paul and Gwinnup, Jeremy and Anderson, Tim and Koehn, Philipp},
  title     = {Freezing Subnetworks to Analyze Domain Adaptation in Neural Machine Translation},
  booktitle = {Proc. WMT},
  pages     = {124--132},
  year      = {2018},
  location  = {Brussels, Belgium},
  url       = {http://aclweb.org/anthology/W18-6313},
}
Xinyi Wang, Salvador Aguinaga, Tim Weninger, and David Chiang.
Growing better graphs with latent-variable probabilistic graph grammars.
In
Proc. Workshop on Mining and Learning with Grammars. 2018.
PDF
BibTeX
@inproceedings{wang+al:mlg2018,
  author    = {Wang, Xinyi and Aguinaga, Salvador and Weninger, Tim and Chiang, David},
  title     = {Growing Better Graphs With Latent-Variable Probabilistic Graph Grammars},
  booktitle = {Proc. Workshop on Mining and Learning with Grammars},
  year      = {2018},
  url       = {https://arxiv.org/pdf/1806.07955.pdf},
}
Antonios Anastasopoulos, Marika Lekakou, Josep Quer, Eleni Zimianiti, Justin DeBenedetto, and David Chiang.
Part-of-speech tagging on an endangered language: a parallel Griko-Italian resource.
In
Proc. COLING, 2529–2539. 2018.
PDF
BibTeX
@inproceedings{anastasopoulos+al:coling2018,
  author    = {Anastasopoulos, Antonios and Lekakou, Marika and Quer, Josep and Zimianiti, Eleni and DeBenedetto, Justin and Chiang, David},
  title     = {Part-of-Speech Tagging on an Endangered Language: A Parallel {Griko-Italian} Resource},
  booktitle = {Proc. COLING},
  pages     = {2529--2539},
  year      = {2018},
  location  = {Santa Fe, New Mexico, USA},
  url       = {http://aclweb.org/anthology/C18-1214},
}
Marcely Zanon Boito, Antonios Anastasopoulos, Marika Lekakou, Aline Villavicencio, and Laurent Besacier.
A small Griko-Italian speech translation corpus.
In
Proc. Workshop on Spoken Language Technologies for Under-Resourced Languages. 2018.
BibTeX
@inproceedings{boito+al:sltu2018,
  author    = {Boito, Marcely Zanon and Anastasopoulos, Antonios and Lekakou, Marika and Villavicencio, Aline and Besacier, Laurent},
  title     = {A Small {Griko-Italian} Speech Translation Corpus},
  booktitle = {Proc. Workshop on Spoken Language Technologies for Under-Resourced Languages},
  year      = {2018},
}
Arturo Argueta and David Chiang.
Composing finite state transducers on GPUs.
In
Proc. ACL, 2697–2705. 2018.
PDF
BibTeX
@inproceedings{argueta+chiang:acl2018,
  author    = {Argueta, Arturo and Chiang, David},
  title     = {Composing Finite State Transducers on {GPUs}},
  booktitle = {Proc. ACL},
  pages     = {2697--2705},
  year      = {2018},
  location  = {Melbourne, Australia},
  url       = {http://aclweb.org/anthology/P18-1251},
}
Justin DeBenedetto and David Chiang.
Algorithms and training for weighted multiset automata and regular expressions.
In
Proc. Conference on Implementation and Applications of Automata, 146–158. 2018.
PDF
BibTeX
@inproceedings{debenedetto+chiang:2018,
  author    = {DeBenedetto, Justin and Chiang, David},
  title     = {Algorithms and Training for Weighted Multiset Automata and Regular Expressions},
  booktitle = {Proc. Conference on Implementation and Applications of Automata},
  pages     = {146--158},
  year      = {2018},
  url       = {https://arxiv.org/pdf/1806.03315.pdf},
}
Antonios Anastasopoulos and David Chiang.
Leveraging translations for speech transcription in low-resource settings.
In
Proc. INTERSPEECH. 2018.
PDF
BibTeX
@inproceedings{anastasopoulos+chiang:interspeech2018,
  author    = {Anastasopoulos, Antonios and Chiang, David},
  title     = {Leveraging Translations for Speech Transcription in Low-Resource Settings},
  booktitle = {Proc. INTERSPEECH},
  year      = {2018},
  url       = {https://arxiv.org/pdf/1803.08991.pdf},
}
Corey Pennycuff, Satyaki Sikdar, Catalina Vajiac, David Chiang, and Tim Weninger.
Synchronous hyperedge replacement graph grammars.
In
Proc. Conference on Graph Transformations. 2018.
BibTeX
@inproceedings{pennycuff+al:2018,
  author    = {Pennycuff, Corey and Sikdar, Satyaki and Vajiac, Catalina and Chiang, David and Weninger, Tim},
  title     = {Synchronous Hyperedge Replacement Graph Grammars},
  booktitle = {Proc. Conference on Graph Transformations},
  year      = {2018},
}
Antonios Anastasopoulos and David Chiang.
Tied multitask learning for neural speech translation.
In
Proc. NAACL: HLT, volume 1, 82–91. 2018.
PDF
BibTeX
@inproceedings{anastasopoulos+chiang:naacl2018,
  author    = {Anastasopoulos, Antonios and Chiang, David},
  title     = {Tied Multitask Learning for Neural Speech Translation},
  booktitle = {Proc. NAACL: HLT},
  volume    = {1},
  pages     = {82--91},
  year      = {2018},
  location  = {New Orleans, Louisiana},
  url       = {http://aclweb.org/anthology/N18-1008},
}
Toan Nguyen and David Chiang.
Improving lexical choice in neural machine translation.
In
Proc. NAACL: HLT, volume 1, 334–343. 2018.
PDF
BibTeX
@inproceedings{nguyen+chiang:naacl2018,
  author    = {Nguyen, Toan and Chiang, David},
  title     = {Improving Lexical Choice in Neural Machine Translation},
  booktitle = {Proc. NAACL: HLT},
  volume    = {1},
  pages     = {334--343},
  year      = {2018},
  location  = {New Orleans, Louisiana},
  url       = {http://aclweb.org/anthology/N18-1031},
}
Huadong Chen, Shujian Huang, David Chiang, Xinyu Dai, and Jiajun Chen.
Combining character and word information in neural machine translation using a multi-level attention.
In
Proc. NAACL: HLT, volume 1, 1284–1293. 2018.
PDF
BibTeX
@inproceedings{chen+:naacl2018,
  author    = {Chen, Huadong and Huang, Shujian and Chiang, David and Dai, Xinyu and Chen, Jiajun},
  title     = {Combining Character and Word Information in Neural Machine Translation Using a Multi-Level Attention},
  booktitle = {Proc. NAACL: HLT},
  volume    = {1},
  pages     = {1284--1293},
  year      = {2018},
  location  = {New Orleans, Louisiana},
  url       = {http://aclweb.org/anthology/N18-1116},
}
Salvador Aguinaga, David Chiang, and Tim Weninger.
Learning hyperedge replacement grammars for graph generation.
IEEE Trans. Pattern Analysis and Machine Intelligence, 41(3):625–638, 2019.
doi:10.1109/TPAMI.2018.2810877.
PDF
BibTeX
@article{aguinaga+:tpami2019,
  author  = {Aguinaga, Salvador and Chiang, David and Weninger, Tim},
  title   = {Learning Hyperedge Replacement Grammars for Graph Generation},
  journal = {IEEE Trans. Pattern Analysis and Machine Intelligence},
  volume  = {41},
  number  = {3},
  pages   = {625--638},
  year    = {2019},
  doi     = {10.1109/TPAMI.2018.2810877},
  url     = {https://arxiv.org/abs/1802.08068},
}
David Chiang, Frank Drewes, Daniel Gildea, Adam Lopez, and Giorgio Satta.
Weighted
DAG automata for semantic graphs.
Computational Linguistics, 44(1):119–186, 2018.
PDF
BibTeX
@article{chiang+:cl2018,
  author  = {Chiang, David and Drewes, Frank and Gildea, Daniel and Lopez, Adam and Satta, Giorgio},
  title   = {Weighted {DAG} Automata for Semantic Graphs},
  journal = {Computational Linguistics},
  volume  = {44},
  number  = {1},
  pages   = {119--186},
  year    = {2018},
  doi     = {10.1162/COLI\_a\_00309},
  url     = {https://www.mitpressjournals.org/doi/full/10.1162/COLI\_a\_00309},
}
Graham Neubig, Chris Dyer, Yoav Goldberg, Austin Matthews, Waleed Ammar, Antonios Anastasopoulos, Miguel Ballesteros, David Chiang, Daniel Clothiaux, Trevor Cohn, Kevin Duh, Manaal Faruqui, Cynthia Gan, Dan Garrette, Yangfeng Ji, Lingpeng Kong, Adhiguna Kuncoro, Gaurav Kumar, Chaitanya Malaviya, Paul Michel, Yusuke Oda, Matthew Richardson, Naomi Saphra, Swabha Swayamdipta, and Pengcheng Yin.
DyNet: the dynamic neural network toolkit.
2017.
arXiv:1701.03980.
PDF
BibTeX
@misc{dynet:2017,
  author = {Neubig, Graham and Dyer, Chris and Goldberg, Yoav and Matthews, Austin and Ammar, Waleed and Anastasopoulos, Antonios and Ballesteros, Miguel and Chiang, David and Clothiaux, Daniel and Cohn, Trevor and Duh, Kevin and Faruqui, Manaal and Gan, Cynthia and Garrette, Dan and Ji, Yangfeng and Kong, Lingpeng and Kuncoro, Adhiguna and Kumar, Gaurav and Malaviya, Chaitanya and Michel, Paul and Oda, Yusuke and Richardson, Matthew and Saphra, Naomi and Swayamdipta, Swabha and Yin, Pengcheng},
  title  = {{DyNet}: The Dynamic Neural Network Toolkit},
  year   = {2017},
  url    = {https://arxiv.org/pdf/1701.03980.pdf},
  note   = {arXiv:1701.03980},
}
Toan Q. Nguyen and David Chiang.
Transfer learning across low-resource, related languages for neural machine translation.
In
Proc. IJCNLP, volume 2, 296–301. 2017.
PDF
BibTeX
@inproceedings{nguyen-chiang:2017:I17-2,
  author    = {Nguyen, Toan Q. and Chiang, David},
  title     = {Transfer Learning across Low-Resource, Related Languages for Neural Machine Translation},
  booktitle = {Proc. IJCNLP},
  volume    = {2},
  pages     = {296--301},
  year      = {2017},
  url       = {http://www.aclweb.org/anthology/I17-2050},
}
Huadong Chen, Shujian Huang, David Chiang, Xin-Yu Dai, and Jiajun Chen.
Top-rank enhanced listwise optimization for statistical machine translation.
In
Proc. CoNLL, 90–99. 2017.
PDF
BibTeX
@inproceedings{chen-EtAl:2017:CoNLL2corpus,
  author    = {Chen, Huadong and Huang, Shujian and Chiang, David and Dai, Xin-Yu and Chen, Jiajun},
  title     = {Top-Rank Enhanced Listwise Optimization for Statistical Machine Translation},
  booktitle = {Proc. CoNLL},
  pages     = {90--99},
  year      = {2017},
  url       = {http://aclweb.org/anthology/K17-1011},
}
Antonios Anastasopoulos, Sameer Bansal, David Chiang, Sharon Goldwater, and Adam Lopez.
Spoken term discovery for language documentation using translations.
In
Proc. Workshop on Speech-Centric NLP, 53–58. 2017.
PDF
BibTeX
@inproceedings{anastasopoulos-EtAl:2017:Speech-Centric,
  author    = {Anastasopoulos, Antonios and Bansal, Sameer and Chiang, David and Goldwater, Sharon and Lopez, Adam},
  title     = {Spoken Term Discovery for Language Documentation using Translations},
  booktitle = {Proc. Workshop on Speech-Centric NLP},
  pages     = {53--58},
  year      = {2017},
  url       = {http://www.aclweb.org/anthology/W17-4607},
}
Antonios Anastasopoulos and David Chiang.
A case study on using speech-to-translation alignments for language documentation.
In
Proc. Workshop on Use of Computational Methods in Study of Endangered Languages, 170–178. 2017.
PDF
BibTeX
@inproceedings{anastasopoulos-chiang:2017:W17-01,
  author    = {Anastasopoulos, Antonios and Chiang, David},
  title     = {A Case Study on Using Speech-to-Translation Alignments for Language Documentation},
  booktitle = {Proc. Workshop on Use of Computational Methods in Study of Endangered Languages},
  pages     = {170--178},
  year      = {2017},
  url       = {http://www.aclweb.org/anthology/W17-0123},
}
Huadong Chen, Shujian Huang, David Chiang, and Jiajun Chen.
Improved neural machine translation with a syntax-aware encoder and decoder.
In
Proc. ACL, volume 1, 1936–1945. 2017.
PDF
BibTeX
@inproceedings{chen-EtAl:2017:Long6,
  author    = {Chen, Huadong and Huang, Shujian and Chiang, David and Chen, Jiajun},
  title     = {Improved Neural Machine Translation with a Syntax-Aware Encoder and Decoder},
  booktitle = {Proc. ACL},
  volume    = {1},
  pages     = {1936--1945},
  year      = {2017},
  url       = {http://aclweb.org/anthology/P17-1177},
}
Arturo Argueta and David Chiang.
Decoding with finite-state transducers on
GPUs.
In
Proc. EACL, volume 1, 1044–1052. 2017.
PDF
BibTeX
@inproceedings{argueta-chiang:2017:EACLlong,
  author    = {Argueta, Arturo and Chiang, David},
  title     = {Decoding with Finite-State Transducers on {GPUs}},
  booktitle = {Proc. EACL},
  volume    = {1},
  pages     = {1044--1052},
  year      = {2017},
  url       = {http://www.aclweb.org/anthology/E17-1098},
}
Ulf Hermjakob, Qiang Li, Daniel Marcu, Jonathan May, Sebastian J. Mielke, Nima Pourdamghani, Michael Pust, Xing Shi, Kevin Knight, Tomer Levinboim, Kenton Murray, David Chiang, Boliang Zhang, Xiaoman Pan, Di Lu, Ying Lin, and Heng Ji.
Incident-driven machine translation and name tagging for low-resource languages.
Machine Translation, 32(1–2):59–89, 2018.
doi:10.1007/s10590-017-9207-1.
DOI
BibTeX
@article{hermjakob+:mt2018,
  author  = {Hermjakob, Ulf and Li, Qiang and Marcu, Daniel and May, Jonathan and Mielke, Sebastian J. and Pourdamghani, Nima and Pust, Michael and Shi, Xing and Knight, Kevin and Levinboim, Tomer and Murray, Kenton and Chiang, David and Zhang, Boliang and Pan, Xiaoman and Lu, Di and Lin, Ying and Ji, Heng},
  title   = {Incident-Driven Machine Translation and Name Tagging for Low-Resource Languages},
  journal = {Machine Translation},
  volume  = {32},
  number  = {1--2},
  pages   = {59--89},
  year    = {2018},
  doi     = {10.1007/s10590-017-9207-1},
}
Antonios Anastasopoulos, David Chiang, and Long Duong.
An unsupervised probability model for speech-to-translation alignment of low-resource languages.
In
Proc. EMNLP, 1255–1263. 2016.
PDF
BibTeX
@inproceedings{anastasopoulos-chiang-duong:2016:EMNLP2016,
  author    = {Anastasopoulos, Antonios and Chiang, David and Duong, Long},
  title     = {An Unsupervised Probability Model for Speech-to-Translation Alignment of Low-Resource Languages},
  booktitle = {Proc. EMNLP},
  pages     = {1255--1263},
  year      = {2016},
  url       = {https://aclweb.org/anthology/D16-1133},
}
Salvador Aguiñaga, Rodrigo Palacios, David Chiang, and Tim Weninger.
Growing graphs from hyperedge replacement graph grammars.
In
Proc. CIKM, 469–478. 2016.
doi:10.1145/2983323.2983826.
DOI
BibTeX
@inproceedings{aguinaga+:cikm2016,
  author    = {Agui{\~n}aga, Salvador and Palacios, Rodrigo and Chiang, David and Weninger, Tim},
  title     = {Growing Graphs from Hyperedge Replacement Graph Grammars},
  booktitle = {Proc. CIKM},
  pages     = {469--478},
  year      = {2016},
  doi       = {10.1145/2983323.2983826},
}
Long Duong, Antonios Anastasopoulos, David Chiang, Steven Bird, and Trevor Cohn.
An attentional model for speech translation without transcription.
In
Proc. NAACL: HLT, 949–959. 2016.
PDF
BibTeX
@inproceedings{duong-EtAl:2016:N16-1,
  author    = {Duong, Long and Anastasopoulos, Antonios and Chiang, David and Bird, Steven and Cohn, Trevor},
  title     = {An Attentional Model for Speech Translation Without Transcription},
  booktitle = {Proc. NAACL: HLT},
  pages     = {949--959},
  year      = {2016},
  url       = {http://www.aclweb.org/anthology/N16-1109},
}
Kenton W. Murray and Jayant Krishnamurthy.
Probabilistic neural programs.
In
Proc. Workshop on Neural Abstract Machines and Program Induction. 2016.
PDF
BibTeX
@inproceedings{murray+krishnamurthy:nampi2016,
  author    = {Murray, Kenton W. and Krishnamurthy, Jayant},
  title     = {Probabilistic Neural Programs},
  booktitle = {Proc. Workshop on Neural Abstract Machines and Program Induction},
  year      = {2016},
  url       = {https://arxiv.org/pdf/1612.00712.pdf},
}
Tomer Levinboim and David Chiang.
Supervised phrase table triangulation with neural word embeddings for low-resource languages.
In
Proc. EMNLP, 1079–1083. 2015.
PDF
BibTeX
@inproceedings{levinboim-chiang:2015:EMNLP,
  author    = {Levinboim, Tomer and Chiang, David},
  title     = {Supervised Phrase Table Triangulation with Neural Word Embeddings for Low-Resource Languages},
  booktitle = {Proc. EMNLP},
  pages     = {1079--1083},
  year      = {2015},
  url       = {http://aclweb.org/anthology/D15-1126},
}
Tomer Levinboim and David Chiang.
Multi-task word alignment triangulation for low-resource languages.
In
Proc. NAACL: HLT, 1221–1226. 2015.
PDF
BibTeX
@inproceedings{levinboim-chiang:2015:NAACL-HLT,
  author    = {Levinboim, Tomer and Chiang, David},
  title     = {Multi-Task Word Alignment Triangulation for Low-Resource Languages},
  booktitle = {Proc. NAACL: HLT},
  pages     = {1221--1226},
  year      = {2015},
  url       = {http://www.aclweb.org/anthology/N15-1129},
}
Kenton Murray and David Chiang.
Auto-sizing neural networks: with applications to
\(n\)-gram language models.
In
Proc. EMNLP, 908–916. 2015.
PDF
BibTeX
@inproceedings{murray-chiang:2015:EMNLP,
  author    = {Murray, Kenton and Chiang, David},
  title     = {Auto-Sizing Neural Networks: With Applications to {$n$}-gram Language Models},
  booktitle = {Proc. EMNLP},
  pages     = {908--916},
  year      = {2015},
  url       = {http://aclweb.org/anthology/D15-1107},
}
Tomer Levinboim, Ashish Vaswani, and David Chiang.
Model invertibility regularization: sequence alignment with or without parallel data.
In
Proc. NAACL: HLT, 609–618. 2015.
PDF
Code
BibTeX
@inproceedings{levinboim-vaswani-chiang:2015:NAACL-HLT,
  author    = {Levinboim, Tomer and Vaswani, Ashish and Chiang, David},
  title     = {Model Invertibility Regularization: Sequence Alignment With or Without Parallel Data},
  booktitle = {Proc. NAACL: HLT},
  pages     = {609--618},
  year      = {2015},
  url       = {http://www.aclweb.org/anthology/N15-1063},
}
Steven Bird, David Chiang, Friedel Frowein, Florian Hanke, and Ashish Vaswani.
Documentary linguistics and computational linguistics: a response to
Brooks.
Language Documentation and Conservation, 9:10–11, 2015.
BibTeX
@article{bird+:ldc2015,
  author  = {Bird, Steven and Chiang, David and Frowein, Friedel and Hanke, Florian and Vaswani, Ashish},
  title   = {Documentary Linguistics and Computational Linguistics: A Response to {Brooks}},
  journal = {Language Documentation and Conservation},
  volume  = {9},
  pages   = {10--11},
  year    = {2015},
}