@inproceedings{lets:go,
  author = {Raux, Antoine and Langner, Brian and Bohus, Dan and Black, Alan W. and Eskenazi, Maxine},
  year = {2005},
  title = {Let's go public! {Taking} a spoken dialog system to the real world},
  booktitle = {INTERSPEECH-2005},
  pages = {885--888}
}

@unpublished{Boersma2003PraatDP,
  author = {Paul Boersma and David Weenink},
  title = {Praat: {D}oing phonetics by computer},
  note = {Computer program},
  year = {2006}
}

@book{ClarkClark:1977,
  title = {Psychology and language: {A}n introduction to psycholinguistics},
  author = {Clark, Herbert H. and Clark, Eve V.},
  year = {1977},
  address = {New York},
  publisher = {Harcourt Brace Jovanovich}
}

@article{Heift:2010,
  title = {Developing an intelligent language tutor},
  author = {Heift, Trude},
  journal = {CALICO journal},
  volume = {27},
  number = {3},
  pages = {443--459},
  year = {2010},
  doi = {10.11139/cj.27.3.443-459}
}

@article{Loftus:1975,
  title = {Leading questions and the eyewitness report},
  author = {Loftus, Elizabeth F.},
  journal = {Cognitive Psychology},
  volume = {7},
  number = {4},
  pages = {560--572},
  year = {1975},
  publisher = {Elsevier},
  doi = {10.1016/0010-0285(75)90023-7}
}

@inproceedings{ShahBender:2022,
  title = {Situating search},
  author = {Shah, Chirag and Bender, Emily M.},
  booktitle = {Proceedings of the 2022 {C}onference on {H}uman {I}nformation {I}nteraction and {R}etrieval},
  pages = {221--232},
  year = {2022},
  doi = {10.1145/3498366.3505816}
}

@article{Peng-etal:2023,
  title = {Knowledge graphs: {O}pportunities and challenges},
  author = {Peng, Ciyuan and Xia, Feng and Naseriparsa, Mehdi and Osborne, Francesco},
  journal = {Artificial Intelligence Review},
  volume = {56},
  number = {11},
  pages = {13071--13102},
  year = {2023},
  doi = {10.1007/s10462-023-10465-9}
}

@article{Piantadosi:2014,
  title = {Zipf's word frequency law in natural language: {A} critical review and future directions},
  author = {Piantadosi, Steven T.},
  journal = {Psychonomic Bulletin \& Review},
  volume = {21},
  pages = {1112--1130},
  year = {2014},
  doi = {10.3758/s13423-014-0585-6}
}

@article{Bamman-etal:2014,
title = {Gender identity and lexical variation in social media},
  author = {Bamman, David and Eisenstein, Jacob and Schnoebelen, Tyler},
  journal = {Journal of Sociolinguistics},
  volume = {18},
  number = {2},
  pages = {135--160},
  year = {2014},
  doi = {10.1111/josl.12080}
}

@inproceedings{Ouyang-etal:2022,
  title = {Training language models to follow instructions with human feedback},
  author = {Ouyang, Long and Wu, Jeff and Jiang, Xu and Almeida, Diogo and Wainwright, Carroll L. and Mishkin, Pamela and Zhang, Chong and Agarwal, Sandhini and Slama, Katarina and Ray, Alex and Schulman, John and Hilton, Jacob and Kelton, Fraser and Miller, Luke and Simens, Maddie and Askell, Amanda and Welinder, Peter and Christiano, Paul and Leike, Jan and Lowe, Ryan},
  booktitle = {Advances in {N}eural {I}nformation {P}rocessing {S}ystems ({NeurIPS})},
  editor = {Koyejo, Sanmi and Mohamed, Shakir and Agarwal, Alekh and Belgrave, Danielle and Cho, Kyunghyun and Oh, Alice},
  volume = {35},
  pages = {27730--27744},
  year = {2022}
}

@article{DasChen:2007,
  title = {Yahoo!
for {A}mazon: {S}entiment parsing from small talk on the web},
  author = {Das, Sanjiv Ranjan and Chen, Mike Y.},
  journal = {Management Science},
  pages = {1375--1388},
  volume = {53},
  number = {9},
  year = {2007},
  doi = {10.1287/mnsc.1070.0704}
}

@inproceedings{Mikolov-etal:2013,
  title = {Efficient estimation of word representations in vector space},
  author = {Mikolov, Tom{\'a}s and Chen, Kai and Corrado, Greg and Dean, Jeffrey},
  booktitle = {Proceedings of the {I}nternational {C}onference on {L}earning {R}epresentations ({ICLR})},
  editor = {Yoshua Bengio and Yann LeCun},
  address = {Scottsdale, AZ},
  year = {2013}
}

@inproceedings{Pennington-etal:2014,
  title = {{GloVe}: {G}lobal vectors for word representation},
  author = {Pennington, Jeffrey and Socher, Richard and Manning, Christopher D.},
  booktitle = {Proceedings of {E}mpirical {M}ethods in {N}atural {L}anguage {P}rocessing ({EMNLP})},
  pages = {1532--1543},
  editor = {Alessandro Moschitti and Bo Pang and Walter Daelemans},
  year = {2014},
  doi = {10.3115/v1/d14-1162}
}

@article{Futrell-etal:2015,
  title = {Large-scale evidence of dependency length minimization in 37 languages},
  author = {Futrell, Richard and Mahowald, Kyle and Gibson, Edward},
  journal = {Proceedings of the National Academy of Sciences},
  volume = {112},
  number = {33},
  pages = {10336--10341},
  year = {2015},
  doi = {10.1073/pnas.1502134112}
}

@techreport{alpac:1966,
  author = {{Automatic Language Processing Advisory Committee (ALPAC), Division of Behavioral Sciences}},
  title = {Languages and machines: {Computers} in translation and linguistics},
  institution = {National Academy of Sciences, National Research Council},
  year = {1966},
  address = {Washington, D.C.},
  doi = {10.17226/9547}
}

@inproceedings{Hamilton-etal:2016,
  title = {Diachronic word embeddings reveal statistical laws of semantic change},
  author = {Hamilton, William L.
and Leskovec, Jure and Jurafsky, Dan},
  editor = {Erk, Katrin and Smith, Noah A.},
  booktitle = {Proceedings of the 54th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics ({ACL})},
  year = {2016},
  address = {Berlin},
  pages = {1489--1501},
  publisher = {Association for Computational Linguistics},
  volume = {1: Long Papers},
  doi = {10.18653/v1/p16-1141}
}

@phdthesis{Rikters:2019,
  title = {Hybrid machine translation by combining output from multiple machine translation systems},
  author = {Rikters, Mat{\=\i}ss},
  year = {2019},
  school = {Latvijas Universit{\=a}te (University of Latvia)}
}

@inproceedings{Stanovsky-etal:2019,
  title = {Evaluating gender bias in machine translation},
  author = {Stanovsky, Gabriel and Smith, Noah A. and Zettlemoyer, Luke},
  booktitle = {Proceedings of the 57th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics},
  pages = {1679--1684},
  address = {Florence, Italy},
  editor = {Anna Korhonen and David Traum and Llu{\'\i}s M{\`a}rquez},
  publisher = {Association for Computational Linguistics},
  year = {2019},
  doi = {10.18653/v1/p19-1164}
}

@incollection{Weaver:1949,
  author = {Weaver, Warren},
  title = {Translation},
  booktitle = {Machine translation of languages: {F}ourteen essays},
  pages = {15--23},
  editor = {Locke, William N. and Booth, A.
Donald},
  publisher = {The Technology Press of MIT},
  address = {New York},
  doi = {10.7551/mitpress/5779.003.0004},
  year = {1949}
}

@inproceedings{Bahdanau-etal:2015,
  title = {Neural machine translation by jointly learning to align and translate},
  author = {Bahdanau, Dzmitry and Cho, Kyunghyun and Bengio, Yoshua},
  booktitle = {International {C}onference on {L}earning {R}epresentations ({ICLR})},
  editor = {Yoshua Bengio and Yann LeCun},
  year = {2015},
  address = {San Diego, CA}
}

@article{Vauquois:1968,
  author = {Vauquois, Bernard},
  title = {Structures profondes et traduction automatique: {L}e syst{\`e}me du {CETA}},
  journal = {Revue Roumaine de Linguistique},
  volume = {13},
  number = {2},
  pages = {103--130},
  year = {1968}
}

@book{TraugottDasher:2001,
  title = {Regularity in semantic change},
  author = {Traugott, Elizabeth Closs and Dasher, Richard B.},
  year = {2001},
  address = {Cambridge},
  publisher = {Cambridge University Press},
  doi = {10.1017/cbo9780511486500}
}

@book{Goffman:1967,
  title = {Interaction Ritual: {E}ssays on Face-to-Face Behavior},
  author = {Goffman, Erving},
  year = {1967},
  address = {Chicago},
  publisher = {Aldine Publishing Company},
  doi = {10.4324/9780203788387}
}

@book{BrownLevinson:1987,
  title = {Politeness: {S}ome universals in language usage},
  author = {Brown, Penelope and Levinson, Stephen C.},
  year = {1987},
  address = {Cambridge, UK},
  publisher = {Cambridge University Press},
  doi = {10.1017/cbo9780511813085}
}

@article{Searle:1994,
  title = {Literary theory and its discontents},
  author = {Searle, John R.},
  journal = {New Literary History},
  volume = {25},
  number = {3},
  pages = {637--667},
  year = {1994},
  doi = {10.2307/469470}
}

@inproceedings{Vaswani-etal:2017,
  title = {Attention is all you need},
  author = {Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N.
and Kaiser, {\L}ukasz and Polosukhin, Illia},
  booktitle = {Advances in {N}eural {I}nformation {P}rocessing {S}ystems},
  volume = {30},
  editor = {Guyon, Isabelle and Von Luxburg, Ulrike and Bengio, Samy and Wallach, Hanna and Fergus, Rob and Vishwanathan, S. V. N. and Garnett, Roman},
  pages = {5998--6008},
  address = {Long Beach, CA},
  year = {2017}
}

@book{Blatt:2017,
  title = {Nabokov's favorite word is mauve: {W}hat the numbers reveal about the classics, bestsellers, and our own writing},
  author = {Blatt, Ben},
  year = {2017},
  address = {New York},
  publisher = {Simon and Schuster}
}

@article{Levesque:2014,
  title = {On our best behaviour},
  author = {Levesque, Hector J.},
  journal = {Artificial Intelligence},
  volume = {212},
  pages = {27--35},
  year = {2014},
  doi = {10.1016/j.artint.2014.03.007}
}

@incollection{Firth:1957,
  title = {A synopsis of linguistic theory, 1930--1955},
  author = {Firth, John R.},
  booktitle = {Studies in Linguistic Analysis},
  year = {1957},
  address = {Oxford},
  editor = {Firth, John R.},
  pages = {1--32},
  publisher = {Basil Blackwell}
}

@book{Chomsky:1957,
  title = {Syntactic structures},
  author = {Chomsky, Noam},
  booktitle = {Syntactic Structures},
  year = {1957},
  publisher = {Mouton and Co.},
  address = {The Hague},
  doi = {10.1515/9783112316009}
}

@incollection{Lewis:1972,
  title = {General semantics},
  author = {Lewis, David},
  booktitle = {Semantics of natural language},
  pages = {169--218},
  year = {1972},
  editor = {Donald Davidson and Gilbert Harman},
  address = {Dordrecht},
  publisher = {Springer},
  doi = {10.1007/978-94-010-2557-7_7}
}

@article{Levenshtein:1966,
  title = {Binary codes capable of correcting deletions, insertions, and reversals (translated from the 1965 {R}ussian original)},
  author = {Levenshtein, Vladimir I.},
  journal = {Doklady Physics},
  volume = {10},
  number = {8},
  pages = {707--710},
  year = {1966}
}

@article{Blei-etal:2003,
  title = {Latent {D}irichlet Allocation},
  author = {Blei, David M. and Ng, Andrew Y.
and Jordan, Michael I.},
  journal = {Journal of Machine Learning Research},
  volume = {3},
  pages = {993--1022},
  year = {2003},
  doi = {10.7551/mitpress/1120.003.0082}
}

@book{PaquotGries:2021,
  title = {A practical handbook of corpus linguistics},
  editor = {Paquot, Magali and Gries, Stefan Th.},
  year = {2021},
  address = {Cham},
  publisher = {Springer Nature},
  doi = {10.1007/978-3-030-46216-1}
}

@book{Bird-etal:2009,
  title = {Natural language processing with {P}ython: {A}nalyzing text with the {N}atural {L}anguage {T}ool{K}it},
  author = {Bird, Steven and Klein, Ewan and Loper, Edward},
  year = {2009},
  address = {Sebastopol, CA},
  publisher = {O'Reilly Media, Inc.}
}

@incollection{Keynes:1931,
  author = {Keynes, John Maynard},
  title = {Economic possibilities for our grandchildren},
  booktitle = {Essays in persuasion},
  address = {London},
  publisher = {Macmillan},
  year = {1931},
  doi = {10.7551/mitpress/9780262162494.003.0002}
}

@inproceedings{Piron:1988,
  title = {Learning from translation mistakes},
  author = {Piron, Claude},
  booktitle = {Proceedings of {N}ew {D}irections in {M}achine {T}ranslation},
  pages = {233--242},
  editor = {Maxwell, Dan and Schubert, Klaus and Witkam, Toon},
  address = {Dordrecht},
  publisher = {Foris Publications},
  year = {1988},
  doi = {10.1515/9783110874204-017}
}

@article{Warstadt-etal:2019,
  title = {Neural network acceptability judgments},
  author = {Warstadt, Alex and Singh, Amanpreet and Bowman, Samuel R.},
  journal = {Transactions of the Association for Computational Linguistics},
  volume = {7},
  pages = {625--641},
  doi = {10.1162/tacl_a_00290},
  year = {2019}
}

@inproceedings{Devlin-etal:2019,
  title = {{BERT}: {P}re-training of deep bidirectional transformers for language understanding},
  author = {Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina},
  booktitle = {Proceedings of {North American Association for Computational Linguistics: Human Language Technologies} ({NAACL-HLT})},
  editor = {Jill Burstein and Christy Doran and Thamar Solorio},
  publisher = {Association for Computational
Linguistics},
  address = {Minneapolis, MN},
  volume = {1: Long and short papers},
  pages = {4171--4186},
  year = {2019}
}

@book{Koehn:2020,
  title = {Neural Machine Translation},
  author = {Koehn, Philipp},
  year = {2020},
  address = {Cambridge, UK},
  publisher = {Cambridge University Press},
  doi = {10.1017/9781108608480}
}

@book{Eisenstein:2019,
  title = {Introduction to natural language processing},
  author = {Eisenstein, Jacob},
  year = {2019},
  address = {Cambridge, MA},
  publisher = {MIT Press}
}

@book{Osgood-etal:1957,
  title = {The measurement of meaning},
  author = {Osgood, Charles Egerton and Suci, George J. and Tannenbaum, Percy H.},
  year = {1957},
  address = {Urbana and Chicago, IL},
  publisher = {University of Illinois Press}
}

@article{BlackwellDweck-etal:2007,
  title = {Implicit theories of intelligence predict achievement across an adolescent transition: {A} longitudinal study and an intervention},
  author = {Blackwell, Lisa S. and Trzesniewski, Kali H. and Dweck, Carol S.},
  journal = {Child Development},
  volume = {78},
  number = {1},
  pages = {246--263},
  year = {2007},
  doi = {10.1111/j.1467-8624.2007.00995.x}
}

@book{Krashen:1982,
  title = {Principles and practice in second language acquisition},
  author = {Krashen, Stephen},
  year = {1982},
  address = {Oxford},
  publisher = {Pergamon Press}
}

@article{Lenneberg:67,
  title = {The biological foundations of language},
  author = {Lenneberg, Eric H.},
  journal = {Hospital Practice},
  volume = {2},
  number = {12},
  pages = {59--67},
  year = {1967},
  doi = {10.1080/21548331.1967.11707799}
}

@article{White:2021,
  title = {On believing and hoping whether},
  author = {White, Aaron Steven},
  journal = {Semantics and Pragmatics},
  volume = {14},
  year = {2021},
  doi = {10.3765/sp.14.6}
}

@article{Haspelmath:2008,
  title = {Frequency vs.
iconicity in explaining grammatical asymmetries},
  author = {Haspelmath, Martin},
  year = {2008},
  volume = {19},
  number = {1},
  journal = {Cognitive Linguistics},
}

@book{Glassner:2003,
  title = {The invention of cuneiform: {W}riting in {S}umer},
  author = {Glassner, Jean-Jacques},
  year = {2003},
  note = {Translated from the original French edition (2000) by Zainab Bahrani and Marc van de Mieroop},
  address = {Baltimore, MD},
  publisher = {Johns Hopkins University Press}
}

@book{Moretti:2013,
  title = {Distant reading},
  author = {Moretti, Franco},
  year = {2013},
  address = {London},
  publisher = {Verso Books}
}

@article{Flor-etal:2015,
  title = {Patterns of misspellings in {L}2 and {L}1 {E}nglish: {A} view from the {ETS} Spelling Corpus},
  author = {Flor, Michael and Futagi, Yoko and Lopez, Melissa and Mulholland, Matthew},
  journal = {Bergen Language and Linguistics Studies},
  volume = {6},
  year = {2015},
  doi = {10.15845/bells.v6i0.811}
}

@article{Davies:2009,
  title = {The 385+ million word {C}orpus of {C}ontemporary {A}merican {E}nglish (1990--2008+): {D}esign, architecture, and linguistic insights},
  author = {Davies, Mark},
  journal = {International Journal of Corpus Linguistics},
  volume = {14},
  number = {2},
  pages = {159--190},
  year = {2009},
  doi = {10.1075/ijcl.14.2.02dav}
}

@book{Zipf:1932,
  title = {Selected studies of the principle of relative frequency in language},
  author = {Zipf, George Kingsley},
  year = {1932},
  address = {Cambridge, MA},
  publisher = {Harvard University Press},
  doi = {10.4159/harvard.9780674434929}
}

@book{MacWhinney:2000,
  title = {The {CHILDES} Project: {T}ools for analyzing talk - {T}ranscription format and Programs},
  volume = {1},
  author = {MacWhinney, Brian},
  year = {2000},
  address = {New York},
  publisher = {Psychology Press},
  doi = {10.4324/9781315805672}
}

@article{Davies:2012,
  title = {Expanding horizons in historical linguistics with the 400-million word {C}orpus of {H}istorical {A}merican {E}nglish},
  author = {Davies, Mark},
  journal = {Corpora},
  volume = {7},
  number = {2},
  pages = {121--157},
  year = {2012},
  doi =
{10.3366/corp.2012.0024}
}

@article{MostellerWallace:1963,
  title = {Inference in an authorship problem: {A} comparative study of discrimination methods applied to the authorship of the disputed {F}ederalist {P}apers},
  author = {Mosteller, Frederick and Wallace, David L.},
  journal = {Journal of the American Statistical Association},
  volume = {58},
  number = {302},
  pages = {275--309},
  year = {1963},
  doi = {10.1080/01621459.1963.10500849}
}

@article{Rosenbach:2005,
  title = {Animacy versus weight as determinants of grammatical variation in {E}nglish},
  author = {Rosenbach, Anette},
  journal = {Language},
  pages = {613--644},
  year = {2005},
  doi = {10.1353/lan.2005.0149}
}

@article{Klein:2013,
  title = {The image of absence: {A}rchival silence, data visualization, and {J}ames {H}emings},
  author = {Klein, Lauren F.},
  journal = {American Literature},
  volume = {85},
  number = {4},
  pages = {661--688},
  year = {2013},
  doi = {10.1215/00029831-2367310}
}

@article{Underwood-etal:2018,
  title = {The transformation of gender in {E}nglish-language fiction},
  author = {Underwood, Ted and Bamman, David and Lee, Sabrina},
  journal = {Journal of Cultural Analytics},
  year = {2018},
  volume = {1},
  number = {1},
  doi = {10.22148/16.019}
}

@inproceedings{Danescu-etal:2013,
  title = {A computational approach to politeness with application to social factors},
  author = {Danescu-Niculescu-Mizil, Cristian and Sudhof, Moritz and Jurafsky, Dan and Leskovec, Jure and Potts, Christopher},
  editor = {Hinrich Sch{\"u}tze and Pascale Fung and Massimo Poesio},
  booktitle = {Proceedings of the 51st {A}ssociation for {C}omputational {L}inguistics ({ACL})},
  volume = {1: Long papers},
  address = {Sofia, Bulgaria},
  pages = {250--259},
  year = {2013}
}

@inproceedings{Potts:2010,
  title = {On the negativity of negation},
  author = {Potts, Christopher},
  booktitle = {Semantics and {L}inguistic {T}heory ({SALT})},
  volume = {20},
  pages = {636--659},
  editor = {Nan Li and David Lutz},
  year = {2010},
  doi = {10.3765/salt.v20i0.2565}
}

@article{Levin-etal:2019,
  title = {Systematicity in the semantics of
noun compounds: {T}he role of artifacts vs. natural kinds},
  author = {Levin, Beth and Glass, Lelia and Jurafsky, Dan},
  journal = {Linguistics},
  volume = {57},
  number = {3},
  pages = {429--471},
  year = {2019},
  doi = {10.1515/ling-2019-0013}
}

@inproceedings{Larsson,
  author = {Staffan Larsson},
  title = {Questions Under Discussion and dialogue moves},
  editor = {Joris Hulstijn and Anton Nijholt},
  booktitle = {Proceedings of the {T}wente {W}orkshop on {L}anguage {T}echnology ({TWENDIAL}): {F}ormal semantics and pragmatics of dialogue},
  volume = {13},
  year = {1998}
}

@inproceedings{Demszky-etal:2019,
  title = {Analyzing polarization in social media: {M}ethod and application to tweets on 21 mass shootings},
  author = {Demszky, Dorottya and Garg, Nikhil and Voigt, Rob and Zou, James and Gentzkow, Matthew and Shapiro, Jesse and Jurafsky, Dan},
  booktitle = {Proceedings of the {N}orth {A}merican {A}ssociation for {C}omputational {L}inguistics: {H}uman {L}anguage {T}echnologies ({NAACL-HLT})},
  editor = {Jill Burstein and Christy Doran and Thamar Solorio},
  year = {2019},
  pages = {2970--3005},
  volume = {1: Long and short papers},
  doi = {10.18653/v1/n19-1304},
  address = {Minneapolis, MN}
}

@article{Jurafsky-etal:2018,
  title = {Linguistic markers of status in food culture: {B}ourdieu's distinction in a menu corpus},
  author = {Jurafsky, Dan and Chahuneau, Victor and Routledge, Bryan and Smith, Noah},
  year = {2018},
  journal = {Journal of Cultural Analytics},
  doi = {10.22148/16.007}
}

@article{harsham:84,
  author = {Harsham, Philip},
  title = {A misinterpreted word worth \$71 million.},
  journal = {Medical Economics},
  year = {1984},
  volume = {61},
  number = {5},
  pages = {289--292},
}

@article{DBLP:journals/ftir/PangL07,
  author = {Bo Pang and Lillian Lee},
  title = {Opinion Mining and Sentiment Analysis},
  journal = {Foundations and Trends in Information Retrieval},
  volume = {2},
  number = {1--2},
  year = {2007},
  pages = {1--135},
  doi = {10.1561/9781601981516}
}

@article{Searle:1980,
  title = {Minds, brains, and programs},
  author = {Searle, John
R.},
  journal = {Behavioral and Brain Sciences},
  volume = {3},
  number = {3},
  pages = {417--424},
  year = {1980},
  doi = {10.1017/s0140525x00005756}
}

@book{Williams.Kane-08,
  title = {Exploring the National Student Survey. Assessment and feedback issues},
  publisher = {Center for Research into Quality (CRQ). The Higher Education Academy},
  year = {2008},
  author = {James Williams and David Kane},
  address = {Heslington, York, UK},
  file = {:Williams.Kane-08.pdf:PDF},
  keywords = {feedback,survey},
  url = {http://www.heacademy.ac.uk/assets/York/documents/ourwork/nss/NSS_assessment_and_feedback_issues.pdf}
}

@article{turing,
  author = {Turing, Alan M.},
  year = {1950},
  title = {Computing Machinery and Intelligence},
  journal = {Mind},
  volume = {59},
  number = {236},
  pages = {433--460},
  doi = {10.1093/oso/9780198250791.003.0017}
}

@inproceedings{DBLP:conf/emnlp/GenzelUO10,
  author = {Dmitriy Genzel and Jakob Uszkoreit and Franz Josef Och},
  title = {'Poetic' Statistical Machine Translation: Rhyme and Meter},
  booktitle = {EMNLP},
  year = {2010},
  pages = {158--166},
  ee = {http://www.aclweb.org/anthology/D10-1016},
  crossref = {DBLP:conf/emnlp/2010},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Crossref parent of DBLP:conf/emnlp/GenzelUO10. Classic BibTeX requires the
% parent entry to appear after every child that references it, so keep it here.
@proceedings{DBLP:conf/emnlp/2010,
  title = {Proceedings of Empirical Methods in Natural Language Processing, EMNLP 2010, 9-11 October 2010, MIT Stata Center, Massachusetts, USA, A meeting of SIGDAT, a Special Interest Group of the ACL},
  booktitle = {EMNLP},
  publisher = {ACL},
  year = {2010},
  isbn = {978-1-932432-86-2},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@article{weizenbaum:83,
  author = {Weizenbaum, Joseph},
  title = {{ELIZA} -- a computer program for the study of natural language communication between man and machine},
  journal = {Commun.
ACM},
  volume = {26},
  number = {1},
  month = jan,
  year = {1983},
  issn = {0001-0782},
  pages = {23--28},
  numpages = {6},
  url = {http://doi.acm.org/10.1145/357980.357991},
  doi = {10.1145/357980.357991},
  acmid = {357991},
  publisher = {ACM},
  address = {New York, NY, USA},
}

@book{WinogradFlores:1986,
  title = {Understanding computers and cognition: {A} new foundation for design},
  author = {Winograd, Terry and Flores, Fernando},
  year = {1986},
  publisher = {Intellect Books},
  address = {Bristol, UK}
}

@book{austin:75,
  address = {Cambridge, MA},
  author = {Austin, John Langshaw},
  interhash = {a49dc923369161c6c7005ae12cb66a0f},
  intrahash = {f145088661029d04e54c1d159df89af4},
  publisher = {Harvard University Press},
  title = {How to do things with words},
  year = {1975},
  timestamp = {2009-02-11T01:07:46.000+0100},
  keywords = {SpeechAct},
  added-at = {2009-02-11T01:07:46.000+0100},
  doi = {10.1093/acprof:oso/9780198245537.001.0001}
}

@book{weizenbaum:76,
  address = {San Francisco},
  author = {Weizenbaum, Joseph},
  citeulike-article-id = {132850},
  keywords = {bibtex-import},
  posted-at = {2005-03-18 14:23:43},
  priority = {0},
  publisher = {W. H. Freeman},
  title = {Computer Power and Human Reason},
  year = {1976}
}

@inproceedings{cucerzan:brill:04,
  author = {S. Cucerzan and E. Brill},
  title = {Spelling correction as an iterative process that exploits the collective knowledge of web users},
  booktitle = {Proceedings of EMNLP 2004},
  pages = {293--300},
  year = {2004}
}

@book{weka,
  author = {Ian H. Witten and Eibe Frank},
  title = {Data Mining: Practical Machine Learning Tools and Techniques},
  publisher = {Morgan Kaufmann},
  year = {2005},
  address = {San Francisco},
  edition = {Second},
  http = {http://www.cs.waikato.ac.nz/~ml/weka/book.html}
}

@misc{perseus,
  author = {Gregory R.
Crane},
  title = {Perseus {D}igital {L}ibrary},
  url = {https://www.perseus.tufts.edu},
  urldate = {2024-04-19},
  year = {2009}
}

@misc{gunther:07,
  author = {Erik Gunther},
  title = {The Most Mispelled},
  howpublished = {Webpage, The Buzz Log, \url{http://buzz.yahoo.com/buzzlog/70226/the-most-misspelled}},
  year = {2007}
}

@inproceedings{gamon-et-al:08,
  author = {Michael Gamon and Jianfeng Gao and Chris Brockett and Alexander Klementiev and William Dolan and Dmitriy Belenko and Lucy Vanderwende},
  title = {Using Contextual Speller Techniques and Language Modeling for {ESL} Error Correction},
  booktitle = {Proceedings of IJCNLP},
  address = {Hyderabad, India},
  year = {2008}
}

@book{gordon:05,
  editor = {Raymond G. Gordon},
  year = {2005},
  title = {Ethnologue: {L}anguages of the World},
  edition = {Fifteenth},
  address = {Dallas, TX},
  publisher = {SIL International},
  url = {https://www.ethnologue.com/},
  urldate = {2024-04-19}
}

@book{sproat:00,
  author = {Richard Sproat},
  title = {A Computational Theory of Writing Systems},
  year = {2000},
  publisher = {Cambridge University Press},
  address = {Cambridge, UK}
}

@book{Sproat-11,
  author = {Richard Sproat},
  title = {Language, Technology, and Society},
  publisher = {Oxford University Press},
  year = {2011},
  address = {Oxford}
}

% NOTE(review): weizenbaum:83 carries the same title with a 1983 date --
% presumably a reprint of this article; confirm which key citations should use.
@article{Weizenbaum:1966,
  title = {{ELIZA} -- a computer program for the study of natural language communication between man and machine},
  author = {Weizenbaum, Joseph},
  journal = {Communications of the {ACM}},
  volume = {9},
  number = {1},
  pages = {36--45},
  editor = {Gerard Salton},
  year = {1966},
  address = {New York},
  doi = {10.1145/365153.365168},
  publisher = {Association for Computing Machinery}
}

@book{daniels:bright:96,
  editor = {Peter T. Daniels and William Bright},
  title = {The World's Writing Systems},
  year = {1996},
  publisher = {Oxford University Press},
  address = {Oxford}
}

@inproceedings{Levesque-etal:2012,
  title = {The {W}inograd schema challenge},
  author = {Levesque, Hector J.
and Davis, Ernest and Morgenstern, Leora},
  booktitle = {Thirteenth {I}nternational {C}onference on the principles of {K}nowledge {R}epresentation and {R}easoning},
  editor = {Brewka, Gerhard and Eiter, Thomas and McIlraith, Sheila},
  address = {Palo Alto},
  publisher = {AAAI (Association for the Advancement of Artificial Intelligence) Press},
  pages = {552--561},
  year = {2012}
}

@article{Ji-etal:2023,
  title = {Survey of hallucination in natural language generation},
  author = {Ji, Ziwei and Lee, Nayeon and Frieske, Rita and Yu, Tiezheng and Su, Dan and Xu, Yan and Ishii, Etsuko and Bang, Ye Jin and Madotto, Andrea and Fung, Pascale},
  journal = {ACM (Association for Computing Machinery) Computing Surveys},
  volume = {55},
  number = {12},
  pages = {1--38},
  year = {2023},
  doi = {10.1145/3571730}
}

@inproceedings{BenderKoller:2020,
  title = {Climbing towards {NLU}: {O}n meaning, form, and understanding in the age of data},
  author = {Bender, Emily M. and Koller, Alexander},
  booktitle = {Proceedings of the 58th annual meeting of the {A}ssociation for {C}omputational {L}inguistics ({ACL})},
  pages = {5185--5198},
  editor = {Dan Jurafsky and Joyce Chai and Natalie Schluter and Joel Tetreault},
  doi = {10.18653/v1/2020.acl-main.463},
  year = {2020}
}

@unpublished{Norvig:2007,
  author = {Norvig, Peter},
  title = {How to Write a Spelling Corrector},
  note = {\url{https://norvig.com/spell-correct.html}},
  year = {2007},
  urldate = {2024-04-17}
}

@incollection{Shieber:1985,
  title = {Evidence against the context-freeness of natural language},
  author = {Shieber, Stuart M.},
  booktitle = {The Formal complexity of natural language},
  pages = {320--334},
  editor = {Savitch, Walter J. and Bach, Emmon and Marsh, William and Safran-Naveh, Gila},
  year = {1985},
  address = {Dordrecht},
  publisher = {Springer},
  doi = {10.1007/978-94-009-2727-8_4}
}

@book{grice:89,
  author = {Grice, H.
Paul},
  publisher = {Harvard University Press},
  title = {Studies in the way of words},
  year = {1989},
  address = {Cambridge, MA},
}

@book{LadefogedJohnson:2014,
  author = {Peter Ladefoged and Keith Johnson},
  title = {A Course in Phonetics},
  publisher = {Cengage Learning},
  edition = {Seventh},
  year = {2014},
  address = {Boston, MA}
}

@book{Jurafsky.Martin-09,
  title = {Speech and Language Processing: {A}n Introduction to Natural Language Processing, Computational Linguistics, and Speech Recognition},
  publisher = {Prentice Hall},
  year = {2009},
  author = {Dan Jurafsky and James H. Martin},
  address = {Upper Saddle River, NJ},
  edition = {Second}
}

@book{mitton:96,
  author = {Roger Mitton},
  title = {English Spelling and the Computer},
  publisher = {Longman},
  address = {London},
  year = {1996}
}

@inproceedings{Green-etal:2013,
  title = {The efficacy of human post-editing for language translation},
  author = {Green, Spence and Heer, Jeffrey and Manning, Christopher D.},
  booktitle = {Proceedings of the {S}pecial {I}nterest {G}roup on {C}omputer-{H}uman {I}nteraction ({SIGCHI}) {C}onference on {H}uman {F}actors in {C}omputing {S}ystems},
  editor = {Mackay, Wendy E.
and Brewster, Stephen and B{\o}dker, Susanne},
  pages = {439--448},
  year = {2013},
  publisher = {Association for Computing Machinery},
  address = {New York},
  doi = {10.1145/2470654.2470718}
}

@inproceedings{TiedemannNygaard:2004,
  title = {The {OPUS} Corpus: {P}arallel and Free \url{{https://opus.nlpl.eu/}}},
  author = {Tiedemann, J{\"o}rg and Nygaard, Lars},
  booktitle = {Proceedings of the Fourth International Conference on Language {R}esources and {E}valuation {C}onference ({LREC})},
  year = {2004},
  editor = {Lino, Maria Teresa and Xavier, Maria Francisca and Ferreira, F{\'a}tima and Costa, Rute and Silva, Raquel and Pereira, Carla and Carvalho, Filipa and Lopes, Milene and Catarino, M{\'o}nica and Barros, S{\'e}rgio},
  address = {Lisbon, Portugal},
  publisher = {European Language Resources Association}
}

@inproceedings{Papineni-etal:2002,
  title = {{BLEU}: {A} method for automatic evaluation of machine translation},
  author = {Papineni, Kishore and Roukos, Salim and Ward, Todd and Zhu, Wei-Jing},
  booktitle = {Proceedings of the 40th {A}nnual {M}eeting of the {A}ssociation for {C}omputational {L}inguistics ({ACL})},
  editor = {Pierre Isabelle and Eugene Charniak and Dekang Lin},
  pages = {311--318},
  year = {2002},
  doi = {10.3115/1073083.1073135}
}

@inproceedings{CohnGoodman:2019,
  title = {Lost in machine translation: {A} method to reduce meaning loss},
  author = {Cohn-Gordon, Reuben and Goodman, Noah},
  booktitle = {Proceedings of the 2019 Conference of the {N}orth {A}merican Chapter of the {A}ssociation for {C}omputational {L}inguistics: {H}uman {L}anguage {T}echnologies ({NAACL-HLT})},
  editor = {Jill Burstein and Christy Doran and Thamar Solorio},
  year = {2019},
  doi = {10.18653/v1/n19-1042}
}

@book{wals,
  address = {Leipzig},
  editor = {Matthew S.
Dryer and Martin Haspelmath},
  publisher = {Max Planck Institute for Evolutionary Anthropology},
  title = {World Atlas of Language Structures ({WALS}) Online},
  url = {https://wals.info/},
  urldate = {2024-04-19},
  year = {2013}
}

@book{johnson:03,
  author = {Keith Johnson},
  title = {Acoustic and Auditory Phonetics},
  publisher = {Blackwell},
  address = {Oxford},
  year = {2003},
  edition = {Second}
}

@article{kukich:92,
  author = {Karen Kukich},
  title = {Techniques for Automatically Correcting Words in Text},
  journal = {ACM Computing Surveys},
  pages = {377--439},
  year = {1992},
  volume = {24},
  number = {4},
  doi = {10.1145/170791.171147}
}

@article{golding:roth:99,
  author = {Andrew R. Golding and Dan Roth},
  title = {A Winnow-Based Approach to Context-Sensitive Spelling Correction},
  journal = {Machine Learning},
  volume = {34},
  number = {1--3},
  pages = {107--130},
  year = {1999},
  url = {citeseer.ist.psu.edu/golding99winnowbased.html}
}

@book{BothaKnight:2009,
  title = {The cradle of language},
  author = {Botha, Rudolf and Knight, Chris},
  year = {2009},
  address = {Oxford},
  publisher = {Oxford University Press},
  doi = {10.1093/oso/9780199545858.001.0001}
}

@inproceedings{jones:martin:97,
  author = {Michael P. Jones and James H. Martin},
  title = {Contextual Spelling Correction Using Latent Semantic Analysis},
  booktitle = {Proceedings of the Fifth Conference on Applied Natural Language Processing (ANLP)},
  year = {1997},
  pages = {166--173},
  address = {Washington, DC}
}

@misc{tillenius:96,
  author = {Mikael Tillenius},
  title = {Efficient generation and ranking of spelling error corrections},
  year = {1996},
  note = {NADA report TRITA-NA-E9621}
}

@article{damerau:64,
  author = {Fred Damerau},
  title = {A technique for computer detection and correction of spelling errors},
  journal = {Communications of the ACM},
  pages = {171--176},
  year = {1964},
  volume = {7},
  number = {3},
  doi = {10.1145/363958.363994}
}

@incollection{wing:baddeley:80,
  author = {Wing, Alan M.
and Baddeley, Alan},
  title = {Spelling errors in handwriting: {A} corpus and distributional analysis},
  booktitle = {Cognitive Processes in Spelling},
  publisher = {Academic Press},
  year = {1980},
  editor = {Frith, Uta},
  address = {London}
}

@article{Huang-etal:2022,
  title = {Chatbots for language learning -- Are they really useful? {A} systematic review of chatbot-supported language learning},
  author = {Huang, Weijiao and Hew, Khe Foon and Fryer, Luke K.},
  journal = {Journal of Computer Assisted Learning},
  volume = {38},
  number = {1},
  pages = {237--257},
  year = {2022},
  doi = {10.1111/jcal.12610}
}

@inproceedings{HonnibalJohnson:2015,
  title = {An improved non-monotonic transition system for dependency parsing},
  author = {Honnibal, Matthew and Johnson, Mark},
  booktitle = {{E}mpirical {M}ethods in {N}atural {L}anguage {P}rocessing ({EMNLP})},
  pages = {1373--1378},
  editor = {Llu{\'\i}s M{\`a}rquez and Chris Callison-Burch and Jian Su},
  doi = {10.18653/v1/d15-1162},
  address = {Lisbon, Portugal},
  publisher = {Association for Computational Linguistics (ACL) Anthology},
  year = {2015}
}

@inproceedings{deMarneffe-etal:2006,
  title = {Generating typed dependency parses from phrase structure parses},
  author = {de Marneffe, Marie-Catherine and MacCartney, Bill and Manning, Christopher D.},
  booktitle = {Proceedings of the Fifth International Conference on Language {R}esources and {E}valuation {C}onference ({LREC})},
  volume = {6},
  editor = {Nicoletta Calzolari and Khalid Choukri and Aldo Gangemi and Bente Maegaard and Joseph Mariani and Jan Odijk and Daniel Tapias},
  address = {Genoa, Italy},
  pages = {449--454},
  publisher = {European Language Resources Association},
  year = {2006}
}

@unpublished{Neubig:2017,
  title = {Neural machine translation and sequence-to-sequence models: {A} tutorial},
  author = {Neubig, Graham},
  note = {arXiv preprint: arXiv:1703.01619},
  doi = {10.48550/arXiv.1703.01619},
  year = {2017}
}

@inproceedings{NordhoffKramer:2022,
  title = {{IMTV}ault: {E}xtracting and Enriching Low-resource Language Interlinear Glossed
Text from Grammatical Descriptions and Typological Survey Articles},
  author = {Nordhoff, Sebastian and Kr{\"a}mer, Thomas},
  booktitle = {Proceedings of the 8th Workshop on {L}inked {D}ata in {L}inguistics within the 13th {L}anguage {R}esources and {E}valuation {C}onference ({LREC})},
  pages = {17--25},
  editor = {Declerck, Thierry and McCrae, John P. and Montiel, Elena and Chiarcos, Christian and Ionov, Maxim},
  address = {Marseille, France},
  year = {2022},
  publisher = {European Language Resources Association}
}

@TechReport{russell:18,
  author = {Russell, Robert C.},
  title = {U.{S}. Patent Numbers 1,261,167 (1918) and 1,435,663 (1922)},
  institution = {U.S. Patent Office},
  year = 1918,
  address = {Washington, D.C.}
}

@TechReport{Hajaj:2015,
  author = {Hajaj, Nissan},
  title = {Producing a ranking for pages using distances in a web-link graph (U.{S}. Patent Number 9,165,040 B1)},
  institution = {U.S. Patent Office},
  year = 2015,
  address = {Washington, D.C.}
}

@unpublished{ACTFL,
  author = {{American Council on the Teaching of Foreign Languages}},
  title = {{ACTFL} Proficiency Guidelines},
  year = {2024},
  URL = {https://www.actfl.org/uploads/files/general/Resources-Publications/ACTFL_Proficiency_Guidelines_2024.pdf},
  address = {Alexandria, VA},
  urldate = {2024-07-01}
}

@book{CEFR,
  author = {{Council of Europe}},
  title = {Common European Framework of Reference for Languages},
  address = {Cambridge, UK},
  publisher = {Cambridge University Press},
  year = {2001}
}

@MastersThesis{naber:03,
  author = {Daniel Naber},
  title = {A Rule-Based Style and Grammar Checker},
  school = {Technische Fakult{\"a}t, Universit{\"a}t Bielefeld},
  year = {2003}
}

@inproceedings{Nivre-etal:2016,
  title = {Universal dependencies v.1: {A} multilingual treebank collection},
  author = {Nivre, Joakim and de Marneffe, Marie-Catherine and Ginter, Filip and Goldberg, Yoav and Haji{\v{c}}, Jan and Manning, Christopher D.
and McDonald, Ryan and Petrov, Slav and Pyysalo, Sampo and Silveira, Natalia and Tsarfaty, Reut and Zeman, Daniel},
  booktitle = {Proceedings of the Tenth International {L}anguage {R}esources and {E}valuation {C}onference ({LREC})},
  editor = {Nicoletta Calzolari and Khalid Choukri and Thierry Declerck and Sara Goggi and Marko Grobelnik and Bente Maegaard and Joseph Mariani and Helene Mazo and Asuncion Moreno and Jan Odijk and Stelios Piperidis},
  pages = {1659--1666},
  address = {Portoro{\v{z}}, Slovenia},
  publisher = {European Language Resources Association},
  year = {2016}
}

@article{Haffner:1992,
  title = {Translation is not enough: {I}nterpreting in a medical setting},
  author = {Haffner, Linda},
  journal = {Western Journal of Medicine},
  volume = {157},
  number = {3},
  pages = {255--259},
  year = {1992}
}

@article{Lu-etal:2015,
  title = {Recommender system application developments: {A} survey},
  author = {Lu, Jie and Wu, Dianshuang and Mao, Mingsong and Wang, Wei and Zhang, Guangquan},
  journal = {Decision Support Systems},
  volume = {74},
  pages = {12--32},
  year = {2015},
  publisher = {Elsevier},
  doi = {10.1016/j.dss.2015.03.008}
}

@inproceedings{Rajpurkar-etal:2016,
  title = {{SQ}u{AD}: 100,000+ questions for machine comprehension of text},
  author = {Rajpurkar, Pranav and Zhang, Jian and Lopyrev, Konstantin and Liang, Percy},
  booktitle = {Proceedings of the 2016 conference on {E}mpirical {M}ethods in {N}atural {L}anguage {P}rocessing ({EMNLP})},
  address = {Austin, TX},
  publisher = {Association for Computational Linguistics},
  editor = {Jian Su and Kevin Duh and Xavier Carreras},
  year = {2016},
  pages = {2383--2392},
  doi = {10.18653/v1/d16-1264}
}

@book{FrancisKucera:1979,
  author = {Francis, W. Nelson and Ku{\v{c}}era, Henry},
  title = {Brown corpus manual},
  publisher = {Brown University},
  address = {Providence, RI},
  year = {1979}
}

@article{GriesSlocum:2017,
  title = {Ordinary meaning and corpus linguistics},
  author = {Gries, Stefan Th.
and Slocum, Brian G.},
  journal = {Brigham Young University Law Review},
  year = {2017},
  pages = {1417--1472},
  number = {6}
}

@article{Hessick:2017,
  title = {Corpus linguistics and the criminal law},
  author = {Hessick, Carissa Byrne},
  journal = {Brigham Young University Law Review},
  year = {2017},
  pages = {1504--1530},
  number = {6}
}

@book{Cowan:1983,
  title = {More work for {M}other},
  author = {Cowan, Ruth Schwartz},
  year = {1983},
  address = {New York},
  publisher = {Basic Books}
}

@article{SparckJones:1972,
  title = {A statistical interpretation of term specificity and its application in retrieval},
  author = {Sp{\"a}rck Jones, Karen},
  journal = {Journal of Documentation},
  volume = {28},
  number = {1},
  pages = {11--21},
  year = {1972}
}

@inproceedings{Mikolov-etal:2013b,
  title = {Linguistic regularities in continuous space word representations},
  author = {Mikolov, Tom{\'a}{\v{s}} and Yih, Wen-tau and Zweig, Geoffrey},
  booktitle = {Proceedings of the 2013 conference of the {N}orth {A}merican {C}hapter of the {A}ssociation for {C}omputational {L}inguistics: {H}uman {L}anguage {T}echnologies},
  pages = {746--751},
  address = {Atlanta, Georgia},
  publisher = {Association for Computational Linguistics},
  editor = {Vanderwende, Lucy and Daum{\'e} III, Hal and Kirchhoff, Katrin},
  year = {2013}
}

@book{Heaps:1978,
  title = {Information retrieval: {C}omputational and theoretical aspects},
  author = {Heaps, Harold Stanley},
  year = {1978},
  address = {Cambridge, MA},
  publisher = {Academic Press}
}

@book{BunardAston:1998,
  title = {The {BNC} handbook: {E}xploring the {B}ritish {N}ational {C}orpus},
  author = {Burnard, Lou and Aston, Guy},
  address = {Edinburgh, UK},
  publisher = {Edinburgh University Press},
  year = {1998}
}

@article{Marian-etal:2012,
  title = {{CLEARPOND}: {C}ross-linguistic easy-access resource for phonological and orthographic neighborhood densities},
  author = {Marian, Viorica and Bartolotti, James and Chabal, Sarah and Shook, Anthony},
  journal = {PLoS ONE},
  volume = {7},
  number = {8},
  pages = {e43230},
  year = {2012},
  publisher = {Public Library of Science},
  doi = {10.1371/journal.pone.0043230}
}

@inproceedings{Baumgartner-etal:2020,
title={The {P}ush{S}hift {R}eddit dataset}, author={Baumgartner, Jason and Zannettou, Savvas and Keegan, Brian and Squire, Megan and Blackburn, Jeremy}, booktitle={Proceedings of the {I}nternational {AAAI} {C}onference on {W}eb and {S}ocial {M}edia}, editor = {De Choudhury, Munmun and Chunara, Rumi and Culotta, Aron and Welle, Brooke Foucault}, volume={14}, pages={830--839}, year={2020}, doi = {10.1609/icwsm.v14i1.7347} } @article{Hockett:1960, title={The origin of speech}, author={Hockett, Charles F.}, journal={Scientific American}, volume={203}, number={3}, pages={88--97}, year={1960}, doi = {10.1038/scientificamerican0960-88} } @inproceedings{LoperBird:2002, title={{NLTK}: {T}he natural language toolkit}, author={Loper, Edward and Bird, Steven}, booktitle={Proceedings of the {A}ssociation for {C}omputational {L}inguistics ({ACL}) {W}orkshop on {E}ffective {T}ools and {M}ethodologies for {T}eaching {N}atural {L}anguage {P}rocessing and {C}omputational {L}inguistics}, editor = {Chris Brew and Michael Rosner and Dragomir Radev}, year={2002}, address = {Philadelphia, PA}, pages = {63--70}, doi = {10.3115/1118108.1118117} } @book{McCulloch:2020, title={Because internet: {U}nderstanding the new rules of language}, author={McCulloch, Gretchen}, year={2020}, address = {New York}, publisher={Riverhead Books} } @inproceedings{ReddyKnight:2011, title={What we know about the {V}oynich manuscript}, author={Reddy, Sravana and Knight, Kevin}, booktitle={Proceedings of the 5th {ACL-HLT} workshop on language technology for cultural heritage, social sciences, and humanities}, editor = {Kalliopi Zervanou and Piroska Lendvai}, pages={78--86}, year={2011} } @inproceedings{Mohammad:2018, title={Obtaining reliable human ratings of valence, arousal, and dominance for 20,000 {E}nglish words}, author={Mohammad, Saif}, booktitle={Proceedings of the 56th {A}nnual {M}eeting of the {A}ssociation for {C}omputational {L}inguistics}, editor = {Iryna Gurevych and Yusuke Miyao}, volume = {1: Long 
papers},
  pages = {174--184},
  year = {2018},
  doi = {10.18653/v1/p18-1017}
}

@article{Munday:2016,
  title = {The case for using {D}UOLINGO as part of the language classroom experience},
  author = {Munday, Pilar},
  journal = {RIED: Revista Iberoamericana de Educaci{\'o}n a Distancia},
  volume = {19},
  number = {1},
  pages = {83--101},
  year = {2016},
  doi = {10.5944/ried.19.1.14581}
}

@book{Meskill:2002,
  title = {Teaching and learning in real time: {M}edia, technologies, and language acquisition},
  author = {Meskill, Carla},
  year = {2002},
  address = {Houston, TX},
  publisher = {Athelstan}
}

@article{BowernLindemann:2021,
  title = {The linguistics of the {V}oynich manuscript},
  author = {Bowern, Claire L. and Lindemann, Luke},
  journal = {Annual Review of Linguistics},
  volume = {7},
  pages = {285--308},
  year = {2021},
  publisher = {Annual Reviews},
  doi = {10.1146/annurev-linguistics-011619-030613}
}

@InProceedings{kernighan-et-al:90,
  author = {Mark D. Kernighan and Kenneth W. Church and William A. Gale},
  title = {A Spelling Correction Program Based on a Noisy Channel Model},
  booktitle = {Proceedings of COLING-90},
  pages = {205--210},
  year = {1990}
}

@Article{mcilroy:82,
  author = {M. D. McIlroy},
  title = {Development of a Spelling List},
  journal = {IEEE Transactions on Communications},
  pages = {91--99},
  year = {1982},
  volume = {30}
}

@InProceedings{domeij-et-al:00,
  author = {Richard Domeij and Ola Knutsson and Johan Carlberger and Viggo Kann},
  title = {Granska -- an efficient hybrid system for Swedish grammar checking},
  booktitle = {Proceedings of Nodalida '99},
  pages = {49--56},
  year = {2000},
  address = {Trondheim, Norway}
}

@InProceedings{brill:moore:00,
  author = {Eric Brill and Robert C.
Moore},
  title = {An improved error model for noisy channel spelling correction},
  booktitle = {Proceedings of the 38th Annual Meeting of the Association for Computational Linguistics (ACL 2000)},
  year = {2000},
  address = {Hong Kong}
}

@book{fellbaum:98,
  editor = {Christiane Fellbaum},
  title = {Word{N}et: {A}n Electronic Lexical Database},
  year = {1998},
  publisher = {MIT Press},
  address = {Cambridge, MA},
  doi = {10.7551/mitpress/7287.003.0004}
}

@inproceedings{Rudzewitz-etal:2017,
  title = {Developing a web-based workbook for {E}nglish supporting the interaction of students and teachers},
  author = {Rudzewitz, Bj{\"o}rn and Ziai, Ramon and De Kuthy, Kordula and Meurers, Detmar},
  booktitle = {Proceedings of the {J}oint {W}orkshop on {NLP} for {C}omputer {A}ssisted {L}anguage {L}earning and {NLP} for {L}anguage {A}cquisition},
  pages = {36--46},
  publisher = {Link{\"o}ping Electronic Conference Proceedings},
  volume = {134},
  editor = {Elena Volodina and Gintare Grigonyte and Ildik{\'o} Pil{\'a}n and Kristina Nilsson Bj{\"o}rkenstam and Lars Borin},
  address = {Ume{\aa}, Sweden},
  year = {2017}
}

@book{Tannen:1990,
  title = {You just don't understand: {W}omen and men in conversation},
  author = {Tannen, Deborah},
  year = {1990},
  address = {New York},
  publisher = {Ballantine Books}
}

@book{Turkle-95,
  author = {Turkle, Sherry},
  publisher = {Simon and Schuster},
  address = {New York},
  note = {Paperback edition by Touchstone, New York, 1997},
  title = {Life on the Screen: Identity in the Age of the Internet},
  year = {1995}
}

@article{Meurers-etal:2019,
  title = {Scaling up intervention studies to investigate real-life foreign language learning in school},
  author = {Meurers, Detmar and De Kuthy, Kordula and Nuxoll, Florian and Rudzewitz, Bj{\"o}rn and Ziai, Ramon},
  journal = {Annual Review of Applied Linguistics},
  volume = {39},
  pages = {161--188},
  year = {2019},
  doi = {10.1017/s0267190519000126}
}

@Book{Hopcroft.Motwani.Ullman-07,
  author = {Hopcroft, John Edward and Motwani, Rajeev and Ullman, Jeffrey David},
  title =
{Introduction to automata theory, languages, and computation},
  address = {Boston, MA},
  publisher = {Addison-Wesley},
  year = 2007,
  edition = 3
}

@article{Terrace.Petitto.ea-79,
  author = {Terrace, H. S. and Petitto, L. A. and Sanders, R. J. and Bever, T. G.},
  title = {Can an ape create a sentence?},
  volume = {206},
  number = {4421},
  pages = {891--902},
  year = {1979},
  doi = {10.1126/science.504995},
  abstract = {More than 19,000 multisign utterances of an infant chimpanzee (Nim) were analyzed for syntactic and semantic regularities. Lexical regularities were observed in the case of two-sign combinations: particular signs (for example, more) tended to occur in a particular position. These regularities could not be attributed to memorization or to position habits, suggesting that they were structurally constrained. That conclusion, however, was invalidated by videotape analyses, which showed that most of Nim's utterances were prompted by his teacher's prior utterance, and that Nim interrupted his teachers to a much larger extent than a child interrupts an adult's speech.
Signed utterances of other apes (as shown on films) revealed similar non-human patterns of discourse.},
  URL = {http://www.sciencemag.org/content/206/4421/891.abstract},
  eprint = {http://www.sciencemag.org/content/206/4421/891.full.pdf},
  journal = {Science}
}

@article{Patterson-81,
  author = {Patterson, Francine G.},
  title = {Ape Language},
  volume = {211},
  number = {4477},
  pages = {86--87},
  year = {1981},
  doi = {10.1126/science.211.4477.86-a},
  URL = {http://www.sciencemag.org/content/211/4477/86.1.short},
  eprint = {http://www.sciencemag.org/content/211/4477/86.1.full.pdf},
  journal = {Science}
}

@book{Vygotsky:1978,
  title = {Mind in society: {D}evelopment of higher psychological processes},
  author = {Vygotsky, Lev Semenovich},
  year = {1978},
  address = {Cambridge, MA},
  editor = {Michael Cole and Vera John-Steiner and Sylvia Scribner and Ellen Souberman},
  note = {Translated from Russian original published 1930-1933},
  publisher = {Harvard University Press},
  doi = {10.2307/j.ctvjf9vz4.17}
}

@article{Lingard:2023,
  title = {Writing with {ChatGPT}: {A}n illustration of its capacity, limitations and implications for academic writers},
  author = {Lingard, Lorelei},
  journal = {Perspectives on Medical Education},
  volume = {12},
  number = {1},
  pages = {261--270},
  year = {2023},
  publisher = {Ubiquity Press},
  doi = {10.5334/pme.1072}
}

@book{Tesniere:1929,
  title = {Elements of structural syntax},
  author = {Tesni{\`e}re, Lucien},
  year = {2015 [1929]},
  note = {Originally published in French in 1929, as \emph{\'El\'ements de syntaxe structurale}},
  translator = {Timothy Osborne and Sylvain Kahane},
  doi = {10.1075/z.185},
  address = {Amsterdam},
  publisher = {John Benjamins}
}

@article{BockMiller:1991,
  title = {Broken agreement},
  author = {Bock, Kathryn and Miller, Carol A.},
  journal = {Cognitive Psychology},
  volume = {23},
  number = {1},
  pages = {45--93},
  year = {1991},
  publisher = {Elsevier},
  doi = {10.1016/0010-0285(91)90003-7}
}

@inproceedings{Sankoff:1992,
  title = {Edit distance for genome comparison based on non-local operations},
author={Sankoff, David}, booktitle={Annual Symposium on Combinatorial Pattern Matching}, pages={121--135}, editor = {Alberto Apostolico and Maxime Crochemore and Zvi Galil and Udi Manber}, year={1992}, address = {Berlin}, organization={Springer}, doi = {10.1007/3-540-56024-6_10} } @book{Benenson:2010, author = {Benenson, Fred}, title = {Emoji {D}ick}, publisher = {Self-published}, note = {Translation of Herman Melville's novel \emph{Moby Dick} (1851) by workers on the Mechanical Turk platform}, year = {2010} } @article{White-etal:2008, title={Eye movements when reading transposed text: The importance of word-beginning letters}, author={White, Sarah J. and Johnson, Rebecca L. and Liversedge, Simon P and Rayner, Keith}, journal={Journal of Experimental Psychology: Human Perception and Performance}, volume={34}, number={5}, pages={1261--1276}, year={2008} } @Article{galletta-et-al:04, author = {D.F. Galletta and A. Durcikova and A. Everard and B. Jones}, title = {Does Spell-Checking Software Need a Warning Label?}, journal = {Communications of the ACM}, year = {2005}, volume = {48}, number = {7} } @inproceedings{Wilcox-etal:2008, title={Real-word spelling correction with trigrams: {A} reconsideration of the {M}ays, {D}amerau, and {M}ercer model}, author={Wilcox-O’Hearn, Amber and Hirst, Graeme and Budanitsky, Alexander}, booktitle={Computational {L}inguistics and {I}ntelligent {T}ext {P}rocessing ({CICL}ing)}, pages={605--616}, editor = {Alexander Gelbukh}, address = {Berlin}, publisher = {Springer-Verlag}, doi = {10.1007/978-3-540-78135-6_52}, year={2008} } @article{hirst:budanitsky:05, author = {Graeme Hirst and Alexander Budanitsky}, title = {Correcting real-word spelling errors by restoring lexical cohesion}, journal = {Natural Language Engineering}, volume = {11}, number = {1}, year = {2005}, pages = {87--111}, doi = {10.1017/s1351324904003560} } @article{mays-et-al:91, author = {Eric Mays and Fred J. Damerau and Robert L. 
Mercer},
  year = {1991},
  title = {Context based spelling correction},
  journal = {Information Processing and Management},
  volume = 27,
  number = 5,
  pages = {517--522}
}

@MastersThesis{verberne:02,
  author = {Suzan Verberne},
  title = {Context-sensitive spell checking based on trigram probabilities},
  school = {University of Nijmegen},
  year = {2002}
}

@InProceedings{mangu:brill:97,
  author = {Lidia Mangu and Eric Brill},
  title = {Automatic Rule Acquisition for Spelling Correction},
  booktitle = {ICML},
  year = {1997}
}

@InProceedings{cafarella:ea:07,
  author = {Michael J. Cafarella and Christopher Re and Dan Suciu and Oren Etzioni and Michele Banko},
  year = {2007},
  title = {Structured Querying of Web Text: A Technical Challenge},
  booktitle = {Proceedings of the Conference on Innovative Data Systems Research (CIDR) 2007},
  address = {Asilomar, CA}
}

@Book{manning-et-al:08,
  author = {Christopher D. Manning and Prabhakar Raghavan and Hinrich Sch{\"u}tze},
  title = {Introduction to Information Retrieval},
  address = {Cambridge, UK},
  publisher = {Cambridge University Press},
  year = {2008},
  doi = {10.1017/cbo9780511809071}
}

@techreport{pagerank:99,
  month = sep,
  author = {Lawrence Page and Sergey Brin and Rajeev Motwani and Terry Winograd},
  title = {The {P}age{R}ank Citation Ranking: {B}ringing Order to the Web},
  type = {Technical report},
  publisher = {Stanford InfoLab},
  year = {1999},
  institution = {Stanford InfoLab}
}

@Book{partee-et-al:90,
  author = {Partee, Barbara H. and ter Meulen, Alice and Wall, Robert},
  title = {Mathematical Methods in Linguistics},
  address = {Dordrecht},
  publisher = {Kluwer},
  year = 1990,
  doi = {10.1007/978-94-009-2213-6}
}

@Book{mcenery-et-al:06,
  author = {Tony McEnery and Richard Xiao and Yukio Tono},
  title = {Corpus-Based Language Studies},
  publisher = {Routledge},
  year = {2006},
  address = {Oxford, UK}
}

@InCollection{sharoff:06,
  author = {Serge Sharoff},
  title = {Creating general-purpose corpora using automated search engine queries},
  booktitle = {WaCky!
Working papers on the Web as Corpus},
  year = {2006},
  editor = {Marco Baroni and Silvia Bernardini},
  address = {Bologna},
  publisher = {GEDIT},
  note = {\url{http://wackybook.sslmit.unibo.it/pdfs/sharoff.pdf}}
}

@InProceedings{baroni:kilgarriff:06,
  author = {Marco Baroni and Adam Kilgarriff},
  title = {Large linguistically-processed Web corpora for multiple languages},
  booktitle = {Proceedings of EACL-06, Demonstration Session},
  year = {2006},
  address = {Trento, Italy},
  note = {\url{http://aclweb.org/anthology-new/E/E06/E06-2001.pdf}}
}

@Article{Suominen.Lehtikunnas.ea-07,
  author = {Suominen, Hanna and Lehtikunnas, Tuija and Back, Barbro and Karsten, Helena and Salakoski, Tapio and Salanter{\"a}, Sanna},
  file = {Suominen.Lehtikunnas.ea-07.pdf:Suominen.Lehtikunnas.ea-07.pdf:PDF},
  issn = {1386-5056},
  journal = {Int J Med Inform},
  keywords = {Ethics, Natural language processing, Computerized patient records, Nursing records, Intensive care, Nursing},
  month = oct,
  pages = {S293--S301},
  publisher = {Elsevier Science Ireland Ltd.},
  refid = {S1386-5056(07)00101-3},
  timestamp = {2009.08.18},
  title = {Applying language technology to nursing documents: Pros and cons with a focus on ethics},
  url = {http://linkinghub.elsevier.com/retrieve/pii/S1386505607001013},
  volume = {76},
  year = {2007}
}

@Book{Crystal-11,
  author = {David Crystal},
  title = {The {C}ambridge Encyclopedia of Language},
  publisher = {Cambridge University Press},
  year = 2011,
  address = {Cambridge, UK},
  edition = {3},
  doi = {10.1017/9781108528931}
}

@InCollection{Heisig-09,
  author = {Heisig, Ulrich},
  booktitle = {International Handbook of Education for the Changing World of Work},
  pages = {1639--1651},
  publisher = {Springer},
  timestamp = {2009.08.19},
  title = {The Deskilling and Upskilling Debate},
  doi = {10.1007/978-1-4020-5281-1_110},
  year = {2009}
}

@ARTICLE{Bowerman-90,
  author = {Chris Bowerman},
  title = {{ICALL}: An Underview of the State of the Art in Computer-aided language teaching},
  journal = {CALL},
  year = {1990},
  volume = {3},
  pages =
{45--54},
  file = {Bowerman-90.pdf:Bowerman-90.pdf:PDF},
  owner = {cfath},
  timestamp = {2009.03.06},
  url = {http://www.cet.sunderland.ac.uk/cbowww/PAPERS/icai2.txt}
}

@BOOK{Heift.Schulze-07,
  title = {Errors and Intelligence in Computer-Assisted Language Learning: {P}arsers and Pedagogues},
  address = {Oxford, UK},
  publisher = {Routledge},
  year = {2007},
  author = {Trude Heift and Mathias Schulze},
  doi = {10.4324/9780203012215}
}

@ARTICLE{Amaral.Meurers-11,
  author = {Luiz Amaral and Detmar Meurers},
  title = {On Using Intelligent Computer-Assisted Language Learning in Real-Life Foreign Language Teaching and Learning},
  journal = {ReCALL},
  year = {2011},
  volume = {23},
  pages = {4--24},
  number = {1},
  month = jan,
  file = {Published version:Amaral.Meurers-11.pdf:PDF;Submitted version:Amaral.Meurers-11-Submitted.pdf:PDF},
  doi = {10.1017/s0958344010000261}
}

@PHDTHESIS{DiazNegrillo-07,
  author = {Ana D{\'i}az-Negrillo},
  title = {A Fine-Grained Error Tagger for Learner Corpora},
  school = {University of Ja{\'e}n, Spain},
  year = {2007},
  file = {DiazNegrillo-07.pdf:DiazNegrillo-07.pdf:PDF}
}

@ARTICLE{DiazNegrillo.Meurers.ea-09,
  author = {Ana {D{\'i}az Negrillo} and Detmar Meurers and Salvador Valera and Holger Wunsch},
  title = {Towards interlanguage {POS} annotation for effective learner corpora in {SLA} and {FLT}},
  journal = {Language Forum},
  year = {2010},
  volume = {36},
  pages = {139--154},
  number = {1--2},
  note = {Special issue on corpus linguistics for teaching and learning in honour of John Sinclair},
  address = {New Delhi},
  editor = {Mar{\'i}a Moreno Ja{\'e}n and Carmen P{\'e}rez Basanta},
  file = {DiazNegrillo.Meurers.ea-09.pdf:DiazNegrillo.Meurers.ea-09.pdf:PDF},
  publisher = {Bahri Publications}
}

@Article{Lu-07,
  author = {Xiaofei Lu},
  title = {A Hybrid Model for {C}hinese Word Segmentation},
  journal = {LDV-Forum},
  volume = 22,
  number = 1,
  pages = {71--88},
  year = 2007,
  doi = {10.21248/jlcl.22.2007.90}
}

@Article{hauser:chomsky:fitch,
  author = {Hauser, Marc D. and Chomsky, Noam and Fitch, W.
Tecumseh},
  title = {The Faculty of Language: What Is It, Who Has It, and How Did It Evolve?},
  journal = {Science},
  year = 2002,
  volume = 298,
  number = 5598,
  pages = {1569--1579}
}

@article{BarHillel:80,
  title = {The base-rate fallacy in probability judgments},
  journal = {Acta Psychologica},
  volume = {44},
  number = {3},
  pages = {211--233},
  year = {1980},
  issn = {0001-6918},
  author = {Maya Bar-Hillel},
  doi = {10.21236/ada045772}
}

@incollection{Meurers-20,
  address = {Oxford},
  author = {Detmar Meurers},
  booktitle = {The Concise Encyclopedia of Applied Linguistics},
  editor = {Carol A. Chapelle},
  pages = {817--831},
  publisher = {Wiley},
  title = {Natural Language Processing and Language Learning},
  year = {2020},
  doi = {10.1002/9781405198431.wbeal0858}
}

@Book{Holland.Kaplan.Sams-2013,
  editor = {Holland, V. Melissa and Kaplan, Jonathan D. and Sams, Michelle R.},
  title = {Intelligent language tutors: {T}heory shaping technology},
  edition = {3},
  publisher = {Routledge},
  address = {Oxford, UK},
  year = {2013},
  doi = {10.4324/9781315044811}
}

@unpublished{Alammar:2018,
  author = {Alammar, Jay},
  title = {The illustrated transformer},
  URL = {https://jalammar.github.io/illustrated-transformer/},
  urldate = {2024-07-03},
  note = {Blog post},
  year = {2018}
}

@unpublished{Parrish:2018,
  author = {Parrish, Allison},
  title = {Understanding word vectors},
  URL = {https://gist.github.com/aparrish/2f562e3737544cf29aaf1af30362f469},
  urldate = {2024-07-03},
  note = {Blog post},
  year = {2018}
}

@Book{LanguageFiles13,
  editor = {{The Ohio State University Department of Linguistics}},
  title = {Language Files: {M}aterials for an Introduction to Language and Linguistics},
  publisher = {The Ohio State University Press},
  year = {2022},
  address = {Columbus, OH},
  edition = {13}
}

@book{DBLP:books/daglib/0070470,
  author = {William J. Hutchins and Harold L.
Somers},
  title = {An introduction to machine translation},
  publisher = {Academic Press},
  year = {1992},
  isbn = {978-0-12-362830-5},
  pages = {I--XXI, 1--362},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@Book{koehn,
  author = {Philipp Koehn},
  title = {Statistical Machine Translation},
  publisher = {Cambridge University Press},
  year = {2008},
  address = {Cambridge, England}
}

@inproceedings{Deng-etal:2009,
  title = {Image{N}et: {A} large-scale hierarchical image database},
  author = {Deng, Jia and Dong, Wei and Socher, Richard and Li, Li-Jia and Li, Kai and Li, Fei-Fei},
  booktitle = {2009 {IEEE} ({I}nstitute of {E}lectrical and {E}lectronics {E}ngineers) {C}onference on {C}omputer {V}ision and {P}attern {R}ecognition},
  pages = {248--255},
  year = {2009},
  editor = {Daniel Huttenlocher and Gerard Medioni and James Rehg},
  publisher = {Institute of Electrical and Electronics Engineers},
  address = {Miami, FL},
  doi = {10.1109/cvpr.2009.5206848}
}

@inproceedings{Dagan-etal:2005,
  title = {The {P}ascal Recognising Textual Entailment challenge},
  author = {Dagan, Ido and Glickman, Oren and Magnini, Bernardo},
  booktitle = {Machine {L}earning {C}hallenges {W}orkshop},
  pages = {177--190},
  year = {2005},
  editor = {Joaquin Qui{\~n}onero-Candela and Ido Dagan and Bernardo Magnini and Florence d'Alch{\'e}-Buc},
  address = {Southampton, UK},
  doi = {10.1007/11736790_9}
}

@inproceedings{EthJurafsky:2020,
  title = {Utility is in the eye of the user: {A} critique of {NLP} leaderboards},
  author = {Ethayarajh, Kawin and Jurafsky, Dan},
  booktitle = {Proceedings of the 2020 conference on {E}mpirical {M}ethods in {N}atural {L}anguage {P}rocessing ({EMNLP})},
  pages = {4846--4853},
  editor = {Bonnie Webber and Trevor Cohn and Yulan He and Yang Liu},
  address = {Online},
  publisher = {Association for Computational Linguistics},
  year = {2020},
  doi = {10.18653/v1/2020.emnlp-main.393}
}

@inproceedings{Nie-etal:2020,
  title = {Adversarial {NLI}: {A} new benchmark for natural language understanding},
  author = {Nie, Yixin and Williams, Adina and Dinan, Emily and
Bansal, Mohit and Weston, Jason and Kiela, Douwe},
  booktitle = {Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics ({ACL})},
  editor = {Dan Jurafsky and Joyce Chai and Natalie Schluter and Joel Tetreault},
  pages = {4885--4901},
  address = {Online},
  year = {2020},
  doi = {10.18653/v1/2020.acl-main.441}
}

@inproceedings{Wang-etal:2019,
  title = {Super{GLUE}: {A} stickier benchmark for general-purpose language understanding systems},
  author = {Wang, Alex and Pruksachatkun, Yada and Nangia, Nikita and Singh, Amanpreet and Michael, Julian and Hill, Felix and Levy, Omer and Bowman, Samuel},
  editor = {Hanna Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'e}-Buc and Edward Fox and Roman Garnett},
  booktitle = {Advances in {N}eural {I}nformation {P}rocessing {S}ystems},
  volume = {32},
  year = {2019},
  publisher = {Curran Associates, Inc.},
  address = {Vancouver}
}

@inproceedings{Wang-etal:2018,
  title = {{GLUE}: {A} multi-task benchmark and analysis platform for natural language understanding},
  author = {Wang, Alex and Singh, Amanpreet and Michael, Julian and Hill, Felix and Levy, Omer and Bowman, Samuel R.},
  booktitle = {Proceedings of the {B}lackbox{NLP} {W}orkshop at {EMNLP}: {A}nalyzing and {I}nterpreting {N}eural {N}etworks for {NLP}},
  year = {2018},
  address = {Brussels},
  editor = {Tal Linzen and Grzegorz Chrupa{\l}a and Afra Alishahi},
  pages = {353--355},
  publisher = {Association for Computational Linguistics},
  doi = {10.18653/v1/w18-5446}
}

@Book{Swartz.Yazdani-92,
  editor = {Swartz, Merryanna L.
and Yazdani, Masoud},
  title = {Intelligent tutoring systems for foreign language learning: {T}he bridge to international communication},
  publisher = {Springer},
  year = 1992,
  address = {Berlin},
  doi = {10.1007/978-3-642-77202-3}
}

@inproceedings{Speer-etal:2017,
  title = {Concept{N}et 5.5: {A}n open multilingual graph of general knowledge},
  author = {Speer, Robyn and Chin, Joshua and Havasi, Catherine},
  booktitle = {Proceedings of the {AAAI} {C}onference on {A}rtificial {I}ntelligence},
  volume = {31},
  number = {1},
  year = {2017},
  address = {San Francisco, CA},
  editor = {Singh, Satinder and Markovitch, Shaul},
  publisher = {AAAI Press},
  doi = {10.1609/aaai.v31i1.11164}
}

@ARTICLE{Amaral.Meurers-08,
  author = {Luiz Amaral and Detmar Meurers},
  title = {From Recording Linguistic Competence to Supporting Inferences about Language Acquisition in Context: Extending the Conceptualization of Student Models for Intelligent Computer-Assisted Language Learning},
  journal = {Computer-Assisted Language Learning},
  year = 2008,
  volume = 21,
  pages = {323--338},
  number = 4,
  file = {:Amaral.Meurers-08.pdf:PDF},
  url = {http://purl.org/dm/papers/amaral-meurers-call08.html}
}

@Article{kilgarriff:07,
  author = {Adam Kilgarriff},
  title = {Googleology is Bad Science},
  journal = {Computational Linguistics},
  year = {2007},
  volume = {33},
  number = {1},
  pages = {147--151}
}

@article{madnani:09,
  Author = {Nitin Madnani},
  Journal = {The Python Papers},
  Title = {Querying and Serving {N}-gram Language Models with {Python}},
  Volume = {4},
  Number = {2},
  Year = {2009},
  url = {http://www.desilinguist.org/pdf/langmodel.pdf}
}

@InProceedings{stolcke:02,
  author = {Andreas Stolcke},
  title = {{SRILM} -- An Extensible Language Modeling Toolkit},
  booktitle = {Proceedings of the International Conference on Spoken Language Processing},
  year = {2002},
  address = {Denver, CO}
}

@Article{mccarthy:09,
  author = {Diana McCarthy},
  title = {Word Sense Disambiguation: An Overview},
  journal = {Language and
Linguistics Compass},
  year = {2009},
  volume = {3},
  number = {2},
  pages = {537--558}
}

@Book{leacock-et-al:10,
  author = {Claudia Leacock and Martin Chodorow and Michael Gamon and Joel Tetreault},
  title = {Automated Grammatical Error Detection for Language Learners},
  publisher = {Morgan \& Claypool},
  year = {2010},
  series = {Synthesis Lectures on Human Language Technologies},
  doi = {10.1007/978-3-031-02137-4},
  address = {San Rafael, CA}
}

@Book{kleinberg-tardos,
  author = {Jon Kleinberg and {\'E}va Tardos},
  title = {Algorithm Design},
  address = {Boston, MA},
  publisher = {Addison-Wesley},
  year = {2006}
}

@inproceedings{Carlini-etal:2019,
  title = {The secret sharer: {E}valuating and testing unintended memorization in neural networks},
  author = {Carlini, Nicholas and Liu, Chang and Erlingsson, {\'U}lfar and Kos, Jernej and Song, Dawn},
  booktitle = {28th {USENIX} {S}ecurity {S}ymposium},
  pages = {267--284},
  editor = {Nadia Heninger and Patrick Traynor},
  year = {2019}
}

@article{Stalnaker:2002,
  title = {Common ground},
  author = {Stalnaker, Robert},
  journal = {Linguistics and Philosophy},
  volume = {25},
  number = {5/6},
  pages = {701--721},
  year = {2002},
  doi = {10.1023/a:1020867916902}
}