% Bibliography database (UTF-8). One entry per block, one field per line.
% Citation keys are left exactly as they are spelled, including irregular ones,
% because documents cite them verbatim.

@inbook{Butterworth:83,
  author = {Brian Butterworth},
  booktitle = {Language production},
  volume = {2: {Development}, writing and other language processes},
  title = {Lexical representation},
  pages = {257--294},
  year = {1983},
  publisher = {Academic Press},
  location = {London},
}

% NOTE(review): the crossref target is not defined in this part of the file;
% presumably it lives elsewhere in the database -- confirm.
@incollection{Moon:2007,
  author = {Moon, Rosamund},
  booktitle = {{Phraseology: An international handbook of contemporary research}},
  title = {{Corpus linguistic approaches with English corpora}},
  pages = {1045--1059},
  crossref = {Burger:Dobrovolskij:eds:2007},
}

@phdthesis{forsberg2006langage,
  author = {Forsberg, Fanny},
  title = {{Le langage préfabriqué en français parlé L2: Étude acquisitionnelle et comparative}},
  school = {Stockholm University},
  location = {Stockholm},
  year = {2006},
}

@incollection{suribats_2009,
  author = {Subirats, Carlos},
  booktitle = {Multilingual {FrameNets} in {Computational} {Lexicography}},
  title = {Spanish {FrameNet}: {A} frame-semantic analysis of the {Spanish} lexicon},
  editor = {Boas, Hans C.},
  pages = {135--162},
  publisher = {Mouton de Gruyter},
  address = {Berlin/New York},
  year = {2009},
}

% The journal's name is "Computer Speech and Language" (no leading "Journal of").
@article{GirjuEtAl:05,
  author = {Roxana Girju and Dan Moldovan and Marta Tatu and Daniel Antohe},
  title = {On the semantics of noun compounds},
  number = {4},
  pages = {479--496},
  volume = {19},
  journal = {Computer Speech and Language},
  year = {2005},
}

@incollection{gala2013towards,
  author = {Gala, Núria and François, Thomas and Fairon, Cédrick},
  booktitle = {Electronic lexicography in the 21st century: {Thinking} outside the paper. Proceedings of the e{L}ex 2013 conference},
  title = {{Towards a French lexicon with difficulty measures: NLP helping to bridge the gap between traditional dictionaries and specialized lexicons}},
  editor = {Kosem, Iztok and Kallas, Jelena and Gantar, Polona and Krek, Simon and Langemets, Margit and Tuulik, Maria},
  pages = {132--151},
  url = {http://eki.ee/elex2013/proceedings/eLex2013-proceedings.pdf},
  year = {2013},
}

@book{Aijmer:1996,
  author = {Aijmer, Karin},
  title = {Conversational Routines in {English}: {Convention} and Creativity},
  publisher = {Routledge},
  address = {London},
  year = {1996},
}

@incollection{hayoun_elhadad_2016,
  author = {Hayoun, Avi and Elhadad, Michael},
  booktitle = {Proceedings of the Tenth International Conference on {Language} {Resources} and {Evaluation} ({LREC}'16)},
  title = {The {Hebrew} {FrameNet} Project},
  pages = {4341--4347},
  publisher = {European Language Resources Association (ELRA)},
  address = {Portorož, Slovenia},
  year = {2016},
}

@mastersthesis{sandry,
  author = {Sandry, Susan},
  school = {University College London, School of Slavonic and East European Studies},
  title = {{Phonology and morphology of Paševik Pomak with notes on the verb and fundamentals of syntax}},
  year = {2013},
}

% The city is kept in `address` (a field styles actually read) rather than being
% fused into `publisher`; the printed "city: publisher" string is unchanged.
@book{kokkas,
  author = {Kokkas, Nikolaos},
  title = {Uchem so {P}omátsko: {Μ}αθήματα πομακικής γλώσσας},
  volume = {A},
  publisher = {Πολιτιστικό Αναπτυξιακό Κέντρο Θράκης},
  address = {Ξάνθη},
  year = {2004},
}

@book{Schluecker2019CLU,
  title = {Complex Lexical Units: {Compounds} and Multi-Word Expressions},
  doi = {10.1515/9783110632446},
  editor = {Barbara Schlücker},
  publisher = {De Gruyter},
  address = {Berlin, Boston},
  year = {2019},
}

@incollection{Heide/Borgwaldt:09,
  author = {Claudia {von der Heide} and Susanne Borgwaldt},
  booktitle = {Proceedings of the 9th {N}orddeutsches {L}inguistisches {K}olloquium},
  title = {Assoziationen zu Unter-, Basis- und Oberbegriffen: Eine explorative Studie},
  pages = {51--74},
  langid = {german},
  year = {2009},
}
% Bibliography entries (UTF-8), one field per line. Citation keys are kept verbatim.

@misc{Hajic:etal:2018,
  author = {Hajič, Jan and Bejček, Eduard and Bémová, Alevtina and Buráňová, Eva and Hajičová, Eva and Havelka, Jiří and Homola, Petr and Kárník, Jiří and Kettnerová, Václava and Klyueva, Natalia and Kolářová, Veronika and Kučová, Lucie and Lopatková, Markéta and Mikulová, Marie and Mírovský, Jiří and Nedoluzhko, Anna and Pajas, Petr and Panevová, Jarmila and Poláková, Lucie and Rysová, Magdaléna and Sgall, Petr and Spoustová, Johanka and Straňák, Pavel and Synková, Pavlína and Ševčíková, Magda and Štěpánek, Jan and Urešová, Zdeňka and Vidová Hladká, Barbora and Zeman, Daniel and Zikánová, Šárka and Žabokrtský, Zdeněk},
  title = {{Prague Dependency Treebank 3.5}},
  note = {{LINDAT}/{CLARIAH}-{CZ} digital library at the Institute of Formal and Applied Linguistics ({ÚFAL}), Faculty of Mathematics and Physics, Charles University},
  url = {http://hdl.handle.net/11234/1-2621},
  year = {2018},
}

@techreport{VanEynde:DCOITagSet:2005,
  author = {Frank {Van Eynde}},
  institution = {Centrum voor Computerlinguïstiek, KU Leuven},
  title = {Part Of Speech Tagging En Lemmatisering van het {D-COI} Corpus},
  langid = {dutch},
  type = {{LASSY} Report},
  url = {http://www.let.rug.nl/vannoord/Lassy/POS_manual.pdf},
  address = {Leuven, Belgium},
  year = {2005},
}

% "TEI Lex-0" ends in the digit zero; the journal name carries a hacek.
@article{tasovac2020encoding,
  author = {Tasovac, Toma and Salgado, Ana and Costa, Rute},
  title = {{Encoding polylexical units with TEI Lex-0}},
  number = {2},
  pages = {28--57},
  volume = {8},
  journal = {Slovenščina 2.0},
  year = {2020},
}

@incollection{schneider-etal-2014-comprehensive,
  author = {Schneider, Nathan and Onuffer, Spencer and Kazour, Nora and Danchik, Emily and Mordowanec, Michael T. and Conrad, Henrietta and Smith, Noah A.},
  booktitle = {Proceedings of the ninth international conference on {Language Resources and Evaluation} ({LREC}'14)},
  title = {Comprehensive annotation of multiword expressions in a social web corpus},
  editor = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Loftsson, Hrafn and Maegaard, Bente and Mariani, Joseph and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios},
  pages = {455--461},
  publisher = {European Language Resources Association (ELRA)},
  url = {https://aclanthology.org/L14-1433/},
  address = {Reykjavik, Iceland},
  year = {2014},
}

@incollection{zaninello_nissim_2010,
  author = {Zaninello, Andrea and Nissim, Malvina},
  booktitle = {Proceedings of the seventh international conference on {Language} {Resources} and {Evaluation} ({LREC}'10)},
  title = {Creation of lexical resources for a characterisation of multiword expressions in {Italian}},
  pages = {654--661},
  publisher = {European Language Resources Association (ELRA)},
  address = {Valletta, Malta},
  year = {2010},
}

@article{Benczes:14,
  author = {Réka Benczes},
  title = {What can we learn about the mental lexicon from non-prototypical cases of compounding?},
  pages = {205--220},
  volume = {10},
  journal = {Argumentum},
  year = {2014},
}

@article{wray2000functions,
  author = {Wray, Alison and Perkins, Michael R.},
  title = {The functions of formulaic language: {An} integrated model},
  number = {1},
  pages = {1--28},
  volume = {20},
  journal = {Language \& Communication},
  year = {2000},
}

% The entry path of this URL contains spaces; they are percent-encoded (%20)
% because raw spaces inside a URL are dropped or break the link when typeset.
@incollection{Cermak:2016a,
  author = {Čermák, František},
  booktitle = {Nový encyklopedický slovník češtiny},
  langid = {czech},
  title = {Frazeologie a idiomatika},
  edition = {1},
  editor = {Karlík, Petr and Nekula, Marek and Pleskalová, Jana},
  pages = {530--532},
  publisher = {Nakladatelství Lidové noviny},
  url = {https://www.czechency.org/slovnik/FRAZEOLOGIE%20A%20IDIOMATIKA},
  address = {Praha},
  year = {2016},
}

% Two editors have two-word surnames (Parra Escartín, Barbu Mititelu); the comma
% form keeps both words in the family-name part.
@incollection{zampieri-etal-2019-impact,
  author = {Zampieri, Nicolas and Ramisch, Carlos and Damnati, Geraldine},
  booktitle = {Proceedings of the joint workshop on multiword expressions and {WordNet} ({MWE-WN} 2019)},
  title = {The impact of word representations on sequential neural {MWE} identification},
  editor = {Savary, Agata and Parra Escartín, Carla and Bond, Francis and Mitrović, Jelena and Barbu Mititelu, Verginica},
  pages = {169--175},
  publisher = {Association for Computational Linguistics},
  url = {https://aclanthology.org/W19-5121},
  address = {Florence, Italy},
  year = {2019},
}

% "Rychlý" takes an acute accent (U+00FD).
@article{kilgarriff2014sketch,
  author = {Kilgarriff, Adam and Baisa, Vít and Bušta, Jan and Jakubíček, Miloš and Kovář, Vojtěch and Michelfeit, Jan and Rychlý, Pavel and Suchomel, Vít},
  title = {The Sketch Engine: {Ten} years on},
  number = {1},
  pages = {7--36},
  volume = {1},
  journal = {Lexicography},
  publisher = {Springer},
  year = {2014},
}

@incollection{Bozdechova:2007,
  author = {Bozděchová, Ivana},
  booktitle = {Sborník příspěvků věnovaných profesorce {PhDr.} {Marii} {Čechové}, {DrSc.}},
  title = {Teorie terminologie v historických a obsahových proměnách},
  pages = {65--74},
  publisher = {Univerzita J. E. Purkyně, Ústí nad Labem},
  year = {2007},
}

@incollection{Koeper/SchulteImWalde:17b,
  author = {Köper, Maximilian and {Schulte im Walde}, Sabine},
  booktitle = {Proceedings of the 13th Workshop on Multiword Expressions},
  title = {Complex verbs are different: {E}xploring the visual modality in multi-modal models to predict compositionality},
  pages = {200--206},
  address = {Valencia, Spain},
  year = {2017},
}

@incollection{baldwin2010multiword,
  author = {Baldwin, Timothy and Kim, Su Nam},
  booktitle = {Handbook of natural language processing},
  title = {Multiword expressions},
  edition = {2},
  editor = {Damerau, Fred J. and Indurkhya, Nitin},
  pages = {267--292},
  publisher = {CRC Press, Taylor and Francis Group},
  address = {Boca Raton, FL},
  year = {2010},
}

@incollection{ekberg2013grammatik,
  author = {Ekberg, Lena},
  booktitle = {Svenska som andraspråk},
  title = {Grammatik och lexikon hos svenska i andraspråk på nästan infödd nivå},
  langid = {swedish},
  editor = {Hyltenstam, Kenneth and Lindberg, Inger},
  pages = {259--279},
  publisher = {Studentlitteratur},
  address = {Lund},
  year = {2013},
}

@incollection{karahoga-morphologically,
  author = {Karahóǧa, Ritván and Krimpas, Panagiotis G. and Stamou, Vivian and Arampatzakis, Vasileios and Karamatskos, Dimitrios and Sevetlidis, Vasileios and Constantinides, Nikolaos and Kokkas, Nikolaos and Pavlidis, George and Markantonatou, Stella},
  booktitle = {Proceedings of the Fifth Workshop on the Use of Computational Methods in the Study of Endangered Languages},
  title = {Morphologically annotated corpora of {Pomak}},
  doi = {10.18653/v1/2022.computel-1.22},
  pages = {179--186},
  url = {https://aclanthology.org/2022.computel-1.22},
  address = {Dublin},
  year = {2022},
}

@incollection{saito_etal_2008,
  author = {Saito, Hiroaki and Kuboya, Shunta and Sone, Takaaki and Tagami, Hayato and Ohara, Kyoko},
  booktitle = {Proceedings of the Sixth International Conference on {Language} {Resources} and {Evaluation} ({LREC}'08)},
  title = {The {Japanese} {FrameNet} Software Tools},
  publisher = {European Language Resources Association (ELRA)},
  address = {Marrakech, Morocco},
  year = {2008},
}

@incollection{odijk_2013,
  author = {Odijk, Jan},
  booktitle = {Essential Speech and Language Technology for {Dutch}: {Results} by the {STEVIN} programme},
  title = {Identification and Lexical Representation of Multiword Expressions},
  doi = {10.1007/978-3-642-30910-6_12},
  editor = {Spyns, Peter and Odijk, Jan},
  pages = {201--217},
  publisher = {Springer},
  series = {Theory and Applications of {Natural} {Language} {Processing}},
  address = {Berlin, Heidelberg},
  year = {2013},
}
% Bibliography entries (UTF-8), one field per line. Citation keys are kept verbatim.

@incollection{chiarcos2022modellingGlobalex,
  author = {Chiarcos, Christian and Gkirtzou, Katerina and Ionov, Maxim and Kabashi, Besim and Khan, Fahad and Truică, Ciprian-Octavian},
  booktitle = {Proceedings of the {Globalex} Workshop on Linked Lexicography within the 13th {Language Resources and Evaluation} Conference},
  title = {Modelling Collocations in {OntoLex-FrAC}},
  editor = {Ilan Kernerman and Simon Krek},
  location = {Paris},
  publisher = {European Language Resources Association (ELRA)},
  pages = {10--18},
  year = {2022},
}

@inbook{durrant2018formulaic,
  author = {Durrant, Phil},
  booktitle = {Understanding formulaic language: {A} second language acquisition perspective},
  title = {Formulaic language in {English} for academic purposes},
  editor = {Siyanova-Chanturia, Anna and Pellicer-Sánchez, Ana},
  pages = {211--227},
  publisher = {Routledge},
  year = {2018},
}

@article{gavriilidou_nn_2013,
  author = {Gavriilidou, Zoe},
  title = {{NN} Combinations in {Greek}},
  number = {1},
  pages = {5--29},
  volume = {13},
  journal = {Journal of Greek Linguistics},
  year = {2013},
}

@article{Piirainen_2005,
  author = {Piirainen, Elisabeth},
  title = {Europeanism, internationalism or something else? {P}roposal for a cross-linguistic and cross-cultural research project on widespread idioms in {Europe} and beyond},
  doi = {10.7146/hjlcb.v18i35.25816},
  number = {35},
  pages = {45--75},
  url = {https://tidsskrift.dk/her/article/view/25816},
  volume = {18},
  journal = {HERMES: Journal of Language and Communication in Business},
  year = {2005},
}

@article{babelnet2012,
  author = {Navigli, Roberto and Ponzetto, Simone Paolo},
  title = {{BabelNet}: {The} automatic construction, evaluation and application of a wide-coverage multilingual semantic network},
  pages = {217--250},
  volume = {193},
  journal = {Artificial Intelligence},
  year = {2012},
  doi = {10.1016/j.artint.2012.07.001},
}

@incollection{petruck_1997,
  author = {Petruck, Miriam R. L.},
  booktitle = {Handbook of Pragmatics},
  title = {Frame semantics},
  editor = {Verschueren, Jef and Östman, Jan-Ola and Blommaert, Jan and Bulcaen, Chris},
  pages = {1--13},
  publisher = {John Benjamins},
  address = {Amsterdam},
  year = {1997},
}

@incollection{goldhahn2012building,
  author = {Goldhahn, Dirk and Eckart, Thomas and Quasthoff, Uwe},
  booktitle = {Proceedings of the Eighth International Conference on {Language Resources and Evaluation} ({LREC}'12)},
  title = {Building large monolingual dictionaries at the {Leipzig Corpora Collection}: {From} 100 to 200 languages},
  pages = {759--765},
  year = {2012},
  editor = {Nicoletta Calzolari and Khalid Choukri and Thierry Declerck and Mehmet Uğur Doğan and Bente Maegaard and Joseph Mariani and Asuncion Moreno and Jan Odijk and Stelios Piperidis},
  location = {Istanbul},
  publisher = {European Language Resources Association (ELRA)},
}

@article{CordeiroEtAl:19,
  author = {Silvio Cordeiro and Aline Villavicencio and Marco Idiart and Carlos Ramisch},
  title = {Unsupervised compositionality prediction of nominal compounds},
  number = {1},
  pages = {1--57},
  volume = {45},
  journal = {Computational Linguistics},
  year = {2019},
}

@incollection{kim_etal_2016,
  author = {Kim, Jeong-uk and Hahm, Younggyun and Choi, Key-Sun},
  booktitle = {Proceedings of {COLING} 2016, the 26th {International} {Conference} on {Computational} {Linguistics}: {System} Demonstrations},
  title = {Korean {FrameNet} Expansion Based on Projection of {Japanese} {FrameNet}},
  pages = {175--179},
  publisher = {The COLING 2016 Organizing Committee},
  address = {Osaka, Japan},
  year = {2016},
}

@incollection{skoldberg2013between,
  author = {Sköldberg, Emma and Bäckström, Linnéa and Borin, Lars and Forsberg, Markus and Lyngfelt, Benjamin and Olsson, Leif-Jöran and Prentice, Julia and Rydstedt, Rudolf and Tingsell, Sofia and Uppström, Jonatan},
  booktitle = {{Electronic lexicography in the 21st century: Thinking outside the paper. Proceedings of the e{L}ex 2013 conference}},
  title = {Between grammars and dictionaries: {A} {Swedish} Constructicon},
  editor = {Kosem, Iztok and Kallas, Jelena and Gantar, Polona and Krek, Simon and Langemets, Margit and Tuulik, Maria},
  pages = {310--327},
  url = {http://eki.ee/elex2013/proceedings/eLex2013_21_Skoldberg+etal.pdf},
  year = {2013},
}

@incollection{baldwin2002multiword,
  author = {Baldwin, Timothy and Bond, Francis},
  booktitle = {Proceedings of the 8th Annual Meeting of the {Association for Natural Language Processing}},
  title = {Multiword expressions: {Some} problems for {Japanese} {NLP}},
  pages = {379--382},
  address = {Keihanna, Japan},
  year = {2002},
}

@incollection{Brin97,
  author = {Sergey Brin and Rajeev Motwani and Jeffrey D. Ullman and Shalom Tsur},
  booktitle = {{ACM SIGMOD} International Conference on Management of Data, {May 13–15, 1997, Tucson, Arizona, USA}},
  title = {Dynamic itemset counting and implication rules for market basket data},
  doi = {10.1145/253260.253325},
  editor = {Joan Peckham},
  pages = {255--264},
  publisher = {ACM Press},
  year = {1997},
}

@incollection{bonial_etal_2014,
  author = {Bonial, Claire and Green, Meredith and Preciado, Jenette and Palmer, Martha},
  booktitle = {Proceedings of the 10th Workshop on Multiword Expressions ({MWE}2014)},
  title = {An approach to \emph{take} multi-word expressions},
  pages = {94--98},
  publisher = {Association for Computational Linguistics},
  address = {Gothenburg, Sweden},
  year = {2014},
}

@incollection{HueningSchluecker2015MWE,
  author = {Matthias Hüning and Barbara Schlücker},
  booktitle = {Word-formation: {An} International Handbook of the Languages of {Europe}},
  volume = {1},
  title = {Multi-word expressions},
  doi = {10.1515/9783110246254-026},
  editor = {Peter O. Müller and Ingeborg Ohnheiser and Susan Olsen and Franz Rainer},
  pages = {450--467},
  publisher = {De Gruyter Mouton},
  address = {Berlin},
  year = {2015},
}

@incollection{Odijk:LiberAmicorum:2022,
  author = {Jan Odijk},
  booktitle = {Liber amicorum {Francisci Affinii} alias {Frank Van Eynde}},
  title = {Eenwoordsconstituenten in {GrETEL}},
  pages = {143--150},
  publisher = {KU Leuven},
  address = {Leuven, Belgium},
  year = {2022},
}

@incollection{Machalek:2020,
  author = {Machálek, Tomáš},
  booktitle = {Proceedings of the Twelfth {Language Resources and Evaluation} Conference},
  title = {{K}on{T}ext: {Advanced} and flexible corpus query interface},
  pages = {7003--7008},
  publisher = {European Language Resources Association (ELRA)},
  url = {https://aclanthology.org/2020.lrec-1.865},
  address = {Marseille},
  year = {2020},
}

@book{Levi:78,
  author = {Judith N. Levi},
  title = {The syntax and semantics of complex nominals},
  publisher = {Academic Press},
  address = {London},
  year = {1978},
}

@article{chechdatabase,
  author = {Vondřička, Pavel},
  title = {Design of a Multiword Expressions Database},
  pages = {83--101},
  volume = {112},
  journal = {The Prague Bulletin of Mathematical Linguistics},
  year = {2019},
}

% The English gloss of the title is wrapped in (` ... '), as in the Ralli2007 entry.
@phdthesis{giouli_2020,
  author = {Giouli, Voula},
  title = {Το σημασιολογικό πεδίο των συναισθημάτων: {Ταξινόμηση} των ρημάτων της Νέας Ελληνικής που δηλώνουν συναίσθημα. (`{The} semantic field of {emotions}: {A} Lexicon-Grammar account of {Greek} verbs denoting {emotion}')},
  language = {Greek},
  address = {Athens, Greece},
  school = {National and Kapodistrian University of Athens},
  year = {2020},
}

@book{Ralli2007,
  author = {Ralli, Angela},
  title = {Η {Σύνθεση} των {Λέξεων}: {Διαγλωσσική}, {Μορφολογική} {Προσέγγιση} (`{Compounding}: {A} Cross-lingual, Morphological Approach')},
  publisher = {Patakis},
  address = {Athens},
  year = {2007},
}

@incollection{WellerEtAl:14b,
  author = {Marion Weller and Fabienne Cap and Stefan Müller and Sabine {Schulte im Walde} and Alexander Fraser},
  booktitle = {Proceedings of the 1st Workshop on Computational Approaches to Compound Analysis},
  title = {Distinguishing degrees of compositionality in compound splitting for statistical machine translation},
  pages = {81--90},
  address = {Dublin, Ireland},
  year = {2014},
}

@incollection{villavicencio-etal-2004-multilingual,
  author = {Villavicencio, Aline and Baldwin, Timothy and Waldron, Benjamin},
  booktitle = {Proceedings of the Fourth International Conference on {Language Resources and Evaluation} ({LREC}{'}04)},
  title = {A multilingual database of idioms},
  pages = {1127--1130},
  url = {http://www.lrec-conf.org/proceedings/lrec2004/pdf/760.pdf},
  address = {Lisbon},
  year = {2004},
}

@incollection{ReddyEtAl:11b,
  author = {Siva Reddy and Ioannis P. Klapaftis and Diana McCarthy and Suresh Manandhar},
  booktitle = {Proceedings of the 5th International Joint Conference on {Natural Language Processing}},
  title = {Dynamic and Static Prototype Vectors for Semantic Composition},
  pages = {705--713},
  address = {Chiang Mai, Thailand},
  year = {2011},
}

@incollection{de2014automated,
  author = {De Cock, Sylvie and Granger, Sylviane and Leech, Geoffrey and McEnery, Tony},
  booktitle = {Learner {E}nglish on computer},
  title = {An automated approach to the phrasicon of {EFL} learners},
  editor = {Granger, Sylviane},
  pages = {67--79},
  publisher = {Routledge},
  year = {2014},
}

@book{vallex:2014,
  author = {Lopatková, Markéta and Kettnerová, Václava and Bejček, Eduard and Skwarska, Karolína and Žabokrtský, Zdeněk},
  title = {{VALLEX} 2.6.3: {Valency} lexicon of {Czech} verbs},
  publisher = {Karolinum Press},
  address = {Prague},
  year = {2014},
}

@incollection{Miletic/SchulteImWalde:23,
  author = {Miletic, Filip and {Schulte im Walde}, Sabine},
  booktitle = {Proceedings of the 17th Conference of the {European} Chapter of the {Association for Computational Linguistics}},
  title = {A systematic search for compound semantics in pretrained {BERT} architectures},
  pages = {1499--1512},
  address = {Dubrovnik, Croatia},
  year = {2023},
}

@article{Przepiorkowski:etal:2016,
  author = {Przepiórkowski, Adam and Hajič, Jan and Hajnicz, Elżbieta and Urešová, Zdeňka},
  title = {{Phraseology in two {S}lavic valency dictionaries: Limitations and perspectives}},
  doi = {10.1093/ijl/ecv048},
  number = {1},
  pages = {1--38},
  volume = {30},
  journal = {International Journal of Lexicography},
  year = {2017},
}

@article{Koeva2021,
  author = {Koeva, Svetla},
  title = {{The Bulgarian WordNet: Structure and specific features}},
  number = {1},
  pages = {47--70},
  volume = {8},
  journal = {Papers of the Bulgarian Academy of Sciences},
  year = {2021},
}

@article{palmer_etal_2005,
  author = {Palmer, Martha and Gildea, Daniel and Kingsbury, Paul},
  title = {The {Proposition Bank}: {An} annotated corpus of semantic roles},
  number = {1},
  pages = {71--106},
  volume = {31},
  journal = {Computational Linguistics},
  year = {2005},
}

@incollection{bhalla2019evaluation,
  author = {Bhalla, Vishal and Klimcikova, Klara},
  booktitle = {Proceedings of the 14th Workshop on Innovative Use of {NLP} for Building Educational Applications},
  title = {Evaluation of automatic collocation extraction methods for language learning},
  editor = {Yannakoudakis, Helen and Kochmar, Ekaterina and Leacock, Claudia and Madnani, Nitin and Pilán, Ildikó and Zesch, Torsten},
  pages = {264--274},
  publisher = {Association for Computational Linguistics},
  year = {2019},
}

@book{hawkins2012criterial,
  author = {Hawkins, John A. and Filipović, Luna},
  title = {{Criterial features in L2 English: Specifying the reference levels of the Common European Framework}},
  publisher = {Cambridge University Press},
  volume = {1},
  year = {2012},
}

@incollection{ReddyEtAl:11a,
  author = {Siva Reddy and Diana McCarthy and Suresh Manandhar},
  booktitle = {Proceedings of the 5th International Joint Conference on {Natural Language Processing}},
  title = {An Empirical Study on Compositionality in Compound Nouns},
  pages = {210--218},
  address = {Chiang Mai, Thailand},
  year = {2011},
}

@incollection{ohara_etal_2003,
  author = {Ohara, Kyoko and Fujii, S. and Saito, Hiroaki and Ishizaki, S. and Ohori, T. and Suzuki, Ryoko},
  booktitle = {Proceedings of {Pacific} {Association} for {Computational} {Linguistics} ({PACLING’03})},
  title = {The {Japanese} {FrameNet} Project: {A} Preliminary Report},
  pages = {249--254},
  publisher = {Pacific {Association} for {Computational} {Linguistics}},
  address = {Halifax, Canada},
  year = {2003},
}

@incollection{agatamultiflex,
  author = {Savary, Agata},
  booktitle = {Implementation and Application of Automata},
  title = {Multiflex: {A} multilingual finite-state tool for multi-word units},
  doi = {10.1007/978-3-642-02979-0_27},
  editor = {Maneth, Sebastian},
  pages = {237--240},
  publisher = {Springer},
  address = {Berlin, Heidelberg},
  year = {2009},
}

@incollection{giouli_etal_2020,
  author = {Giouli, Voula and Pilitsidou, Vera and Christopoulos, Hephaestion},
  booktitle = {Proceedings of the {International} {FrameNet} {Workshop} 2020: {Towards} a Global, Multilingual {FrameNet}},
  title = {Greek within the {Global} {FrameNet} {Initiative}: {Challenges} and Conclusions so far},
  pages = {48--55},
  publisher = {European Language Resources Association (ELRA)},
  address = {Marseille, France},
  year = {2020},
}

@incollection{przepiorkowski-etal-2014,
  author = {Przepiórkowski, Adam and Hajnicz, Elżbieta and Patejuk, Agnieszka and Woliński, Marcin},
  booktitle = {Proceedings of Workshop on Lexical and Grammatical Resources for Language Processing},
  title = {Extended phraseological information in a valence dictionary for {NLP} applications},
  doi = {10.3115/v1/W14-5811},
  pages = {83--91},
  publisher = {Association for Computational Linguistics and Dublin City University},
  address = {Dublin, Ireland},
  year = {2014},
}

@incollection{villavicencio_etal_2004,
  author = {Villavicencio, Aline and Copestake, Ann and Waldron, Benjamin and Lambeau, Fabre},
  booktitle = {Proceedings of the {Workshop} on {Multiword} {Expressions}: {Integrating} Processing},
  title = {Lexical Encoding of {MWEs}},
  pages = {80--87},
  publisher = {Association for Computational Linguistics},
  address = {Barcelona, Spain},
  year = {2004},
}

% NOTE(review): the key says 1925 while `date` says 1923 -- confirm which year
% the cited fourth edition should carry.
@book{stoett1925nederlandsche,
  author = {Stoett, Frederik August},
  date = {1923},
  title = {Nederlandsche spreekwoorden, spreekwijzen, uitdrukkingen en gezegden},
  edition = {4},
  publisher = {W.J.\ Thieme \& Cie},
  url = {https://www.dbnl.org/tekst/stoe002nede01_01/},
  address = {Zutphen},
}

@incollection{caines2017effect,
  author = {Caines, Andrew and Buttery, Paula},
  booktitle = {Learner corpus research: {New} perspectives and applications},
  title = {The effect of task and topic on opportunity of use in learner corpora},
  editor = {Brezina, Vaclav and Flowerdew, Lynne},
  pages = {5--27},
  publisher = {Bloomsbury Academic},
  address = {London},
  year = {2017},
}

@article{ellis2012formulaic,
  author = {Ellis, Nick C.},
  title = {Formulaic language and second language acquisition: {Zipf} and the phrasal teddy bear},
  pages = {17--44},
  volume = {32},
  journal = {Annual Review of Applied Linguistics},
  publisher = {Cambridge University Press},
  year = {2012},
}

@incollection{Lichte:2019,
  author = {Lichte, Timm and Petitjean, Simon and Savary, Agata and Waszczuk, Jakub},
  booktitle = {Representation and parsing of multiword expressions: {Current} trends},
  title = {Lexical encoding formats for multi-word expressions: {T}he challenge of ``irregular'' regularities},
  doi = {10.5281/zenodo.2579033},
  editor = {Parmentier, Yannick and Waszczuk, Jakub},
  pages = {1--33},
  publisher = {Language Science Press},
  address = {Berlin},
  ids = {lichteagata,lichte-etal},
  year = {2019},
}

@incollection{hartmann_etal_2012,
  author = {Hartmann, Silvana and Szarvas, György and Gurevych, Iryna},
  booktitle = {Semi-Automatic Ontology Development: {Processes} and Resources},
  title = {Mining multiword terms from {Wikipedia}},
  editor = {Pazienza, Maria Teresa and Stellato, Armando},
  pages = {226--258},
  publisher = {IGI Global},
  year = {2012},
}

@book{SchulteImWalde/Smolka:20,
  title = {The Role of Constituents in Multi-Word Expressions: {A}n Interdisciplinary, Cross-Lingual Perspective},
  doi = {10.5281/zenodo.3598577},
  editor = {Sabine {Schulte im Walde} and Eva Smolka},
  number = {4},
  publisher = {Language Science Press},
  series = {Phraseology and Multiword Expressions},
  address = {Berlin},
  year = {2020},
}

@book{Popovicova:2020,
  author = {Popovičová, Snežana},
  title = {{Česká a srbská frazeologie: Na cestě ke dvojjazyčnému frazeologickému slovníku}},
  publisher = {Karolinum},
  langid = {czech},
  address = {Praha},
  year = {2020},
}

@incollection{Evert2009,
  author = {Stefan Evert},
  booktitle = {Corpus {Linguistics}: {An} international handbook},
  volume = {2},
  title = {Corpora and collocations},
  doi = {10.1515/9783110213881.2.1212},
  editor = {Anke Lüdeling and Merja Kytö},
  pages = {1212--1248},
  publisher = {De Gruyter Mouton},
  address = {Berlin},
  year = {2009},
}

@incollection{ostroski2022,
  author = {Ostroški Anić, Ana and Brač, Ivana},
  booktitle = {Dictionaries and Society: {Proceedings} of the {XX} {EURALEX} International Congress},
  title = {Airframe: {Mapping} the Field of Aviation Through Semantic Frames},
  editor = {Klosa-Kückelhaus, Annette and Engelberg, Stefan and Möhrs, Christine and Storjohann, Petra},
  pages = {334--345},
  publisher = {IDS-Verlag},
  address = {Mannheim},
  year = {2022},
}

@book{akademien2015svenska,
  author = {{Svenska Akademien}},
  title = {{Svenska Akademiens ordlista}},
  edition = {14},
  publisher = {Svenska Akademien and Norstedts ordbok},
  url = {https://www.svenskaakademien.se/svenska-spraket/svenska-akademiens-ordlista-saol},
  year = {2015},
}

@book{hullen,
  author = {Hüllen, Werner},
  title = {A history of {Roget's “Thesaurus”}},
  publisher = {Oxford University Press},
  location = {New York},
  year = {2004},
}

% Main title and subtitle are separated by a colon.
@phdthesis{Evert2005,
  author = {Stefan Evert},
  title = {The statistics of word cooccurrences: {Word} pairs and collocations},
  address = {Stuttgart},
  school = {{Institut für maschinelle Sprachverarbeitung, Universität Stuttgart}},
  year = {2005},
}

@incollection{durlich2018efllex,
  author = {Dürlich, Luise and François, Thomas},
  booktitle = {Proceedings of the Eleventh International Conference on {Language Resources and Evaluation} ({LREC})},
  title = {{EFLLex: A graded lexical resource for learners of English as a foreign language}},
  editor = {Calzolari, Nicoletta and Choukri, Khalid and Cieri, Christopher and Declerck, Thierry and Goggi, Sara and Hasida, Koiti and Isahara, Hitoshi and Maegaard, Bente and Mariani, Joseph and Mazo, Hélène and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios and Tokunaga, Takenobu},
  publisher = {European Language Resources Association (ELRA)},
  url = {https://aclanthology.org/L18-1140},
  year = {2018},
}

@inbook{constrgr,
  author = {Fried, Mirjam and Östman, Jan-Ola},
  booktitle = {{Construction Grammar} in a cross-language perspective},
  title = {{Construction Grammar}: {A} thumbnail sketch},
  editor = {Fried, Mirjam and Östman, Jan-Ola},
  pages = {11--86},
  publisher = {John Benjamins},
  address = {Amsterdam},
  year = {2004},
}

@incollection{SalehiEtAl:15,
  author = {Bahar Salehi and Paul Cook and Timothy Baldwin},
  booktitle = {Proceedings of the Conference of the {North American} Chapter of the {Association for Computational Linguistics}/Human Language Technologies},
  title = {A word embedding approach to predicting the compositionality of multiword expressions},
  pages = {977--983},
  address = {Denver, Colorado, USA},
  year = {2015},
}

@incollection{SalehiEtAl:14,
  author = {Bahar Salehi and Paul Cook and Timothy Baldwin},
  booktitle = {Proceedings of the Conference on Empirical Methods in {Natural Language Processing}},
  title = {Detecting non-compositional {MWE} components using {Wiktionary}},
  pages = {1792--1797},
  address = {Doha, Qatar},
  year = {2014},
}

@article{Gagne:02,
  author = {Christina L. Gagné},
  title = {Lexical and relational influences on the processing of novel compounds},
  pages = {723--735},
  volume = {81},
  journal = {Brain and Language},
  year = {2002},
}

@incollection{chiarcos2020modelling,
  author = {Chiarcos, Christian and Ionov, Maxim and de Does, Jesse and Depuydt, Katrien and Khan, Fahad and Stolk, Sander and Declerck, Thierry and McCrae, John Philip},
  booktitle = {{Proceedings of the 2020 {Globalex} workshop on linked lexicography}},
  title = {{Modelling frequency and attestations for Ontolex-Lemon}},
  pages = {1--9},
  year = {2020},
}

@article{al-hajetal2013,
  author = {Al-Haj, Hassan and Itai, Alon and Wintner, Shuly},
  title = {Lexical representation of multiword expressions in morphologically-complex languages},
  doi = {10.1093/ijl/ect036},
  pages = {130--170},
  volume = {27},
  ids = {shuly2013},
  journal = {International Journal of Lexicography},
  year = {2013},
}

@incollection{Roller/SchulteImWalde:13,
  author = {Stephen Roller and Sabine {Schulte im Walde}},
  booktitle = {Proceedings of the Conference on Empirical Methods in {Natural Language Processing}},
  title = {A Multimodal {LDA} Model integrating Textual, Cognitive and Visual Modalities},
  pages = {1146--1157},
  address = {Seattle, WA, USA},
  year = {2013},
}

@incollection{Roller/SchulteImWalde:14,
  author = {Stephen Roller and Sabine {Schulte im Walde}},
  booktitle = {Proceedings of the 10th Workshop on Multiword Expressions},
  title = {Feature Norms of {G}erman Noun Compounds},
  pages = {104--108},
  address = {Gothenburg, Sweden},
  year = {2014},
}

@book{Kovarikova:2017,
  author = {Kováříková, Dominika},
  title = {Kvantitativní charakteristiky termínů},
  publisher = {Nakladatelství Lidové noviny -- Český národní korpus},
  address = {Praha},
  year = {2017},
}

@incollection{Evert2011,
  author = {Stefan Evert and Andrew Hardie},
  booktitle = {{Proceedings of the Corpus Linguistics 2011 conference, University of Birmingham, UK}},
  title = {Twenty-first century {Corpus Workbench}: {Updating} a query architecture for the new millennium},
  year = {2011},
}

@article{borin2013saldo,
  author = {Borin, Lars and Forsberg, Markus and Lönngren, Lennart},
  title = {{SALDO: A touch of yin to WordNet’s yang}},
  pages = {1191--1211},
  volume = {47},
  journal = {Language Resources and Evaluation},
  publisher = {Springer},
  year = {2013},
}

@incollection{fotopoulou_etal_2014,
  author = {Fotopoulou, Aggeliki and Markantonatou, Stella and Giouli, Voula},
  booktitle = {Proceedings of the 10th {Workshop} on {Multiword} {Expressions} ({MWE})},
  title = {Encoding {MWEs} in a conceptual lexicon},
  pages = {43--47},
  publisher = {Association for Computational Linguistics},
  address = {Gothenburg, Sweden},
  ids = {Fotopoulou-et-al-2014, Fotopoulou2014},
  year = {2014},
}

@incollection{pilitsidou_giouli_2020,
  author = {Pilitsidou, Vera and Giouli, Voula},
  booktitle = {Lexicography for {Inclusion}: {Proceedings} of the 19th {EURALEX} {International} {Congress}},
  title = {Frame {Semantics} in the Specialized Domain of Finance: {Building} a Termbase to aid Translation},
  editor = {Gavriilidou, Zoe and Mitsiaki, Maria and Fliatouras, Asimakis},
  pages = {263--271},
  publisher = {Democritus University of Thrace},
  volume = {1},
  address = {Alexandroupolis},
  year = {2020},
}

% The city is kept in `address` (a field styles actually read) rather than being
% fused into `publisher`; the printed "city: publisher" string is unchanged.
@book{theocharidisg,
  author = {Theocharides, Petros},
  title = {{Γραμματική της Πομακικής Γλώσσας}},
  publisher = {Egiros},
  address = {Thessaloniki},
  year = {1996},
}

@incollection{LASSY:2013,
  author = {van Noord, Gertjan and Bouma, Gosse and Van Eynde, Frank and de Kok, Daniël and van der Linde, Jelmer and Schuurman, Ineke and Tjong Kim Sang, Erik and Vandeghinste, Vincent},
  booktitle = {Essential Speech and Language Technology for {D}utch},
  title = {Large Scale Syntactic Annotation of Written {D}utch: {Lassy}},
  doi = {10.1007/978-3-642-30910-6_9},
  editor = {Spyns, Peter and Odijk, Jan},
  pages = {147--164},
  publisher = {Springer},
  location = {Berlin},
  series = {Theory and Applications of Natural Language Processing},
  year = {2013},
}
@incollection{Odijk:etal:TLT16,
  author = {Jan Odijk and Martijn van der Klis and Sheean Spoel},
  booktitle = {Proceedings of the 16th International Workshop on {Treebanks and Linguistic Theories} {(TLT16)}},
  title = {Extensions to the {GrETEL} {Treebank Query Application}},
  pages = {46--55},
  url = {http://aclweb.org/anthology/W/W17/W17-7608.pdf},
  address = {Prague},
  year = {2018},
}

@incollection{bonial_propbank_2014,
  author = {Bonial, Claire and Bonn, Julia and Conger, Kathryn and Hwang, Jena D. and Palmer, Martha},
  booktitle = {Proceedings of the Ninth International Conference on {Language} {Resources} and {Evaluation} ({LREC}'14)},
  title = {{PropBank}: {Semantics} of New Predicate Types},
  pages = {3013--3019},
  publisher = {European Language Resources Association (ELRA)},
  address = {Reykjavik, Iceland},
  year = {2014},
}

@article{fillmore_1985,
  author = {Fillmore, Charles J.},
  title = {Frames and the Semantics of Understanding},
  number = {2},
  pages = {222--254},
  volume = {6},
  journal = {Quaderni di semantica},
  year = {1985},
}

@book{prentice2010kappen,
  author = {Prentice, Julia},
  title = {Käppen i hjulen: {Behärskning} av svenska konventionaliserade uttryck bland gymnasieelever med varierande språklig bakgrund},
  langid = {swedish},
  publisher = {University of Gothenburg},
  series = {ROSA 12},
  url = {http://hdl.handle.net/2077/23261},
  year = {2010},
}

@incollection{fillmore_1982,
  author = {Fillmore, Charles J.},
  booktitle = {Linguistics in the Morning Calm: {Selected} {Papers} from {SICOL}-1981},
  title = {Frame {Semantics}},
  pages = {111--137},
  publisher = {Hanshin Publishing Company},
  address = {Seoul, Korea},
  year = {1982},
}

@incollection{BettingerEtAl:20,
  author = {Bettinger, Julia and Hätty, Anna and Dorna, Michael and {Schulte im Walde}, Sabine},
  booktitle = {Proceedings of the 12th {Language Resources and Evaluation Conference} ({LREC'2020})},
  title = {A domain-specific dataset of difficulty ratings for {German} noun compounds in the domains {DIY}, cooking and automotive},
  publisher = {European Language Resources Association (ELRA)},
  pages = {4359--4367},
  address = {Marseille, France},
  year = {2020},
}

@phdthesis{lewis2008idiom,
  author = {Lewis, Margareta},
  title = {{The idiom principle in L2 English: Assessing elusive formulaic sequences as indicators of idiomaticity, fluency, and proficiency}},
  school = {Stockholm University},
  year = {2008},
}

% The publisher's city is stored in the address field, not inside the publisher name.
@book{theocharidisl,
  author = {Theocharides, Petros},
  title = {{Πομακο-Ελληνικό Λεξικό / Πομάχτσκου-Ουρούμτσκου Λεκσικό}},
  publisher = {Egiros},
  address = {Thessaloniki},
  year = {1996},
}

@incollection{markantonatou-etal-2019-idion,
  author = {Markantonatou, Stella and Minos, Panagiotis and Zakis, George and Moutzouri, Vassiliki and Chantou, Maria},
  booktitle = {Proceedings of the joint workshop on multiword expressions and {WordNet} ({MWE-WN} 2019) at {ACL} 2019},
  title = {{IDION}: {A} database for {Modern} {Greek} multiword expressions},
  doi = {10.18653/v1/W19-5115},
  pages = {130--134},
  address = {Florence},
  year = {2019},
}

@incollection{lenci_etal_2010,
  author = {Lenci, Alessandro and Johnson, Martina and Lapesa, Gabriella},
  booktitle = {Proceedings of the Seventh International Conference on {Language} {Resources} and {Evaluation} ({LREC}'10)},
  title = {Building an {Italian} {FrameNet} through semi-automatic corpus analysis},
  pages = {12--19},
  publisher = {European Language Resources Association (ELRA)},
  address = {Valletta, Malta},
  year = {2010},
}

% Reports name their issuing body in the institution field.
@techreport{kuiper_etal_2003,
  author = {Kuiper, Koenraad and McCann, Heather and Quinn, Heidi and Aitchison, Therese and van der Veer, Kees},
  institution = {Linguistic Data Consortium},
  location = {Philadelphia},
  title = {{SAID}},
  doi = {10.35111/MSVM-T728},
  year = {2003},
}

@article{BaroniEtAl:09,
  author = {Marco Baroni and Silvia Bernardini and Adriano Ferraresi and Eros Zanchetta},
  title = {The {WaCky} {Wide} {Web}: {A} collection of very large linguistically processed web-crawled corpora},
  number = {3},
  pages = {209--226},
  volume = {43},
  journal = {Language Resources and Evaluation},
  year = {2009},
}

@incollection{Koeva2010,
  author = {Koeva, Svetla},
  booktitle = {{Bulgarian-American} Dialogues},
  title = {Bulgarian {WordNet}: {Current} state, applications and prospects},
  pages = {120--132},
  publisher = {Prof. M. Drinov Academic Publishing House},
  address = {Sofia},
  year = {2010},
}

@incollection{SpaldingEtAl:10,
  author = {Thomas L. Spalding and Christina L. Gagné and A. C. Mullaly and Hongbo Ji},
  title = {Relation-based interpretation of noun-noun phrases: {A} new theoretical approach},
  series = {Linguistische Berichte Sonderhefte},
  number = {17},
  pages = {283--316},
  editor = {Susan Olsen},
  booktitle = {New Impulses in Word-Formation},
  year = {2010},
}

@article{simov-osenova-2015-catenaKorea,
  author = {Simov, Kiril and Osenova, Petya},
  title = {Modeling lexicon-syntax interaction with catenae},
  number = {3},
  pages = {287--322},
  doi = {10.17791/jcs.2015.16.3.287},
  volume = {16},
  journal = {Journal of Cognitive Science},
  year = {2015},
}

@article{wray2013formulaic,
  author = {Wray, Alison},
  title = {Formulaic language},
  number = {3},
  pages = {316--334},
  volume = {46},
  journal = {Language teaching},
  publisher = {Cambridge University Press},
  year = {2013},
}

% NOTE(review): volume corrected from 64 to 46 (digits were transposed) - confirm against the DOI landing page.
@article{BrysbaertEtAl:14,
  author = {Marc Brysbaert and Amy Beth Warriner and Victor Kuperman},
  title = {Concreteness Ratings for 40 Thousand generally known {English} Word Lemmas},
  doi = {10.3758/s13428-013-0403-5},
  pages = {904--911},
  volume = {46},
  journal = {Behavior Research Methods},
  year = {2014},
}

@article{torrent_etal_2022,
  author = {Timponi Torrent, Tiago and Matos, Ely Edison Da Silva and Belcavello, Frederico and Viridiano, Marcelo and Gamonal, Maucha Andrade and Costa, Alexandre Diniz Da and Marim, Mateus Coutinho},
  title = {Representing Context in {FrameNet}: {A} Multidimensional, Multimodal Approach},
  doi = {10.3389/fpsyg.2022.838441},
  pages = {1--20},
  volume = {13},
  journal = {Frontiers in Psychology},
  year = {2022},
}

@incollection{ekberg1999anvandningen,
  author = {Ekberg, Lena},
  booktitle = {{Svenskans beskrivning 23: förhandlingar vid tjugotredje Sammankomsten för svenskans beskrivning: Göteborg den 15--16 maj 1998}},
  title = {{Användningen av komplexa predikat hos invandrarbarn i Rosengård}},
  editor = {Andersson, Lars-Gunnar and Lundqvist, Aina and Norén, Kerstin and Rogström, Lena},
  langid = {swedish},
  pages = {86--95},
  location = {Lund},
  publisher = {Lund University Press},
  year = {1999},
}

@incollection{fillmore_1977,
  author = {Fillmore, Charles J.},
  booktitle = {Linguistic Structures Processing: {Fundamental} Studies in Computer Science},
  title = {Scenes-and-frames Semantics},
  editor = {Zampolli, Antonio},
  pages = {55--81},
  publisher = {North Holland},
  series = {Fundamental Studies in Computer Science},
  volume = {59},
  address = {Amsterdam; New York; Oxford},
  year = {1977},
}

@incollection{Koprivova:Hnatkova:2014,
  author = {Kopřivová, Marie and Hnátková, Milena},
  booktitle = {Phraseology in dictionaries and corpora},
  title = {From Dictionary to Corpus},
  editor = {Jesenšek, Vida and Grzybek, Peter},
  pages = {155--168},
  publisher = {Filozofska fakulteta Maribor},
  address = {Maribor},
  year = {2014},
}

@article{fillmore_1976,
  author = {Fillmore, Charles J.},
  title = {Frame {Semantics} and the Nature of Language},
  pages = {20--32},
  volume = {280},
  journal = {Annals of the New York Academy of Sciences},
  year = {1976},
}

@book{council2001common,
  author = {{Council of Europe}},
  title = {Common {European} {Framework} of {Reference} for {Languages}: {Learning}, teaching, assessment},
  publisher = {Modern Languages Division (Strasbourg) and Cambridge University Press},
  year = {2001},
}

@book{holton_etal_1997,
  author = {Holton, David and Mackridge, Peter and Philippaki-Warburton, Irene},
  title = {Greek: {A} comprehensive grammar of the modern language},
  publisher = {Routledge},
  address = {London; New York},
  year = {1997},
}

@article{Mitchell/Lapata:10,
  author = {Jeff Mitchell and Mirella Lapata},
  title = {Composition in distributional models of semantics},
  pages = {1388--1429},
  volume = {34},
  journal = {Cognitive Science},
  year = {2010},
}

@incollection{parsemeMWE15,
  author = {Savary, Agata and Sailer, Manfred and Parmentier, Yannick and Rosner, Michael and Rosén, Victoria and Przepiórkowski, Adam and Krstev, Cvetana and Vincze, Veronika and Wójtowicz, Beata and Losnegaard, Gyri and Parra Escartín, Carla and Waszczuk, Jakub and Constant, Matthieu and Osenova, Petya and Sangati, Federico},
  booktitle = {{7th Language and Technology Conference: Human language technologies as a challenge for computer science and linguistics (LTC 2015)}},
  title = {{PARSEME: {PARSing} and Multiword Expressions within a European multilingual network}},
  url = {https://hal.archives-ouvertes.fr/hal-01223349},
  address = {Poznań, Poland},
  year = {2015},
}

@book{Plag:03,
  author = {Ingo Plag},
  title = {Word-Formation in {English}},
  publisher = {Cambridge University Press},
  year = {2003},
}

@book{Manning/Schuetze:99,
  author = {Christopher D. Manning and Hinrich Schütze},
  title = {Foundations of Statistical Natural Language Processing},
  publisher = {MIT Press},
  address = {Cambridge, MA, USA},
  ids = {Manning1999},
  year = {1999},
}

% The conference place is kept in venue; address holds the publisher's city
% (address and location are aliases, so only one of them may be set).
@incollection{AUGUSTINUS16.486,
  author = {Liesbeth Augustinus and Vincent Vandeghinste and Tom Vanallemeersch},
  booktitle = {Proceedings of the Tenth International Conference on {Language Resources and Evaluation} ({LREC} 2016)},
  title = {{Poly-GrETEL}: {Cross}-Lingual Example-based Querying of Syntactic Constructions},
  editor = {Nicoletta Calzolari and Khalid Choukri and Thierry Declerck and Sara Goggi and Marko Grobelnik and Bente Maegaard and Joseph Mariani and Helene Mazo and Asuncion Moreno and Jan Odijk and Stelios Piperidis},
  venue = {Portorož, Slovenia},
  pages = {3549--3554},
  publisher = {European Language Resources Association (ELRA)},
  address = {Paris, France},
  year = {2016},
}

@incollection{Kompan2011,
  author = {Michal Kompan and Mária Bieliková},
  booktitle = {Advances in Intelligent and Soft Computing},
  title = {News article classification based on a vector representation including words' collocations},
  doi = {10.1007/978-3-642-23163-6_1},
  pages = {1--8},
  location = {Berlin Heidelberg},
  publisher = {Springer},
  year = {2011},
}

% Two-word surnames are given in comma form so the name parser keeps them together.
@incollection{AUGUSTINUS16.362,
  author = {Liesbeth Augustinus and Peter Dirix and Van Niekerk, Daniel and Ineke Schuurman and Vincent Vandeghinste and Van Eynde, Frank and Van Huyssteen, Gerhard},
  booktitle = {Proceedings of the Tenth International Conference on {Language Resources and Evaluation} ({LREC} 2016)},
  title = {{AfriBooms}: {An} Online Treebank for {Afrikaans}},
  editor = {Nicoletta Calzolari and Khalid Choukri and Thierry Declerck and Sara Goggi and Marko Grobelnik and Bente Maegaard and Joseph Mariani and Helene Mazo and Asuncion Moreno and Jan Odijk and Stelios Piperidis},
  venue = {Portorož, Slovenia},
  pages = {677--682},
  publisher = {European Language Resources Association (ELRA)},
  address = {Paris, France},
  year = {2016},
}
@phdthesis{moiron2005data,
  author = {Villada Moirón, María Begoña},
  title = {Data-driven identification of fixed expressions and their modifiability},
  school = {University of Groningen},
  year = {2005},
}

@incollection{BurchardtPinkal2009,
  author = {Burchardt, Aljoscha and Katrin Erk and Anette Frank and Andrea Kowalski and Sebastian Padó and Manfred Pinkal},
  booktitle = {Multilingual {FrameNets} in computational lexicography: {Methods} and Applications},
  title = {Using {FrameNet} for the semantic analysis of {German}: {Annotation}, representation and automation},
  editor = {Hans C. Boas},
  pages = {209--244},
  publisher = {De Gruyter Mouton},
  address = {Berlin, New York},
  year = {2009},
}

% NOTE(review): describes the same chapter as the entry keyed savary:hal-01917174.
% The DOI here was truncated and has been aligned with that entry - confirm it resolves.
@incollection{SavaryEtAl:18,
  author = {Agata Savary and Marie Candito and Barbu Mititelu, Verginica and Eduard Bejcek and Fabienne Cap and Slavomir Ceplo and Silvio Ricardo Cordeiro and Gulsen Eryigit and Voula Giouli and Maarten van Gompel and Yaakov HaCohen-Kerner and Jolanta Kovalevskaite and Simon Krek and Chaya Liebeskind and Johanna Monti and Parra Escartin, Carla and Lonneke van der Plas and Behrang QasemiZadeh and Carlos Ramisch and Federico Sangati and Ivelina Stoyanova and Veronika Vincze},
  booktitle = {Multiword expressions at length and in depth: {Extended} Papers from the {MWE} 2017 Workshop},
  title = {{PARSEME} multilingual corpus of verbal multiword expressions},
  doi = {10.5281/zenodo.1471590},
  editor = {Stella Markantonatou and Carlos Ramisch and Agata Savary and Veronika Vincze},
  publisher = {Language Science Press},
  pages = {87--147},
  address = {Berlin},
  year = {2018},
}

@inbook{Wiley2014,
  author = {Daniel T. Larose and Chantal D. Larose},
  booktitle = {Discovering Knowledge in Data},
  title = {Association Rules},
  doi = {10.1002/9781118874059.ch12},
  pages = {247--265},
  publisher = {John Wiley and Sons},
  year = {2014},
}

@book{Cechova:2011,
  author = {Čechová, Marie},
  title = {Čeština: {Řeč} a jazyk},
  publisher = {SPN},
  address = {Praha},
  year = {2011},
}

@article{abrahamsson2009age,
  author = {Abrahamsson, Niclas and Hyltenstam, Kenneth},
  title = {Age of onset and nativelikeness in a second language: {Listener} perception versus linguistic scrutiny},
  number = {2},
  pages = {249--306},
  volume = {59},
  journal = {Language Learning},
  publisher = {Wiley Online Library},
  year = {2009},
}

@article{nesselhauf2003use,
  author = {Nesselhauf, Nadja},
  title = {The use of collocations by advanced learners of {English} and some implications for teaching},
  number = {2},
  pages = {223--242},
  volume = {24},
  journal = {Applied Linguistics},
  year = {2003},
}

@incollection{irishdatabase,
  author = {Ní Loingsigh, Katie and Ó Raghallaigh, Brian},
  booktitle = {{Proceedings of the 17th EURALEX International Congress}},
  title = {Starting from scratch: {The} Creation of an {Irish}-language idiom database},
  editor = {Margalitadze, Tinatin and Meladze, George},
  publisher = {Tbilisi State University},
  pages = {726--734},
  address = {Tbilisi},
  year = {2016},
}

@incollection{schmidt_kicktionary_2009,
  author = {Schmidt, Thomas C.},
  booktitle = {Multilingual {FrameNets} in Computational Lexicography: {Methods} and Applications},
  title = {The {Kicktionary}: {A} Multilingual Lexical Resource of Football Language},
  editor = {Hans C. Boas},
  pages = {101--134},
  publisher = {De Gruyter Mouton},
  address = {Berlin, New York},
  year = {2009},
}

@book{teleman1999svenska,
  author = {Teleman, Ulf and Hellberg, Staffan and Andersson, Erik and Christensen, Lisa},
  title = {{Svenska akademiens grammatik}},
  publisher = {Norstedts ordbok and Svenska Akademien},
  year = {1999},
}

@incollection{Jelinek:2021,
  author = {Jelínek, Tomáš and Jan Křivan and Vladimír Petkevič and Hana Skoumalová and Jana Šindlerová},
  booktitle = {Text, speech, and dialogue},
  title = {{SYN2020}: {A} New Corpus of {Czech} with an Innovated Annotation},
  doi = {10.1007/978-3-030-83527-9_4},
  editor = {Ekštein, Kamil and Pártl, František and Konopík, Miloslav},
  pages = {48--59},
  publisher = {Springer},
  address = {Cham},
  year = {2021},
}

@incollection{Jelinek:2020,
  author = {Jelínek, Tomáš},
  booktitle = {Reproducible multiword expressions from a theoretical and empirical perspective},
  title = {Multi-word lexical units with repetition of lexemes in {Czech} and identification of their variants},
  editor = {Szerszunowicz, Joanna and Awier, Martyna},
  pages = {141--153},
  publisher = {University of Bialystok},
  url = {http://hdl.handle.net/11320/11351},
  address = {Białystok},
  year = {2020},
}

@incollection{Jelinek:2019,
  author = {Jelínek, Tomáš},
  booktitle = {Text, speech, and dialogue: 22nd international conference},
  title = {Using a database of multiword expressions in dependency parsing},
  doi = {10.1007/978-3-030-27947-9_2},
  editor = {Ekštein, Kamil},
  pages = {19--31},
  publisher = {Springer},
  address = {Cham},
  year = {2019},
}

@article{Jelinek:2018,
  author = {Jelínek, Tomáš and Kopřivová, Marie and Petkevič, Vladimír and Skoumalová, Hana},
  title = {Variabilita českých frazémů v úzu},
  number = {2},
  pages = {151--175},
  url = {https://casopispromodernifilologii.ff.cuni.cz/magazin/2018-100-2-2/},
  volume = {100},
  journal = {Časopis pro moderní filologii},
  year = {2018},
}

@incollection{Chu2018,
  author = {Yen-Lun Chu and Tzone-I Wang},
  series = {Lecture Notes in Computer Science},
  booktitle = {{ICITL 2018}: {Innovative} technologies and learning},
  number = {11003},
  title = {A sentence-wide collocation recommendation system with error detection for academic writing},
  editor = {Ting-Ting Wu and Yueh-Min Huang and Rustam Shadiev and Lin Lin and Istenič Starčič, Andreja},
  pages = {307--316},
  publisher = {Springer},
  year = {2018},
  doi = {10.1007/978-3-319-99737-7_33},
}

@article{DimaEtAl:19,
  author = {Corina Dima and Daniel {de Kok} and Neele Witte and Erhard Hinrichs},
  title = {No word is an island: {A} transformation weighting model for semantic composition},
  pages = {437--451},
  volume = {7},
  journal = {Transactions of the Association for Computational Linguistics},
  year = {2019},
}

@book{Rosettaboek:94,
  author = {M. T. Rosetta},
  title = {Compositional {Translation}},
  publisher = {Kluwer},
  series = {Kluwer International Series in Engineering and Computer Science},
  number = {273},
  address = {Dordrecht},
  year = {1994},
}

@article{BalkaNet,
  author = {Tufiș, Dan and Dan Cristea and Sophia Stamou},
  title = {{BalkaNet}: {Aims}, Methods, Results and Perspectives. {A} General Overview},
  number = {1--2},
  pages = {9--43},
  volume = {7},
  journal = {Romanian Journal of Information Science and Technology},
  year = {2004},
}

@incollection{Borin-Lars2021-311388,
  author = {Borin, Lars},
  booktitle = {The {Swedish} {FrameNet++}: {Harmonization}, integration, method development, and practical language technology applications},
  title = {Multiword expressions: {A} tough typological nut for {Swedish} {FrameNet++}},
  editor = {Dannélls, Dana and Lars Borin and Friberg Heppin, Karin},
  pages = {221--259},
  publisher = {John Benjamins},
  address = {Amsterdam},
  year = {2021},
}

@article{piao2005comparing,
  author = {Piao, Scott Songlin and Rayson, Paul and Archer, Dawn and McEnery, Tony},
  title = {{Comparing and combining a semantic tagger and a statistical tool for MWE extraction}},
  number = {4},
  pages = {378--397},
  volume = {19},
  journal = {Computer Speech \& Language},
  publisher = {Elsevier},
  year = {2005},
}

@incollection{Sag:Baldwin:2002,
  author = {Sag, Ivan A. and Baldwin, Timothy and Bond, Francis and Copestake, Ann and Flickinger, Dan},
  booktitle = {{Proceedings of the third international conference on Intelligent Text Processing and Computational Linguistics (CICLing 2002)}},
  title = {Multiword Expressions: {A} Pain in the Neck for {NLP}},
  editor = {Gelbukh, Alexander F.},
  pages = {1--15},
  publisher = {Springer},
  year = {2002},
}

% The conference place is kept in venue; address holds the publisher's city
% (address and location are aliases, so only one of them may be set).
@incollection{BRUGMAN16.471,
  author = {Hennie Brugman and Martin Reynaert and Nicoline van der Sijs and René van Stipriaan and Tjong Kim Sang, Erik and Antal van den Bosch},
  booktitle = {Proceedings of the Tenth International Conference on {Language Resources and Evaluation} ({LREC} 2016)},
  title = {Nederlab: {Towards} a Single Portal and Research Environment for Diachronic {Dutch} Text Corpora},
  editor = {Nicoletta Calzolari and Khalid Choukri and Thierry Declerck and Sara Goggi and Marko Grobelnik and Bente Maegaard and Joseph Mariani and Helene Mazo and Asuncion Moreno and Jan Odijk and Stelios Piperidis},
  venue = {Portorož, Slovenia},
  pages = {1277--1281},
  publisher = {European Language Resources Association (ELRA)},
  address = {Paris, France},
  year = {2016},
}

@incollection{di_fabio_etal_2019,
  author = {Di Fabio, Andrea and Conia, Simone and Navigli, Roberto},
  booktitle = {Proceedings of the 2019 Conference on {Empirical} {Methods} in {Natural} {Language} {Processing} and the 9th {International} {Joint} {Conference} on {Natural} {Language} {Processing} ({EMNLP}-{IJCNLP})},
  title = {{VerbAtlas}: {A} Novel Large-Scale Verbal Semantic Resource and Its Application to Semantic Role Labeling},
  pages = {627--637},
  publisher = {Association for Computational Linguistics},
  address = {Hong Kong, China},
  year = {2019},
}

@book{Fellbaum:98,
  title = {{WordNet}: {An} electronic lexical database},
  editor = {Christiane Fellbaum},
  publisher = {MIT Press},
  series = {Language, Speech, and Communication},
  address = {Cambridge, MA},
  year = {1998},
}

@incollection{HaettyEtAl:21,
  author = {Hätty, Anna and Julia Bettinger and Michael Dorna and Jonas Kuhn and Sabine {Schulte im Walde}},
  booktitle = {Proceedings of the 10th Joint Conference on Lexical and Computational Semantics},
  title = {Compound or Term Features? {Analyzing} Salience in Predicting the Difficulty of {German} Noun Compounds across Domains},
  pages = {252--262},
  address = {Bangkok, Thailand},
  year = {2021},
}

@incollection{SchulteImWaldeEtAl:16b,
  author = {Sabine {Schulte im Walde} and Anna Hätty and Stefan Bott},
  booktitle = {Proceedings of the 5th Joint Conference on Lexical and Computational Semantics},
  title = {The role of modifier and head properties in predicting the compositionality of {English} and {German} noun-noun compounds: {A} vector-space perspective},
  pages = {148--158},
  address = {Berlin, Germany},
  year = {2016},
}

@incollection{SchulteImWaldeEtAl:16a,
  author = {Sabine {Schulte im Walde} and Anna Hätty and Stefan Bott and Nana Khvtisavrishvili},
  booktitle = {Proceedings of the 10th International Conference on {Language Resources and Evaluation}},
  title = {{G$_h$ost-NN: A} Representative Gold Standard of {German} Noun-Noun Compounds},
  pages = {2285--2292},
  address = {Portorož, Slovenia},
  year = {2016},
}

@incollection{you_liu_2005,
  author = {You, Liping and Liu, Kaiying},
  booktitle = {2005 {International} {Conference} on {Natural} {Language} {Processing} and {Knowledge} {Engineering}},
  title = {Building {Chinese} {FrameNet} Database},
  pages = {301--306},
  publisher = {IEEE},
  address = {Wuhan, China},
  year = {2005},
}

@article{gregoire_duelme_2010,
  author = {Grégoire, Nicole},
  title = {{DuELME}: {A} {Dutch} electronic lexicon of multiword expressions},
  number = {1},
  pages = {23--39},
  volume = {44},
  journal = {Language Resources and Evaluation},
  year = {2010},
}

@inbook{FinkbeinerSchluecker2019CompoundsMWE,
  author = {Rita Finkbeiner and Barbara Schlücker},
  booktitle = {Complex Lexical Units},
  title = {{Compounds and multi-word expressions in the languages of Europe}},
  doi = {10.1515/9783110632446-001},
  editor = {Barbara Schlücker},
  pages = {1--44},
  publisher = {De Gruyter},
  address = {Berlin, Boston},
  lastchecked = {2023-02-26},
  year = {2019},
}
@Book{Dalrymple2023, title = {Handbook of {Lexical Functional Grammar}}, doi = {10.5281/zenodo.10037797}, editor = {Dalrymple, Mary}, number = {13}, publisher = {Language Science Press}, series = {Empirically Oriented Theoretical Morphology and Syntax}, address = {Berlin}, year = {2023}, } @incollection{virk_etal_2021, author = {Virk, Shafqat Mumtaz and Dannélls, Dana and Borin, Lars and Forsberg, Markus}, booktitle = {Proceedings of the International Conference on {Recent} {Advances} in {Natural} {Language} {Processing} ({RANLP} 2021)}, title = {A Data-Driven Semi-Automatic Framenet Development Methodology}, pages = {1471--1479}, publisher = {INCOMA}, address = {Held Online}, year = {2021}, } @Article{Rosen:Skoumalova:2018, author = {Rosen, Alexandr and Skoumalová, Hana}, title = {No way to have your say out of the frame: {Specifying} valency of multi-word expressions}, number = {72}, pages = {301--320}, url = {https://www.ceeol.com/search/article-detail?id=732446}, volume = {2018}, journal = {Prace Filologiczne}, year = {2018}, } @incollection{laskova-etal-2019-modeling, author = {Laskova, Laska and Osenova, Petya and Simov, Kiril and Radev, Ivajlo and Kancheva, Zara}, booktitle = {Proceedings of the joint workshop on multiword expressions and {WordNet} ({MWE-WN} 2019)}, title = {Modeling {MWE}s in {BTB}-{WN}}, editor = {Savary, Agata and Escartín, Carla Parra and Bond, Francis and Mitrović, Jelena and Mititelu, Verginica Barbu}, pages = {70--78}, publisher = {Association for Computational Linguistics}, doi = {10.18653/v1/W19-5109}, address = {Florence, Italy}, year = {2019}, } @Book{Vondricka:2014, author = {Vondřička, Pavel}, title = {Formalized contrastive lexical description: {A} framework for bilingual dictionaries}, publisher = {LINCOM}, address = {München}, year = {2014}, } @InCollection{mel1998collocations, author = {Mel’čuk, Igor}, booktitle = {Phraseology: {Theory}, analysis, and applications}, title = {Collocations and lexical functions}, editor = 
{Cowie, A. P.}, pages = {23--53}, publisher = {Clarendon Press}, place = {Oxford}, year = {1998}, } @Book{Bauer:17, author = {Laurie Bauer}, title = {Compounds and Compounding}, publisher = {Cambridge University Press}, year = {2017}, } @incollection{buchholz-marsi-2006-conllx, author = {Buchholz, Sabine and Erwin Marsi}, booktitle = {{Proceedings of the tenth conference on computational natural language learning (CoNLL-X)}}, title = {{CoNLL-X} shared task on multilingual dependency parsing}, url = {https://api.semanticscholar.org/CorpusID:13075323}, year = {2006}, } @incollection{giouli_etal_2019, author = {Giouli, Voula and Foufi, Vassiliki and Fotopoulou, Aggeliki}, booktitle = {13th {International} {Conference} on {Greek} {Linguistics}}, title = {Annotating {Greek} {VMWEs} in running text: {A} piece of cake or looking for a needle in a haystack?}, editor = {Chondrogianni, Maria and Courtenage, Simon and Horrocks, Geoffrey and Arvaniti, Amalia and Tsimpli, Ianthi}, pages = {125--134}, address = {University of Westminster, London, UK}, year = {2019}, } @incollection{OSeaghdha:07, author = {Diarmuid {Ó Séaghdha}}, booktitle = {Proceedings of the {Corpus Linguistics} {(CL2007)}}, editor = {Matthew Davies and Paul Rayson and Susan Hunston and Pernilla Danielsson}, title = {Designing and Evaluating a Semantic Annotation Scheme for Compound Nouns}, publisher = {University of Birmingham, UK}, address = {Birmingham, UK}, url = {https://ucrel.lancs.ac.uk/publications/cl2007/}, year = {2007}, } @InBook{barbu-mititelu-leseva-2018, author = {Barbu Mititelu, Verginica and Leseva, Svetlozara}, booktitle = {Multiword expressions: {I}nsights from a multi-lingual perspective}, title = {Derivation in the domain of multiword expressions}, doi = {10.5281/zenodo.1182601}, editor = {Sailer, Manfred and Markantonatou, Stella}, pages = {215--246}, publisher = {Language Science Press}, place = {Berlin}, year = {2018}, } @Article{VANEYNDE2016104, author = {Frank {Van Eynde} and Liesbeth 
Augustinus and Vincent Vandeghinste}, title = {Number agreement in copular constructions: {A} treebank-based investigation}, doi = {10.1016/j.lingua.2016.02.001}, pages = {104--126}, volume = {178}, journal = {Lingua}, year = {2016}, } @incollection{gurt2023, author = {Markantonatou, Stella and Th. Constantinides, Nicolaos and Stamou, Vivian and Arampatzakis, Vasileios and G. Krimpas, Panagiotis and Pavlidis, George}, booktitle = {Proceedings of the Sixth {Workshop on Universal Dependencies} {(UDW, GURT/SyntaxFest} 2023)}, title = {{Methodological issues regarding the semi-automatic {UD} treebank creation of under-resourced languages: The case of Pomak}}, pages = {27--35}, url = {https://aclanthology.org/2023.udw-1.4}, address = {Washington, D.C.}, year = {2023}, } @incollection{hnatkova-etal-2019, author = {Hnátková, Milena and Jelínek, Tomáš and Kopřivová, Marie and Petkevič, Vladimír and Rosen, Alexandr and Skoumalová, Hana and Vondřička, Pavel}, booktitle = {Trudy meždunarodnoj konferencii {Korpusnaja Lingvistika}}, title = {{Lexical database of multiword expressions in Czech}}, pages = {9--16}, publisher = {Saint Petersburg University Press}, address = {Saint Petersburg, Russian Federation}, year = {2019}, } @incollection{HaettyEtAl:19b, author = {Hätty, Anna and Ulrich Heid and Anna Moskvina and Julia Bettinger and Michael Dorna and Sabine {Schulte im Walde}}, booktitle = {Proceedings of the 15th Conference on Natural Language Processing ({KONVENS 2019})}, title = {{AkkuBohrHammer} vs. 
{AkkuBohrhammer}: {E}xperiments towards the evaluation of compound splitting tools for general language and specific domains}, pages = {59--67}, address = {Erlangen, Germany}, year = {2019}, publisher = {German Society for Computational Linguistics \& Language Technology} } @incollection{attia2010automatic, author = {Attia, Mohammed and Toral, Antonio and Tounsi, Lamia and Pecina, Pavel and Van Genabith, Josef}, booktitle = {Proceedings of the 2010 Workshop on Multiword Expressions: {From} Theory to Applications}, title = {{Automatic extraction of Arabic multiword expressions}}, editor = {Laporte, Éric and Nakov, Preslav and Ramisch, Carlos and Villavicencio, Aline}, pages = {19--27}, publisher = {Coling 2010 Organizing Committee}, year = {2010}, } @incollection{ramisch_etal_2020, author = {Ramisch, Carlos and Savary, Agata and Guillaume, Bruno and Waszczuk, Jakub and Candito, Marie and Vaidya, Ashwini and Barbu Mititelu, Verginica and Bhatia, Archna and Iñurrieta, Uxoa and Giouli, Voula and Güngör, Tunga and Jiang, Menghan and Lichte, Timm and Liebeskind, Chaya and Monti, Johanna and Ramisch, Renata and Stymne, Sara and Walsh, Abigail and Xu, Hongzhi}, editor = {Stella Markantonatou and John Mccrae and Jelena Mitrović and Carole Tiberiu and Carlos Ramisch and Ashwini Vaidya and Petya Osenova and Agata Savary}, booktitle = {Proceedings of the Joint Workshop on {Multiword} {Expressions} and {Electronic} {Lexicons} ({MWE-LEX} 2020)}, title = {Edition 1.2 of the {PARSEME} Shared Task on Semi-supervised Identification of Verbal Multiword Expressions}, pages = {107--118}, publisher = {Association for Computational Linguistics}, address = {Barcelona}, year = {2020}, } @incollection{DankersEtAl:22a, author = {Dankers, Verna and Bruni, Elia and Hupkes, Dieuwke}, booktitle = {Proceedings of the 60th Annual Meeting of the {Association for Computational Linguistics}}, title = {The paradox of the compositionality of natural language: {A} neural machine translation case study}, 
pages = {4154--4175}, address = {Dublin, Ireland}, year = {2022}, editor = {Smaranda Muresan and Preslav Nakov and Aline Villavicencio}, doi = {10.18653/v1/2022.acl-long.286} } @article{LibbenEtAl:97, author = {Gary Libben and Martha Gibson and Yeo Bom Yoon and Dominiek Sandra}, journal = {CLASNET Working Papers}, title = {Semantic Transparency and Compound Fracture}, number = {9}, pages = {1--13}, year = {1997}, } @incollection{Schaefer/Bildhauer:12, author = {Roland Schäfer and Felix Bildhauer}, editor = {Nicoletta Calzolari and Khalid Choukri and Thierry Declerck and Mehmet Uğur Doğan and Bente Maegaard and Joseph Mariani and Asuncion Moreno and Jan Odijk and Stelios Piperidis}, booktitle = {Proceedings of the 8th International Conference on {Language Resources and Evaluation} ({LREC'12})}, title = {Building large corpora from the web using a new efficient tool chain}, pages = {486--493}, address = {Istanbul}, year = {2012}, url = {http://www.lrec-conf.org/proceedings/lrec2012/pdf/834_Paper.pdf} } @incollection{volodina2016swell, author = {Volodina, Elena and Pilán, Ildikó and Enström, Ingegerd and Llozhi, Lorena and Lundkvist, Peter and Sundberg, Gunlög and Sandell, Monica}, booktitle = {Proceedings of the Tenth International Conference on {Language Resources and Evaluation} ({LREC'16})}, title = {{Swell on the rise: Swedish learner language corpus for European reference level studies}}, editor = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Goggi, Sara and Grobelnik, Marko and Maegaard, Bente and Mariani, Joseph and Mazo,Hélène and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios}, pages = {206--212}, url = {https://aclanthology.org/L16-1}, location = {Portorož, Slovenia}, publisher = {ACL}, year = {2016}, } @incollection{savary:hal-01917174, author = {Agata Savary and Marie Candito and Verginica Barbu Mititelu and Bejček, Eduard and Cap, Fabienne and Čéplö, Slavomír and Silvio Ricardo Cordeiro and Cebiroğlu Eryiğit, Gülşen and 
Giouli, Voula and Van Gompel, Maarten and HaCohen-Kerner, Yaakov and Kovalevskaite, Jolanta and Krek, Simon and Liebeskind, Chaya and Monti, Johanna and Parra Escartín, Carla and Van Der Plas, Lonneke and Qasemizadeh, Behrang and Carlos Ramisch and Sangati, Federico and Stoyanova, Ivelina and Veronika Vincze},
  booktitle = {Multiword expressions at length and in depth: {Extended} papers from the {MWE} 2017 workshop},
  title = {{PARSEME} multilingual corpus of verbal multiword expressions},
  editor = {Stella Markantonatou and Carlos Ramisch and Agata Savary and Veronika Vincze},
  pages = {87--147},
  publisher = {Language Science Press},
  location = {Berlin},
  doi = {10.5281/zenodo.1471590},
  ids = {Savary-et-al2018},
  year = {2018},
}

% LREC proceedings are published by ELRA, matching the other LREC entries in this file.
@incollection{Alipoor/SchulteImWalde:20,
  author = {Pegah Alipoor and {Schulte im Walde}, Sabine},
  booktitle = {Proceedings of the 12th {Language Resources and Evaluation Conference} ({LREC'2020})},
  title = {Variants of vector space reductions for predicting the compositionality of {E}nglish noun compounds},
  editor = {Nicoletta Calzolari and Frédéric Béchet and Philippe Blache and Khalid Choukri and Christopher Cieri and Thierry Declerck and Sara Goggi and Hitoshi Isahara and Bente Maegaard and Joseph Mariani and Hélène Mazo and Asuncion Moreno and Jan Odijk and Stelios Piperidis},
  url = {https://aclanthology.org/2020.lrec-1.539},
  pages = {4379--4387},
  address = {Marseille, France},
  publisher = {European Language Resources Association (ELRA)},
  year = {2020},
}

@Article{Gantar2018,
  author = {Gantar, Polona and Colman, Lut and Parra Escartín, Carla and Martínez Alonso, Héctor},
  title = {{Multiword expressions: Between lexicography and NLP}},
  doi = {10.1093/ijl/ecy012},
  number = {2},
  pages = {138--162},
  volume = {32},
  journal = {International Journal of Lexicography},
  year = {2018},
}

@inproceedings{Role2011,
  author = {François Role and Mohamed Nadif},
  booktitle = {Proceedings of the International Conference on {Knowledge Discovery and Information Retrieval} ({KDIR} 2011)},
  title = {Handling
the impact of low frequency events on co-occurrence based measures of word similarity: {A} case study of pointwise mutual information},
  doi = {10.5220/0003655102260231},
  pages = {218--223},
  location = {Setúbal, Portugal},
  publisher = {SciTePress},
  year = {2011},
}

@incollection{Vietri2014,
  author = {Vietri, Simonetta},
  booktitle = {Proceedings of the Workshop on Lexical and Grammatical Resources for Language Processing ({LG-LP 2014})},
  editor = {Jorge Baptista and Pushpak Bhattacharyya and Christiane Fellbaum and Mikel Forcada and Chu-Ren Huang and Svetla Koeva and Cvetana Krstev and Éric Laporte},
  title = {The Lexicon-Grammar of {Italian} Idioms},
  pages = {137--146},
  publisher = {Association for Computational Linguistics and Dublin City University},
  doi = {10.3115/v1/W14-5817},
  address = {Dublin, Ireland},
  year = {2014},
}

@Book{enstrom1990feltyper,
  author = {Enström, Ingegerd},
  title = {Feltyper i invandrargymnasisters användning av partikelverb, prefixverb och reflexiva verb},
  langid = {swedish},
  publisher = {Göteborgs universitet},
  address = {Göteborg},
  series = {Rapporter från institutionen för nordiska språk/svenska ({NORDRAPP})},
  number = {4},
  year = {1990},
}

% MWE 2013 workshop paper; publisher spelled as in the other ACL entries of this file.
@incollection{shigeto2013construction,
  author = {Shigeto, Yutaro and Azuma, Ai and Hisamoto, Sorami and Kondo, Shuhei and Kose, Tomoya and Sakaguchi, Keisuke and Yoshimoto, Akifumi and Yung, Frances and Matsumoto, Yuji},
  booktitle = {Proceedings of the 9th Workshop on Multiword Expressions ({MWE 2013})},
  title = {{Construction of English MWE dictionary and its application to POS tagging}},
  editor = {Kordoni, Valia and Ramisch, Carlos and Villavicencio, Aline},
  pages = {139--144},
  location = {Atlanta, GA},
  publisher = {Association for Computational Linguistics},
  year = {2013},
}

@Article{forsberg2010using,
  author = {Forsberg, Fanny},
  title = {Using conventional sequences in {L2} {F}rench},
  pages = {25--51},
  volume = {48},
  journal = {International Review of Applied Linguistics in Language Teaching},
  year
= {2010},
}

@incollection{agirre2006lexicalization,
  author = {Agirre, Eneko and Aldezabal, Izaskun and Pociello, Eli},
  booktitle = {Proceedings of Third International {WordNet} Conference},
  title = {Lexicalization and multiword expressions in the {B}asque {W}ord{N}et},
  editor = {Sojka, Petr and Choi, Key-Sun and Fellbaum, Christine and Vossen, Piek},
  pages = {131--138},
  year = {2006},
}

@Article{kurtes2008english,
  author = {Kurtes, Svetlana and Saville, Nick},
  title = {{The English profile programme: An overview}},
  pages = {2--4},
  volume = {33},
  journal = {Research Notes},
  year = {2008},
}

% Names in a name list must be joined with " and "; a comma would merge the last two editors into one name.
@incollection{candito_etal_2014,
  author = {Candito, Marie and Amsili, Pascal and Barque, Lucie and Benamara, Farah and de Chalendar, Gaël and Djemaa, Marianne and Haas, Pauline and Huyghe, Richard and Mathieu, Yvette Yannick and Muller, Philippe and Sagot, Benoît and Vieu, Laure},
  booktitle = {Proceedings of the Ninth International {Conference} on {Language} {Resources} and {Evaluation} ({LREC}'14)},
  title = {Developing a {French} {FrameNet}: {Methodology} and First Results},
  editor = {Nicoletta Calzolari and Khalid Choukri and Thierry Declerck and Hrafn Loftsson and Bente Maegaard and Joseph Mariani and Asuncion Moreno and Jan Odijk and Stelios Piperidis},
  pages = {1372--1379},
  publisher = {European Language Resources Association (ELRA)},
  address = {Reykjavik, Iceland},
  year = {2014},
  url = {https://aclanthology.org/L14-1411/},
}

@InCollection{tp:14406719669147366,
  author = {Broekhuis, Hans and Corver, Norbert and Vos, Riet},
  booktitle = {Taalportaal},
  title = {{The impersonal passive}},
  url = {https://taalportaal.org/taalportaal/topic/link/syntax__Dutch__vp__V3_alternations__V3_alternations.},
  year = {2020},
}

@InCollection{prentice2013flerordsenheter,
  author = {Prentice, Julia and Sköldberg, Emma},
  booktitle = {Svenska som andraspråk: {I} forskning, undervisning och samhälle},
  title = {Flerordsenheter -- ur ett andraspråksperspektiv},
  edition = {2},
  editor = {Hyltenstam, Kenneth
and Lindberg, Inger},
  pages = {197--220},
  publisher = {Studentlitteratur},
  location = {Lund},
  year = {2013},
}

% PARSEME shared task 1.1 overview paper.
@incollection{ramisch_etal_2018,
  author = {Ramisch, Carlos and Cordeiro, Silvio Ricardo and Savary, Agata and Vincze, Veronika and Barbu Mititelu, Verginica and Bhatia, Archna and Buljan, Maja and Candito, Marie and Gantar, Polona and Giouli, Voula and Güngör, Tunga and Hawwari, Abdelati and Iñurrieta, Uxoa and Kovalevskaitė, Jolanta and Krek, Simon and Lichte, Timm and Liebeskind, Chaya and Monti, Johanna and Parra Escartín, Carla and QasemiZadeh, Behrang and Ramisch, Renata and Schneider, Nathan and Stoyanova, Ivelina and Vaidya, Ashwini and Walsh, Abigail},
  booktitle = {Proceedings of the {Joint} {Workshop} on {Linguistic} {Annotation}, {Multiword} {Expressions} and {Constructions} ({LAW}-{MWE}-{CxG}-2018)},
  editor = {Agata Savary and Carlos Ramisch and Jena D. Hwang and Nathan Schneider and Melanie Andresen and Sameer Pradhan and Miriam R. L. Petruck},
  title = {Edition 1.1 of the {PARSEME} shared task on automatic identification of verbal multiword expressions},
  pages = {222--240},
  publisher = {Association for Computational Linguistics},
  address = {Santa Fe, NM},
  year = {2018},
}

@Book{jackendoff1997architecture,
  author = {Jackendoff, Ray},
  title = {The architecture of the language faculty},
  number = {28},
  series = {Linguistic Inquiry Monographs},
  location = {Cambridge, MA},
  publisher = {MIT Press},
  year = {1997},
}

% NOTE(review): the city is embedded in the publisher string here and "place" is not a
% field that BibTeX or biblatex reads; left as is, confirm the intended rendering.
@Book{sebatr,
  author = {Karahóǧa, Sebajdín},
  title = {{Μεταφράσεις ελληνικής και αγγλικής ποίησης στην πομακική γλώσσα}},
  publisher = {Ξάνθη: Πολιτιστικός Σύλλογος Πομάκων Ξάνθης},
  place = {Xanthi},
  year = {2017},
}

@InBook{dyvik2019,
  author = {Dyvik, Helge and Losnegaard, Gyri Smørdal and Rosén, Victoria},
  booktitle = {Representation and parsing of multiword expressions},
  title = {Multiword expressions in an {LFG} grammar for {Norwegian}},
  doi = {10.5281/zenodo.2579037},
  editor = {Parmentier, Yannick and Waszczuk, Jakub},
  pages = {69--108},
publisher = {Language Science Press},
  year = {2019},
}

% Handbook chapter on multiword expressions (second edition of the handbook).
@InCollection{kimbaldwin,
  author = {Timothy Baldwin and Su Nam Kim},
  booktitle = {{Handbook of Natural Language Processing}},
  title = {Multiword Expressions},
  edition = {2},
  editor = {Nitin Indurkhya and Fred J. Damerau},
  pages = {267--292},
  publisher = {CRC Press},
  address = {Boca Raton, FL},
  year = {2010},
}

% Chapter in the "CLARIN in the Low Countries" volume.
@InCollection{Camp:etal:CLC19,
  author = {Matje van de Camp and Martin Reynaert and Nelleke Oostdijk},
  booktitle = {{CLARIN in the Low Countries}},
  title = {{WhiteLab} 2.0: {A} web interface for corpus exploitation},
  doi = {10.5334/bbi.19},
  editor = {Jan Odijk and Arjan van Hessen},
  pages = {231--243},
  publisher = {Ubiquity Press},
  address = {London, UK},
  year = {2017},
}

@PhdThesis{Gregoire:PhD:2009,
  author = {Nicole Grégoire},
  title = {Untangling Multiword Expressions: {A} study on the representation and variation of {D}utch multiword expressions},
  address = {Utrecht},
  school = {Utrecht University},
  year = {2009},
}

@Book{Firth:57,
  author = {John R.
Firth},
  title = {Papers in Linguistics 1934--1951},
  publisher = {Longmans},
  address = {London, UK},
  year = {1957},
}

@incollection{Clouet/Daille:14,
  author = {Clouet, Elizaveta Loginova and Daille, Béatrice},
  booktitle = {Proceedings of the 1st Workshop on {Computational Approaches to Compound Analysis} {(ComAComA 2014)}},
  editor = {Ben Verhoeven and Walter Daelemans and Menno van Zaanen and Gerhard van Huyssteen},
  title = {Splitting of compound terms in non-prototypical compounding languages},
  pages = {11--19},
  address = {Dublin, Ireland},
  publisher = {ACL},
  doi = {10.3115/v1/W14-5702},
  year = {2014},
}

% Volume 2 of the English Profile Studies series.
@Book{green2012language,
  author = {Green, Anthony},
  title = {Language functions revisited: {Theoretical} and empirical bases for language construct definition across the ability range},
  publisher = {Cambridge University Press},
  location = {Cambridge, UK},
  series = {English Profile Studies},
  number = {2},
  year = {2012},
}

% NOTE(review): last editor spelled "Stainhaouer" per the LREC 2000 proceedings; confirm against the volume.
@incollection{Kunze:00,
  author = {Claudia Kunze},
  booktitle = {Proceedings of the 2nd International {Conference on Language Resources and Evaluation (LREC'00)}},
  title = {Extension and Use of {GermaNet}, a Lexical-Semantic Database},
  editor = {M. Gavrilidou and G. Carayannis and S. Markantonatou and S. Piperidis and G. Stainhaouer},
  pages = {999--1002},
  address = {Athens, Greece},
  publisher = {European Language Resources Association (ELRA)},
  url = {https://aclanthology.org/L00-1274/},
  year = {2000},
}

@Article{GagneEtAl:20,
  author = {Christina L. Gagné and Thomas L. Spalding and Patricia Spicer and Dixie Wong and Beatriz Rubio},
  title = {Is \emph{buttercup} a Kind of Cup? {H}yponymy and Semantic Transparency in Compound Words},
  volume = {113},
  journal = {Journal of Memory and Language},
  year = {2020},
  doi = {10.1016/j.jml.2020.104110},
}

@Article{Costello/Keane:00,
  author = {Fintan J. Costello and Mark T.
Keane},
  title = {Efficient Creativity: {C}onstraint-Guided Conceptual Combination},
  number = {2},
  pages = {299--349},
  volume = {24},
  journal = {Cognitive Science},
  year = {2000},
}

% French monograph on fixed expressions.
@Book{gross-1996,
  author = {Gaston Gross},
  title = {Les expressions figées en français: {Noms} composés et autres locutions},
  langid = {french},
  publisher = {Ophrys},
  address = {Paris},
  year = {1996},
}

@Article{Murphy:90,
  author = {Gregory L. Murphy},
  title = {Noun Phrase Interpretation and Conceptual Combination},
  pages = {259--288},
  volume = {29},
  journal = {Journal of Memory and Language},
  year = {1990},
}

% ACL conference papers.
@incollection{shudo_etal_2011,
  author = {Shudo, Kosho and Kurahone, Akira and Tanabe, Toshifumi},
  booktitle = {Proceedings of the 49th {Annual} {Meeting} of the {Association} for {Computational} {Linguistics}: {Human} {Language} {Technologies}},
  title = {A Comprehensive Dictionary of Multiword Expressions},
  pages = {161--170},
  publisher = {Association for Computational Linguistics},
  address = {Portland, OR},
  year = {2011},
}

@incollection{erk-etal-2003-towards,
  author = {Erk, Katrin and Kowalski, Andrea and Padó, Sebastian and Pinkal, Manfred},
  booktitle = {Proceedings of the 41st {Annual} {Meeting} of the {Association} for {Computational} {Linguistics} ({ACL'03})},
  title = {Towards a Resource for Lexical Semantics: {A} Large {German} Corpus with Extensive Semantic Annotation},
  pages = {537--544},
  publisher = {Association for Computational Linguistics},
  address = {Sapporo, Japan},
  year = {2003},
  doi = {10.3115/1075096.1075164},
}

@Article{duelme,
  author = {Grégoire, Nicole},
  title = {{DuELME: A Dutch electronic lexicon of multiword expressions}},
  doi = {10.1007/s10579-009-9094-z},
  number = {1/2},
  pages = {23--39},
  volume = {44},
  archive = {kast},
  journal = {Language Resources and Evaluation},
  year = {2010},
}

@incollection{Schaefer:15,
  author = {Roland Schäfer},
  booktitle = {Proceedings of the 3rd Workshop on {Challenges in the Management of Large Corpora (CMLC-3)}},
  title =
{Processing and Querying Large Web Corpora with the {COW14} Architecture},
  editor = {Piotr Bański and Hanno Biber and Evelyn Breiteneder and Marc Kupietz and Harald Lüngen and Andreas Witt},
  pages = {28--34},
  address = {Mannheim, Germany},
  year = {2015},
}

@Article{GagneEtAl:19,
  author = {Christina L. Gagné and Thomas L. Spalding and Daniel Schmidtke},
  title = {{LADEC: The} Large Database of {E}nglish Compounds},
  pages = {2152--2179},
  volume = {51},
  journal = {Behavior Research Methods},
  year = {2019},
}

@Book{fellbaum_wordnet_1998,
  title = {{WordNet}: {An} Electronic Lexical Database},
  editor = {Fellbaum, Christiane},
  publisher = {The MIT Press},
  address = {Cambridge, MA},
  year = {1998},
}

% All names in "Last, First" form with spaced initials; the double issue is written as a range.
@Article{Ordelman:2007,
  author = {Ordelman, Roeland J. F. and de Jong, Franciska M. G. and van Hessen, A. J. and Hondorp, G. H. W.},
  title = {{TwNC}: {A} Multifaceted {Dutch} News Corpus},
  number = {3--4},
  volume = {12},
  journal = {ELRA Newsletter},
  year = {2007},
}

@InBook{rown,
  author = {Tufiș, Dan and Barbu Mititelu, Verginica},
  booktitle = {Language Production, Cognition, and the Lexicon},
  title = {The lexical ontology for {R}omanian},
  editor = {Nuria Gala and Reinhard Rapp and Nuria Bel-Enguix},
  pages = {491--504},
  publisher = {Springer},
  location = {Cham},
  year = {2014},
}

@incollection{udpipe,
  author = {Straka, Milan},
  booktitle = {Proceedings of the {C}o{NLL} 2018 Shared Task: {Multilingual} Parsing from Raw Text to Universal Dependencies},
  title = {{UDPipe} 2.0 Prototype at {CoNLL} 2018 {UD} Shared Task},
  doi = {10.18653/v1/K18-2020},
  editor = {Daniel Zeman and Jan Hajič},
  pages = {197--207},
  publisher = {Association for Computational Linguistics},
  address = {Brussels, Belgium},
  year = {2018},
}

@InCollection{SONAR:2013,
  author = {Nelleke Oostdijk and Martin Reynaert and Véronique Hoste and Ineke Schuurman},
  booktitle = {Essential Speech and Language Technology for {D}utch: {Results} by the {STEVIN}-programme},
  title = {The Construction of a 500 Million Word Reference Corpus
of Contemporary Written {Dutch}},
  editor = {Peter Spyns and Jan Odijk},
  doi = {10.1007/978-3-642-30910-6_13},
  pages = {219--247},
  publisher = {Springer},
  address = {Berlin},
  year = {2013},
}

@incollection{mccrae2016representing,
  author = {McCrae, John Philip and Cimiano, Philipp and Buitelaar, Paul and Bordea, Georgeta},
  booktitle = {{PARSEME/ENeL workshop on MWE e-lexicons}},
  title = {Representing multiword expressions on the web with the {OntoLex-Lemon} model},
  year = {2016},
}

@incollection{haspelmath,
  author = {Haspelmath, Martin},
  booktitle = {Causatives and transitivity},
  title = {More on the typology of inchoative/causative verb alternations},
  doi = {10.1075/slcs.23.05has},
  editor = {Bernard Comrie and Maria Polinsky},
  pages = {87--120},
  publisher = {John Benjamins},
  address = {Amsterdam, Philadelphia},
  year = {1993},
  series = {Studies in Language Companion Series},
  number = {23},
}

% Each field may appear only once per entry; a single editor list is kept.
@incollection{watrin2011n,
  author = {Watrin, Patrick and François, Thomas},
  booktitle = {Proceedings of the Workshop on Multiword Expressions: {From} Parsing and Generation to the Real World},
  title = {An n-gram frequency database reference to handle {MWE} extraction in {NLP} applications},
  editor = {Kordoni, Valia and Ramisch, Carlos and Villavicencio, Aline},
  pages = {83--91},
  publisher = {Association for Computational Linguistics},
  location = {Portland, OR},
  url = {https://aclanthology.org/W11-0813},
  year = {2011},
}

% NOTE(review): page range completed to 151--185 from the journal record; confirm via the DOI.
@Article{gross-1982,
  author = {Gross, Maurice},
  title = {Une classification des phrases «figées» du français},
  langid = {french},
  doi = {10.7202/602492ar},
  number = {2},
  pages = {151--185},
  volume = {11},
  journal = {Revue québécoise de linguistique},
  year = {1982},
}

@incollection{copestake_etal_2002,
  author = {Copestake, Ann and Lambeau, Fabre and Villavicencio, Aline and Bond, Francis and Baldwin, Timothy and Sag, Ivan A.
and Flickinger, Dan},
  booktitle = {Proceedings of the Third International {Conference} on {Language} {Resources} and {Evaluation} ({LREC}'02)},
  title = {Multiword expressions: {Linguistic} precision and reusability},
  publisher = {European Language Resources Association (ELRA)},
  address = {Las Palmas, Canary Islands},
  year = {2002},
}

@incollection{Odijk2013,
  author = {Odijk, Jan},
  booktitle = {Essential Speech and Language Technology for {Dutch}: Results by the {STEVIN} programme},
  title = {Identification and lexical representation of multiword expressions},
  doi = {10.1007/978-3-642-30910-6_12},
  editor = {Spyns, Peter and Odijk, Jan},
  pages = {201--217},
  publisher = {Springer},
  address = {Berlin, Heidelberg},
  year = {2013},
}

% "address" is an alias of "location", so the two must not both be set:
% the conference city goes into "venue", the publisher's city stays in "address".
@incollection{NIVRE16.348,
  author = {Joakim Nivre and Marie-Catherine de Marneffe and Filip Ginter and Yoav Goldberg and Jan Hajic and Christopher D. Manning and Ryan McDonald and Slav Petrov and Sampo Pyysalo and Natalia Silveira and Reut Tsarfaty and Daniel Zeman},
  booktitle = {Proceedings of the Tenth International {Conference on Language Resources and Evaluation} ({LREC} 2016)},
  title = {Universal Dependencies v1: {A} Multilingual Treebank Collection},
  editor = {Nicoletta Calzolari and Khalid Choukri and Thierry Declerck and Sara Goggi and Marko Grobelnik and Bente Maegaard and Joseph Mariani and Helene Mazo and Asuncion Moreno and Jan Odijk and Stelios Piperidis},
  venue = {Portorož, Slovenia},
  pages = {1659--1666},
  publisher = {European Language Resources Association (ELRA)},
  address = {Paris, France},
  year = {2016},
}

% arXiv preprint without a journal: typed as an online resource with eprint identifiers.
@Online{romary2019lmf,
  author = {Laurent Romary and Mohamed Khemakhem and Anas Fahad Khan and Jack Bowers and Nicoletta Calzolari and Monte George and Mandy Pet and Piotr Banski},
  title = {{LMF} Reloaded},
  eprint = {1906.02136},
  eprinttype = {arXiv},
  url = {http://arxiv.org/abs/1906.02136},
  year = {2019},
}

@InCollection{forsberg2010can,
  author = {Forsberg, Fanny and Bartning, Inge},
  booktitle = {Communicative proficiency and linguistic development:
{Intersections} between {SLA} and language testing research},
  title = {Can linguistic features discriminate between the communicative {CEFR}-levels? {A} pilot study of written {L2 French}},
  editor = {Bartning, Inge and Martin, Maisa and Vedder, Ineke},
  pages = {133--158},
  publisher = {EuroSLA},
  series = {EuroSLA Monographs},
  number = {1},
  year = {2010},
}

% Theses and journal articles.
@thesis{Marsh:15,
  author = {Charles Marsh},
  title = {Cigarette Helmets and Horse Wars: {T}owards a Better Understanding of Noun Compound Interpretability},
  school = {Department of Computer Science, Princeton University},
  type = {Bachelor thesis},
  year = {2015},
}

@Article{vondricka:2019,
  author = {Pavel Vondřička},
  title = {Design of a multiword expressions database},
  pages = {83--101},
  url = {https://ufal.mff.cuni.cz/pbml/112/art-vondricka.pdf},
  volume = {112},
  ids = {Vondricka:2019},
  journal = {The Prague Bulletin of Mathematical Linguistics},
  year = {2019},
}

@PhdThesis{alfter2021exploring,
  author = {Alfter, David},
  title = {Exploring natural language processing for single-word and multi-word lexical complexity from a second language learner perspective},
  school = {University of Gothenburg},
  year = {2021},
}

@Article{Kochova:Opavska:2016a,
  author = {Kochová, Pavla and Opavská, Zdeňka},
  title = {Akademický slovník současné češtiny: {Z} přípravy {Akademického} slovníku současné češtiny},
  number = {2},
  pages = {57--83},
  url = {https://ujc.avcr.cz/miranda2/export/sitesavcr/ujc/zakladni-informace/pracovnici/files/KochovaOpavskaASSC.pdf},
  volume = {99},
  journal = {Naše řeč},
  year = {2016},
}

% Conference and workshop papers.
@incollection{ELX2014-045,
  author = {Faber, Pamela and Buendía Castro, Miriam},
  booktitle = {Proceedings of the 16th {EURALEX} International Congress},
  title = {{EcoLexicon}},
  editor = {Abel, Andrea and Vettori, Chiara and Ralli, Natascia},
  pages = {601--607},
  publisher = {EURAC Research},
  address = {Bolzano, Italy},
  year = {2014},
}

@incollection{villavicencio-LexicalEncoding,
  author = {Villavicencio, Aline and Copestake, Ann
and Waldron, Benjamin and Lambeau, Fabre},
  booktitle = {Proceedings of the Second {ACL} Workshop on Multiword Expressions: {Integrating} Processing},
  editor = {Takaaki Tanaka and Aline Villavicencio and Francis Bond and Anna Korhonen},
  location = {Barcelona},
  publisher = {ACL},
  title = {Lexical Encoding of {MWEs}},
  pages = {80--87},
  year = {2004},
}

% Same chapter as the entry keyed "kimbaldwin" elsewhere in this file; edition added so both agree.
@InCollection{Baldwin/Kim:10,
  author = {Baldwin, Timothy and Kim, Su Nam},
  booktitle = {Handbook of {Natural Language Processing}},
  title = {Multiword Expressions},
  edition = {2},
  editor = {Indurkhya, Nitin and Damerau, Fred J.},
  pages = {267--292},
  publisher = {CRC Press},
  address = {Boca Raton, FL},
  year = {2010},
}

% Corporate author is double-braced so it is treated as one name.
@Book{akademien2021svensk,
  author = {{Svenska Akademien}},
  title = {{Svensk ordbok utgiven av Svenska Akademien}},
  edition = {2},
  publisher = {Svenska Akademien and Norstedts ordbok},
  url = {https://www.svenskaakademien.se/svenska-spraket/svensk-ordbok-utgiven-av-svenska-akademien-so},
  year = {2021},
}

@Book{forsberg2008langage,
  author = {Forsberg, Fanny},
  title = {Le langage préfabriqué: {Formes}, fonctions et fréquences en français parlé {L2} et {L1}},
  langid = {french},
  publisher = {Peter Lang},
  number = {20},
  series = {Contemporary Studies in Descriptive Linguistics},
  location = {Oxford},
  year = {2008},
}

@incollection{SimovOsenova2014,
  author = {Kiril Simov and Petya Osenova},
  booktitle = {Proceedings of the Thirteenth International Workshop on {Treebanks and Linguistic Theories} ({TLT}13)},
  title = {Formalizing {MultiWords} as catenae in a treebank and in a lexicon},
  editor = {Verena Henrich and Erhard Hinrichs and Daniël de Kok and Petya Osenova and Adam Przepiórkowski},
  pages = {198--207},
  year = {2014},
  location = {Tübingen},
  publisher = {University of Tübingen},
}

@Article{faber_dynamics_2011,
  author = {Faber, Pamela},
  title = {The dynamics of specialized knowledge representation: {Simulational} reconstruction or the perception–action interface},
  number = {1},
  pages = {9--29},
  volume = {17},
  journal =
{Terminology},
  year = {2011},
}

@incollection{savary_etal_2017,
  author = {Savary, Agata and Ramisch, Carlos and Cordeiro, Silvio and Sangati, Federico and Vincze, Veronika and QasemiZadeh, Behrang and Candito, Marie and Cap, Fabienne and Giouli, Voula and Stoyanova, Ivelina and Doucet, Antoine},
  booktitle = {Proceedings of the 13th {Workshop} on {Multiword} {Expressions} ({MWE} 2017)},
  title = {The {PARSEME} Shared Task on Automatic Identification of Verbal Multiword Expressions},
  pages = {31--47},
  publisher = {Association for Computational Linguistics},
  address = {Valencia, Spain},
  year = {2017},
  editor = {Stella Markantonatou and Carlos Ramisch and Agata Savary and Veronika Vincze},
  doi = {10.18653/v1/W17-1704},
}

@InCollection{Osherson2010,
  author = {Osherson, Anne and Fellbaum, Christiane},
  title = {The Representation of Idioms in {WordNet}},
  booktitle = {Principles, construction and application of Multilingual Wordnets: {Proceedings} of the Fifth {Global} {WordNet} {Conference}},
  editor = {Pushpak Bhattacharyya and Christiane Fellbaum and Piek Vossen},
  year = {2010},
  location = {Mumbai, India},
  publisher = {Narosa Publishing House},
}

% The volume title goes in "booktitle"; the book series and its number go in "series" and "number".
@incollection{fellbaum-et-al2009,
  author = {Fellbaum, Christiane and Osherson, Anne and Clark, Peter E.},
  booktitle = {Human Language Technology: {Challenges} of the Information Society ({LTC 2007})},
  title = {Putting semantics into {WordNet’s} “morphosemantic” links},
  editor = {Vetulani, Zygmunt and Uszkoreit, Hans},
  pages = {350--358},
  publisher = {Springer},
  series = {Lecture Notes in Computer Science},
  number = {5603},
  location = {Berlin, Heidelberg},
  year = {2009},
}

@Article{savary_etal_2019,
  author = {Savary, Agata and Cordeiro, Silvio Ricardo and Lichte, Timm and Ramisch, Carlos and Iñurrieta, Uxoa and Giouli, Voula},
  title = {Literal occurrences of multiword expressions: {Rare} birds that cause a stir},
  number = {1},
  pages = {5--54},
  volume = {112},
  journal = {The Prague Bulletin of Mathematical Linguistics},
  year =
{2019},
}

% Thesis.
@PhdThesis{Nastase:03,
  author = {Viviana A. Nastase},
  title = {Semantic relations across syntactic levels},
  school = {School of Information Technology and Engineering, University of Ottawa},
  year = {2003},
}

% Resources and tools: GermaNet, AntConc, LASSY.
@incollection{hamp1997germanet,
  author = {Hamp, Birgit and Feldweg, Helmut},
  booktitle = {Automatic information extraction and building of lexical semantic resources for {NLP} applications},
  title = {{GermaNet}: {A} lexical-semantic net for {German}},
  ids = {Hamp/Feldweg:97},
  url = {https://aclanthology.org/W97-0802},
  year = {1997},
}

@incollection{anthony2005antconc,
  author = {Anthony, Laurence},
  booktitle = {Proceedings of the {International} {Professional} {Communication} {Conference}, 2005 ({IPCC} 2005)},
  title = {{AntConc}: {Design} and development of a freeware corpus analysis toolkit for the technical writing classroom},
  publisher = {IEEE},
  pages = {729--737},
  year = {2005},
}

@incollection{vanNoord:2008,
  author = {Gertjan van Noord},
  title = {Huge Parsed Corpora in {LASSY}},
  booktitle = {Proceedings of the Seventh International Workshop on {Treebanks and Linguistic Theories} ({TLT 7})},
  editor = {Frank van Eynde and Anette Frank and Koenraad de Smedt and Gertjan van Noord},
  pages = {115--126},
  number = {12},
  address = {Groningen},
  series = {LOT Occasional Series},
  publisher = {LOT},
  year = {2008},
}

@Article{Klegr:2016,
  author = {Klégr, Aleš},
  title = {Lexikální kolokace: {Základní} přehled o vývoji pojetí},
  number = {1},
  langid = {czech},
  pages = {95--103},
  url = {http://hdl.handle.net/20.500.11956/96860},
  volume = {98},
  journal = {Časopis pro moderní filologii},
  year = {2016},
}

@InCollection{Does:etal:CLC20,
  author = {Jesse de Does and Jan Niestadt and Katrien Depuydt},
  booktitle = {{CLARIN} in the {Low} {Countries}},
  title = {Creating Research Environments with {BlackLab}},
  doi = {10.5334/bbi.20},
  editor = {Jan Odijk and Arjan van Hessen},
  pages = {245--257},
  publisher = {Ubiquity Press},
  address = {London, UK},
  year = {2017},
}
% The volume editors belong in the "editor" field; other field names are ignored by styles.
@InCollection{lyngfelt2018constructicography,
  author = {Lyngfelt, Benjamin and Bäckström, Linnéa and Borin, Lars and Ehrlemark, Anna and Rydstedt, Rudolf},
  booktitle = {Constructicography: {Constructicon} Development Across Languages},
  title = {Constructicography at work: {Theory} meets practice in the {Swedish} constructicon},
  pages = {41--106},
  publisher = {John Benjamins},
  address = {Amsterdam/Philadelphia},
  editor = {Lyngfelt, Benjamin and Borin, Lars and Ohara, Kyoko and Timponi Torrent, Tiago},
  year = {2018},
  doi = {10.1075/cal.22.03lyn},
}

@Article{Nunberg_etal_1994,
  author = {Nunberg, Geoffrey and Sag, Ivan A. and Wasow, Thomas},
  title = {Idioms},
  number = {3},
  pages = {491--538},
  volume = {70},
  journal = {Language},
  year = {1994},
}

@Article{paquot2019phraseological,
  author = {Paquot, Magali},
  title = {The phraseological dimension in interlanguage complexity research},
  number = {1},
  pages = {121--145},
  volume = {35},
  journal = {Second Language Research},
  year = {2019},
}

@Article{MurakiEtAl:22,
  author = {Emiko J. Muraki and Summer Abdalla and Marc Brysbaert and Penny M.
Pexman},
  title = {Concreteness Ratings for 62 Thousand {E}nglish Multiword Expressions},
  year = {2022},
  doi = {10.31234/osf.io/m397u},
}

@InCollection{timm_lichte_2019_2579033,
  author = {Timm Lichte and Simon Petitjean and Agata Savary and Jakub Waszczuk},
  booktitle = {Representation and parsing of multiword expressions},
  title = {Lexical encoding formats for multi-word expressions: {The} challenge of ``irregular'' regularities},
  doi = {10.5281/zenodo.2579033},
  editor = {Yannick Parmentier and Jakub Waszczuk},
  location = {Berlin},
  pages = {1--33},
  publisher = {Language Science Press},
  year = {2019},
}

% A numeric issue within a volume is recorded in "number".
@Article{OGrady,
  author = {William O'Grady},
  title = {The Syntax of Idioms},
  number = {2},
  pages = {279--312},
  volume = {16},
  journal = {Natural Language and Linguistic Theory},
  year = {1998},
}

% The compound surname is braced so the lowercase "im" is not read as a name particle.
@incollection{Bott/SchulteImWalde:17,
  author = {Bott, Stefan and {Schulte im Walde}, Sabine},
  booktitle = {Proceedings of the 13th Workshop on Multiword Expressions {(MWE 2017)}},
  title = {Factoring Ambiguity out of the Prediction of Compositionality for {G}erman Multi-Word Expressions},
  editor = {Stella Markantonatou and Carlos Ramisch and Agata Savary and Veronika Vincze},
  doi = {10.18653/v1/W17-1708},
  pages = {66--72},
  address = {Valencia, Spain},
  year = {2017},
}

@Article{miller,
  author = {Miller, George A.},
  title = {{WordNet}: {A} Lexical Database for {English}},
  number = {11},
  pages = {39--41},
  volume = {38},
  journal = {Communications of the ACM},
  year = {1995},
}

@Book{Temmerman:2000,
  author = {Temmerman, Rita},
  title = {Toward new ways of terminology description: {The} sociocognitive approach},
  publisher = {John Benjamins},
  address = {Amsterdam, Philadelphia},
  year = {2000},
}

@incollection{straka_strakova_2017,
  author = {Straka, Milan and Straková, Jana},
  booktitle = {Proceedings of the {CoNLL} 2017 Shared Task: {Multilingual} Parsing from Raw Text to Universal Dependencies},
  title = {Tokenizing, {POS} Tagging, Lemmatizing and Parsing {UD} 2.0 with {UDPipe}},
  pages =
{88--99},
  publisher = {Association for Computational Linguistics},
  address = {Vancouver, Canada},
  year = {2017},
}

@InCollection{cowie1994phraseology,
  author = {Cowie, Anthony P.},
  booktitle = {Encyclopedia of Language and Linguistics},
  title = {Phraseology},
  editor = {Asher, R. E.},
  pages = {3168--3171},
  location = {Oxford},
  publisher = {Pergamon},
  year = {1994},
}

@incollection{calzolari_etal_2002,
  author = {Calzolari, Nicoletta and Fillmore, Charles J. and Grishman, Ralph and Ide, Nancy and Lenci, Alessandro and MacLeod, Catherine and Zampolli, Antonio},
  booktitle = {Proceedings of the Third International {Conference} on {Language} {Resources} and {Evaluation} ({LREC}'02)},
  title = {Towards Best Practice for Multiword Expressions in Computational Lexicons},
  pages = {1934--1940},
  publisher = {European Language Resources Association (ELRA)},
  address = {Las Palmas, Canary Islands},
  year = {2002},
}

% City and publisher are stored in separate fields so the style decides how to join them.
@Book{papadimitrioudiap,
  author = {Papadimitriou, Panayotis},
  title = {{Τα Πομάκικα: Συγχρονική περιγραφή μιας νότιας τοπικής ποικιλίας της αναλυτικής σλαβικής από τη Μύκη του Ν. Ξάνθης}},
  publisher = {Kyriakides Bros},
  location = {Thessaloniki},
  year = {2008},
}

@incollection{borin_etal_2010,
  author = {Borin, Lars and Danélls, Dana and Forsberg, Markus and Kokkinakis, Dimitrios and Gronostaj, Maria Toporowska},
  booktitle = {Proceedings of the 14th {EURALEX} {International} {Congress}},
  title = {The Past Meets the Present in {Swedish} {FrameNet++}},
  pages = {269--281},
  year = {2010},
}

@incollection{yong-etal-2022-frame,
  author = {Yong, Zheng Xin and Watson, Patrick D.
and Timponi Torrent, Tiago and Czulo, Oliver and Baker, Collin},
  booktitle = {Proceedings of the Thirteenth {Language} {Resources} and {Evaluation} {Conference} ({LREC'13})},
  title = {Frame Shift Prediction},
  pages = {976--986},
  publisher = {European Language Resources Association (ELRA)},
  address = {Marseille, France},
  year = {2022},
}

% Book chapters.
@incollection{mel2006explanatory,
  author = {Mel’čuk, Igor},
  title = {Explanatory combinatorial dictionary},
  pages = {225--355},
  booktitle = {Open Problems in Linguistics and Lexicography},
  editor = {Giandomenico Sica},
  publisher = {Polimetrica},
  location = {Monza, Italy},
  year = {2006},
  ids = {ECD},
}

@InCollection{Odijk:etal:PaQu,
  author = {Jan Odijk and Gertjan van Noord and Peter Kleiweg and Erik {Tjong Kim Sang}},
  booktitle = {{CLARIN} in the {L}ow {C}ountries},
  title = {The Parse and Query ({PaQu}) Application},
  chapter = {23},
  doi = {10.5334/bbi.23},
  editor = {Jan Odijk and Arjan van Hessen},
  pages = {281--297},
  publisher = {Ubiquity Press},
  address = {London, UK},
  year = {2017},
}

% Expert-meeting document; described in the note field.
@misc{unesco,
  author = {Brenzinger, Matthias and Yamamoto, Akira and Aikawa, Noriko and Koundiouba, Dmitri and Minasyan, Anahit and Dwyer, Arienne and Grinevald, Colette and Krauss, Michael and Miyaoka, Osahito and Sakiyama, Osamu and Villalón, María E. and Yamamoto, Akira Y. and Zepeda, Ofelia},
  title = {Language vitality and endangerment},
  note = {Document submitted to the International Expert Meeting on {UNESCO} {Programme Safeguarding of Endangered Languages}},
  year = {2003},
}

@Article{Taft/Forster:75,
  author = {Marcus Taft and Kenneth I. Forster},
  title = {Lexical Storage and Retrieval of Prefixed Words},
  pages = {638--648},
  volume = {14},
  journal = {Journal of Verbal Learning and Verbal Behavior},
  year = {1975},
}

@InCollection{faber_2015,
  author = {Faber, Pamela},
  booktitle = {Handbook of {Terminology}},
  title = {Frames as a framework for terminology},
  editor = {Kockaert, Hendrik J.
and Steurs, Frieda}, publisher = {John Benjamins}, volume = {1}, address = {Amsterdam/Philadelphia}, year = {2015}, }

@book{MultiWordExpressionsandMorphology,
  author = {Francesca Masini},
  title = {Multi-Word Expressions and Morphology},
  location = {Oxford},
  publisher = {Oxford University Press},
  year = {2019},
}

@incollection{VanNoord:2006,
  author = {Gertjan van Noord},
  booktitle = {Actes de la 13ème conférence sur le {Traitement Automatique des Langues Naturelles} ({TALN 2006})},
  title = {At last parsing is now operational},
  editor = {P. Mertens and C. Fairon and A. Dister and P. Watrin},
  pages = {20--42},
  address = {Leuven, Belgium},
  publisher = {ATALA},
  year = {2006},
  url = {https://aclanthology.org/2006.jeptalnrecital-invite.2},
}

@incollection{gala2014modele,
  author = {Gala, Núria and François, Thomas and Bernhard, Delphine and Fairon, Cédrick},
  booktitle = {{Proceedings of TALN 2014}},
  title = {Un modèle pour prédire la complexité lexicale et graduer les mots},
  editor = {Blache, Philippe and Béchet, Frédéric and Bigi, Brigitte},
  pages = {91--102},
  publisher = {Association pour le Traitement Automatique des Langues},
  langid = {french},
  url = {https://aclanthology.org/F14-2000},
  year = {2014},
}

@incollection{volodina2014you,
  author = {Volodina, Elena and Pilán, Ildikó and Eide, Stian Rødven and Heidarsson, Hannes},
  booktitle = {Proceedings of the 3rd Workshop on {NLP} for Computer-Assisted Language Learning ({NLP4CALL})},
  title = {You get what you annotate: {A} pedagogically annotated corpus of coursebooks for {Swedish} as a second language},
  editor = {Volodina, Elena and Borin, Lars and Pilán, Ildikó},
  pages = {128--144},
  url = {https://aclanthology.org/W14-3500},
  year = {2014},
}

% Editors use the comma form so the compound surnames are parsed as surnames.
@incollection{boas_2002,
  author = {Boas, Hans C.},
  booktitle = {Proceedings of the Third International {Conference} on {Language} {Resources} and {Evaluation}},
  title = {Bilingual {FrameNet} {Dictionaries} for {Machine} {Translation}},
  editor = {González Rodríguez, M. and Suárez Araujo, C. Paz},
  pages = {1364--1371},
  publisher = {European Language Resources Association (ELRA)},
  address = {Las Palmas, Spain},
  year = {2002},
}

% {Van Eynde} is braced so the capitalised particle stays part of the surname.
@incollection{AUGUSTINUS12.756,
  author = {Liesbeth Augustinus and Vincent Vandeghinste and Frank {Van Eynde}},
  booktitle = {Proceedings of the Eighth International Conference on {Language Resources and Evaluation} ({LREC} 2012)},
  title = {Example-Based Treebank Querying},
  editor = {Nicoletta Calzolari and Khalid Choukri and Thierry Declerck and Mehmet Uğur Doğan and Bente Maegaard and Joseph Mariani and Asunción Moreno and Jan Odijk and Stelios Piperidis},
  pages = {3161--3167},
  publisher = {European Language Resources Association (ELRA)},
  address = {Istanbul, Turkey},
  year = {2012},
}

@incollection{franccois2016svalex,
  author = {François, Thomas and Volodina, Elena and Pilán, Ildikó and Tack, Anaïs},
  booktitle = {Proceedings of the tenth International Conference on {Language Resources and Evaluation} ({LREC})},
  title = {{SVALex: A CEFR-graded lexical resource for Swedish foreign and second language learners}},
  editor = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Goggi, Sara and Grobelnik, Marko and Maegaard, Bente and Mariani, Joseph and Mazo, Hélène and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios},
  pages = {213--219},
  url = {https://aclanthology.org/L16-1},
  year = {2016},
}

@article{Savary2008,
  author = {Savary, Agata},
  title = {Computational Inflection of Multi-Word Units: {A} contrastive study of lexical approaches},
  doi = {10.33011/lilt.v1i.1195},
  volume = {1},
  journal = {Linguistic Issues in Language Technology},
  year = {2008},
}

@incollection{schneider_etal_2016, author = {Schneider, Nathan and Hovy, Dirk and Johannsen, Anders and Carpuat, Marine}, booktitle = {Proceedings of the 10th International Workshop on {Semantic} {Evaluation} ({SemEval}-2016)}, title = {{SemEval}-2016 Task 10: {Detecting} Minimal Semantic Units and their Meanings ({DiMSUM})}, pages = {546--559}, 
publisher = {Association for Computational Linguistics}, address = {San Diego, California}, year = {2016}, }

% NOTE(review): pp. 23--39 of vol. 44 fall in the double issue 1--2; confirm against the DOI landing page.
@article{Grégoire2010,
  author = {Grégoire, Nicole},
  title = {{DuELME}: {A} {Dutch} electronic lexicon of multiword expressions},
  doi = {10.1007/s10579-009-9094-z},
  number = {1--2},
  pages = {23--39},
  volume = {44},
  journal = {Language Resources and Evaluation},
  year = {2010},
}

@book{Cermak:2007,
  author = {Čermák, František},
  title = {Czech and general phraseology},
  publisher = {Karolinum},
  address = {Prague},
  year = {2007},
}

@article{erman2000idiom,
  author = {Erman, Britt and Warren, Beatrice},
  title = {The idiom principle and the open choice principle},
  number = {1},
  pages = {29--62},
  volume = {20},
  journal = {Text \& Talk},
  publisher = {De Gruyter Mouton},
  year = {2000},
}

@book{Cermak:2009,
  author = {Čermák, František and others},
  title = {{Slovník české frazeologie a idiomatiky (SČFI)}},
  publisher = {Academia/Leda},
  volume = {1--4},
  address = {Praha},
  year = {1983--2009},
}

@book{papadimitrioudial,
  author = {Papadimitriou, Panayotis},
  title = {{Λαλιές Πομάκων της ελληνικής Ροδόπης: Περιφερειακή Αναλυτική Σλαβική και μουσουλμάνοι ομιλητές στη Νοτιοανατολική Ευρώπη}},
  publisher = {Institute for Balkan Studies},
  location = {Thessaloniki},
  year = {2013},
}

@InCollection{adamou, author = {Adamou, Evangelia and Fanciullo, Davide}, booktitle = {Linguistic regionalism in {Eastern Europe} and beyond: {Minority}, regional and literary microlanguages}, title = {{Why Pomak will not be the next Slavic literary language}}, editor = {D. Stern and M. Nomachi and B. 
Belić}, pages = {40--65}, publisher = {Peter Lang}, url = {https://halshs.archives-ouvertes.fr/halshs-02105739}, address = {Berlin}, year = {2018}, }

@incollection{gross-2010-chains,
  author = {Groß, Thomas},
  booktitle = {Proceedings of the 24th {Pacific} {Asia} Conference on Language, Information and Computation},
  title = {Chains in Syntax and Morphology},
  editor = {Otoguro, Ryo and Ishikawa, Kiyoshi and Umemoto, Hiroshi and Yoshimoto, Kei and Harada, Yasunari},
  pages = {143--152},
  publisher = {Institute of Digital Enhancement of Cognitive Processing, Waseda University},
  url = {https://aclanthology.org/Y10-1018},
  address = {Tohoku University, Sendai, Japan},
  year = {2010},
}

@incollection{tayyar_madabushi_etal_2022,
  author = {Tayyar Madabushi, Harish and Gow-Smith, Edward and Garcia, Marcos and Scarton, Carolina and Idiart, Marco and Villavicencio, Aline},
  booktitle = {Proceedings of the 16th International Workshop on {Semantic} {Evaluation} ({SemEval-2022})},
  title = {{SemEval-2022} {Task} 2: {Multilingual} Idiomaticity Detection and Sentence Embedding},
  pages = {107--121},
  publisher = {Association for Computational Linguistics},
  address = {Seattle, WA},
  year = {2022},
}

% The acronym is braced so sentence-casing styles do not lowercase it.
@incollection{markantonatou-etal-in-prep,
  author = {Markantonatou, Stella and Minos, Panagiotis and Zakis, George and Koletti, Erasmia and Margariti, Elpiniki and Stripeli, Emilia},
  booktitle = {Multiword expressions in {Greek}: {Deltio} Epistimonikis Orologias ke Neologismon},
  title = {{IDION} ({IΔΙΟΝ}): {A} lexicographic environment for the documentation of {Greek} idioms},
  editor = {Markantonatou, Stella and Christofidou, Anastasia},
  year = {2020},
}

@incollection{franccois2014flelex, author = {François, Thomas and Gala, Núria and Watrin, Patrick and Fairon, Cédrick}, booktitle = {Proceedings of the ninth international conference on {Language Resources and Evaluation} ({LREC'14})}, title = {{FLELex: A graded lexical resource for French foreign learners}}, editor = {Calzolari, Nicoletta and Choukri, 
Khalid and Declerck, Thierry and Loftsson, Hrafn and Maegaard, Bente and Mariani, Joseph and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios}, pages = {3766--3773}, url = {https://aclanthology.org/L14-1}, location = {Reykjavik, Iceland}, publisher = {European Language Resources Association (ELRA)}, year = {2014}, }

% location is the field styles print; an unknown field name would be silently ignored.
@incollection{lindstrom2022MWE,
  author = {Lindström Tiedemann, Therese and Alfter, David and Volodina, Elena},
  booktitle = {{Svenskan i Finland 19: Föredrag vid den nittonde sammankomsten för beskrivningen av svenskan i Finland, Vasa den 6–7 maj 2021}},
  title = {{CEFR-nivåer och svenska flerordsuttryck}},
  editor = {Björklund, Siv and Haagensen, Bodil and Nordman, Marianne and Westerlund, Anders},
  pages = {218--233},
  publisher = {Svensk-österbottniska samfundet},
  location = {Vasa},
  year = {2022},
}

@article{UD,
  author = {de Marneffe, Marie-Catherine and Manning, Christopher D. and Nivre, Joakim and Zeman, Daniel},
  title = {Universal dependencies},
  doi = {10.1162/coli_a_00402},
  number = {2},
  pages = {255--308},
  volume = {47},
  journal = {Computational Linguistics},
  year = {2021},
}

@incollection{pawley1983two,
  author = {Pawley, Andrew and Syder, Frances Hodgetts},
  booktitle = {Language and communication},
  title = {Two puzzles for linguistic theory: {Nativelike} selection and nativelike fluency},
  editor = {Richards, Jack C. and Schmidt, R. W.},
  pages = {203--239},
  publisher = {Routledge},
  year = {1983},
}

% Reports name their issuing body in institution, the required field for this entry type.
@techreport{LASSY:SA-MAN,
  author = {Gertjan van Noord and Ineke Schuurman and Gosse Bouma},
  institution = {RU Groningen},
  title = {{Lassy syntactische annotatie (Revision 19455)}},
  type = {{LASSY Report}},
  url = {https://www.let.rug.nl/vannoord/Lassy/sa-man_lassy.pdf},
  address = {Groningen},
  year = {2011},
}

@book{krippendorff1980,
  author = {Krippendorff, Klaus},
  title = {Content {Analysis}: {An} Introduction to Its Methodology},
  publisher = {Sage},
  address = {Beverly Hills, CA},
  year = {1980},
}

@InCollection{krimpas2022, author = {Panagiotis G. 
Krimpas}, booktitle = {{Γλωσσανθοί: Μελέτες αφιερωμένες στην Πηνελόπη Καμπάκη-Βουγιουκλή}}, title = {{Ευρωγλωσσολογία, νεοελληνική γλώσσα και ευρωπαϊκή ολοκλήρωση}}, editor = {Zoe Gavriilidou and Nikolaos Mathioudakis and Maria Mitsiaki and Asimakis Fliatouras}, pages = {153--169}, location = {Athens}, publisher = {Herodotus, Democritus University of Thrace}, year = {2022}, }

@incollection{LaporteVoyatzi_2008,
  author = {Laporte, Éric and Voyatzi, Stavroula},
  booktitle = {Proceedings of the {LREC} Workshop Towards a Shared Task for {Multiword} {Expressions} ({MWE 2008})},
  title = {An Electronic Dictionary of {French} Multiword Adverbs},
  pages = {31--34},
  year = {2008},
}

@incollection{laport,
  author = {Laporte, Éric},
  booktitle = {Multiword Expressions: {Insights} from a Multi-lingual Perspective},
  title = {Choosing features for classifying multiword expressions},
  doi = {10.5281/zenodo.1182597},
  editor = {Sailer, Manfred and Markantonatou, Stella},
  pages = {143--186},
  publisher = {{Language Science Press}},
  address = {Berlin},
  year = {2018},
}

@incollection{Colson:2017,
  author = {Colson, Jean-Pierre},
  booktitle = {{Computational and corpus-based phraseology}},
  title = {{The IdiomSearch experiment: Extracting phraseology from a probabilistic network of constructions}},
  editor = {Mitkov, Ruslan},
  pages = {16--28},
  publisher = {Springer},
  address = {Cham},
  year = {2017},
}

@incollection{nielsen,
  author = {Nielsen, Jakob and Molich, Rolf},
  booktitle = {{Proceedings of the SIGCHI conference on human factors in computing systems (CHI'90)}},
  title = {Heuristic evaluation of user interfaces},
  doi = {10.1145/97243.97281},
  pages = {249--256},
  year = {1990},
}

@incollection{inurrieta-etal-2018-konbitzul, author = {Iñurrieta, Uxoa and Aduriz, Itziar and Díaz de Ilarraza, Arantza and Labaka, Gorka and Sarasola, Kepa}, booktitle = {{Proceedings of the eleventh international Conference on Language Resources and Evaluation ({LREC} 2018)}}, title = {{Konbitzul}: {An} 
{MWE}-specific database for {Spanish}-{Basque}}, publisher = {European Language Resources Association (ELRA)}, url = {https://aclanthology.org/L18-1397}, address = {Miyazaki, Japan}, year = {2018}, }

@techreport{mccrae2010lemon,
  author = {McCrae, John Philip and Aguado-de-Cea, Guadalupe and Buitelaar, Paul and Cimiano, Philipp and Declerck, Thierry and Gómez Pérez, Asunción and Gracia, Jorge and Hollink, Laura and Montiel-Ponsoda, Elena and Spohr, Dennis and others},
  title = {{The lemon cookbook}},
  url = {https://lemon-model.net/lemon-cookbook},
  year = {2010},
}

@article{LibbenEtAl:03,
  author = {Gary Libben and Martha Gibson and Yeo Bom Yoon and Dominiek Sandra},
  title = {Compound Fracture: {The} Role of Semantic Transparency and Morphological Headedness},
  pages = {50--64},
  volume = {84},
  journal = {Brain and Language},
  year = {2003},
}

@incollection{tack2018nt2lex,
  author = {Tack, Anaïs and François, Thomas and Desmet, Piet and Fairon, Cédrick},
  booktitle = {{Proceedings of the 13th workshop on innovative use of NLP for Building Educational Applications (BEA)}},
  title = {{NT2Lex: A CEFR-graded lexical resource for Dutch as a foreign language linked to open Dutch WordNet}},
  editor = {Tetreault, Joel and Burstein, Jill and Kochmar, Ekaterina and Leacock, Claudia and Yannakoudakis, Helen},
  pages = {137--146},
  publisher = {Association for Computational Linguistics},
  url = {https://aclanthology.org/W18-05},
  location = {New Orleans, LA},
  year = {2018},
}

@article{GamalloEtAl:19,
  author = {Pablo Gamallo and Susana Sotelo and Jose Ramom Pichel and Mikel Artetxe},
  title = {Contextualized Translations of Phrasal Verbs with Distributional Compositional Semantics and Monolingual Corpora},
  number = {3},
  pages = {395--421},
  volume = {45},
  journal = {Computational Linguistics},
  year = {2019},
}

@Article{constandinidestrip, author = {Constantinides, Nicolaos Th.}, title = {{Συγκλίσεις και αποκλίσεις στην Πομακική της ελληνικής Θράκης αφορούσες τα πεδία της αοριστίας, της 
οριστικότητας και του τριμερούς προσδιορισμού υπό το πρίσμα μιας σύνθετης λαογραφικής θεώρησης. (`Convergences and divergences in the {Pomak of Greek Thrace} concerning the fields of indeterminacy, finality and tripartite determination in the light of a complex folklore view')}}, pages = {56--76}, volume = {8}, number = {1}, journal = {Mare Ponticum}, year = {2020}, }

@incollection{joshi-etal-2020-state,
  author = {Joshi, Pratik and Santy, Sebastin and Budhiraja, Amar and Bali, Kalika and Choudhury, Monojit},
  booktitle = {{Proceedings of the 58th annual meeting of the Association for Computational Linguistics}},
  title = {The state and fate of linguistic diversity and inclusion in the {NLP} world},
  editor = {Dan Jurafsky and Joyce Chai and Natalie Schluter and Joel Tetreault},
  doi = {10.18653/v1/2020.acl-main.560},
  pages = {6282--6293},
  publisher = {Association for Computational Linguistics},
  url = {https://aclanthology.org/2020.acl-main.560},
  address = {Online},
  year = {2020},
}

@article{alpino-paper-2,
  author = {Gosse Bouma and Gertjan van Noord and Robert Malouf},
  title = {{Alpino: Wide-coverage computational analysis of {Dutch}}},
  number = {1},
  pages = {45--59},
  volume = {37},
  journal = {Language and Computers},
  year = {2001},
}

% Publisher is spelled out in full, as in the other ACL entries of this file.
@incollection{SalehiEtAl:14b,
  author = {Bahar Salehi and Paul Cook and Timothy Baldwin},
  booktitle = {Proceedings of the 14th Conference of the {European} Chapter of the {Association for Computational Linguistics}},
  title = {Using Distributional Similarity of Multi-way Translations to Predict Multiword Expression Compositionality},
  pages = {472--481},
  address = {Gothenburg, Sweden},
  editor = {Shuly Wintner and Sharon Goldwater and Stefan Riezler},
  doi = {10.3115/v1/E14-1050},
  publisher = {Association for Computational Linguistics},
  year = {2014},
}

@incollection{alfter2016distributions, author = {Alfter, David and Bizzoni, Yuri and Agebjörn, Anders and Volodina, Elena and Pilán, Ildikó}, booktitle = {{Proceedings of the joint Workshop on NLP for Computer-Assisted Language 
Learning and NLP for Language Acquisition (NLP4CALL \& NLP4LA)}}, title = {{From distributions to labels: A lexical proficiency analysis using learner corpora}}, editor = {Volodina, Elena and Grigonytė, Gintarė and Pilán, Ildikó and Nilsson Björkenstam, Kristina and Borin, Lars}, pages = {1--7}, location = {Umeå}, publisher = {Linköping University Electronic Press}, year = {2016}, url = {https://aclanthology.org/W16-6501} }

@article{de2010alignment,
  author = {de Caseli, Helena Medeiros and Ramisch, Carlos and das Graças Volpe Nunes, Maria and Villavicencio, Aline},
  title = {Alignment-based extraction of multiword expressions},
  pages = {59--77},
  volume = {44},
  journal = {Language Resources and Evaluation},
  year = {2010},
}

@incollection{Pasquer:etal:2018,
  author = {Pasquer, Caroline and Savary, Agata and Antoine, Jean-Yves and Ramisch, Carlos},
  booktitle = {{Proceedings of the 2018 conference of the {North American} Chapter of the Association for Computational Linguistics: Human language technologies, Volume 2 (Short Papers)}},
  title = {Towards a Variability Measure for Multiword Expressions},
  doi = {10.18653/v1/N18-2068},
  pages = {426--432},
  editor = {Marilyn Walker and Heng Ji and Amanda Stent},
  publisher = {Association for Computational Linguistics},
  address = {New Orleans, LA},
  year = {2018},
}

% No terminal period in booktitle: the bibliography style supplies the punctuation.
@incollection{mccrae2017ontolex,
  author = {McCrae, John Philip and Bosque-Gil, Julia and Gracia, Jorge and Buitelaar, Paul and Cimiano, Philipp},
  booktitle = {{Proceedings of fifth biennial Conference on Electronic Lexicography, eLex 2017}},
  title = {The {Ontolex-Lemon} model: Development and applications},
  pages = {19--21},
  year = {2017},
}

@book{jespersen,
  author = {Jespersen, Otto},
  title = {A {Modern English} grammar on historical principles},
  volume = {6: {Morphology}},
  location = {London},
  publisher = {Allen \& Unwin},
  year = {1965},
}

@incollection{gregoire-2007, author = {Grégoire, Nicole}, booktitle = {{Proceedings of the Workshop on A Broader Perspective on 
Multiword Expressions}}, editor = {Nicole Grégoire and Stefan Evert and Su Nam Kim}, title = {Design and Implementation of a Lexicon of {Dutch} Multiword Expressions}, pages = {17--24}, publisher = {Association for Computational Linguistics}, url = {https://aclanthology.org/W07-1103}, address = {Prague}, year = {2007}, }

@incollection{baccianella-et-al2010,
  author = {Baccianella, Stefano and Esuli, Andrea and Sebastiani, Fabrizio},
  booktitle = {{Proceedings of the seventh international Conference on Language Resources and Evaluation ({LREC}'10)}},
  title = {{SentiWordNet} 3.0: {An} enhanced lexical resource for sentiment analysis and opinion mining},
  publisher = {European Language Resources Association (ELRA)},
  url = {http://www.lrec-conf.org/proceedings/lrec2010/pdf/769_Paper.pdf},
  address = {Valletta, Malta},
  year = {2010},
}

@book{brewer1991brewer,
  author = {Brewer, Ebenezer Cobham and Isaacs, Alan and Pickering, David and Martin, Elizabeth A.},
  title = {Brewer's dictionary of 20th-century phrase and fable},
  publisher = {Cassell},
  year = {1991},
}

@mastersthesis{Constantinides,
  author = {Constantinides, Nicolaos Th.},
  school = {Democritus University of Thrace},
  title = {{Η πομακική πολιτισμική μονάδα στην ελληνική Θράκη από άποψη Παρευξεινίων Σπουδών: Σύντομη ιστορική επισκόπηση, γλώσσα, ταυτότητες}},
  year = {2007},
}

@article{TorrentEllsworth2013,
  author = {Timponi Torrent, Tiago and Ellsworth, Michael},
  title = {Behind the labels: {Criteria} for defining analytical categories in {FrameNet} {Brasil}},
  pages = {44--65},
  volume = {17},
  journal = {Veredas},
  url = {https://periodicos.ufjf.br/index.php/veredas/article/view/25403},
  year = {2013},
}

@incollection{petruck-ellsworth-2016-representing, author = {Petruck, Miriam R. L. 
and Ellsworth, Michael}, booktitle = {Proceedings of the 12th Workshop on {Multiword} {Expressions}}, title = {Representing Support Verbs in {FrameNet}}, pages = {72--77}, publisher = {Association for Computational Linguistics}, address = {Berlin}, year = {2016}, }

@book{gross_methodes_1975,
  author = {Gross, Maurice},
  title = {Méthodes en syntaxe: {Régime} des constructions complétives},
  langid = {french},
  publisher = {Hermann},
  address = {Paris},
  ids = {gross-methodes-1975},
  year = {1975},
}

@incollection{SalehiEtAl:15b,
  author = {Bahar Salehi and Nitika Mathur and Paul Cook and Timothy Baldwin},
  booktitle = {Proceedings of the 11th Workshop on Multiword Expressions},
  title = {The Impact of Multiword Expression Compositionality on Machine Translation Evaluation},
  pages = {54--59},
  address = {Denver, CO},
  year = {2015},
}

% {FrameNet} is braced so sentence-casing styles keep the inner capital.
@article{Salomão2009,
  author = {Salomão, Maria Margarida M.},
  title = {{FrameNet} {Brasil}: {Um} trabalho em progresso},
  number = {3},
  pages = {171--182},
  volume = {7},
  journal = {Caleidoscópio},
  sortname = {Salomao, Maria Margarida M.},
  year = {2009},
}

@article{2012-The-Bulgarian-National-Co,
  author = {Koeva, Svetla and Stoyanova, Ivelina and Leseva, Svetlozara and Dekova, Rositsa and Dimitrova, Tsvetana and Tarpomanova, Ekaterina},
  title = {The {Bulgarian} {National} {Corpus}: {Theory} and practice in corpus design},
  doi = {10.15398/jlm.v0i1.33},
  number = {1},
  pages = {65--110},
  journal = {Journal of Language Modelling},
  year = {2012},
}

% Publisher is spelled as in the sibling chapter of the same volume (Odijk:etal:PaQu).
@incollection{Augustinusetal:GrETEL:2017,
  author = {Liesbeth Augustinus and Vincent Vandeghinste and Ineke Schuurman and Frank {Van Eynde}},
  booktitle = {{CLARIN} in the {Low} {Countries}},
  title = {{GrETEL}: {A} Tool for Example-Based Treebank Mining},
  chapter = {22},
  doi = {10.5334/bbi.22},
  editor = {Jan Odijk and Arjan van Hessen},
  pages = {269--280},
  publisher = {Ubiquity Press},
  address = {London, UK},
  year = {2017},
}

@incollection{EichelEtAl:23, author = {Eichel, Annerose and Schlipf, Helena and {Schulte 
im Walde}, Sabine}, booktitle = {Proceedings of the 17th Conference of the {European} Chapter of the {Association for Computational Linguistics}}, title = {\textit{{Made} of Steel?} {Learning} Plausible Materials for Components in the Vehicle Repair Domain}, pages = {1420--1435}, address = {Dubrovnik, Croatia}, year = {2023}, }

% number carries the numeric issue within the volume.
@article{capel2012completing,
  author = {Capel, Annette},
  title = {{Completing the English vocabulary profile: C1 and C2 vocabulary}},
  number = {1},
  volume = {3},
  journal = {English Profile Journal},
  year = {2012},
}

% Editor names follow "Last, First"; a second comma would turn a given name into a Jr part.
@incollection{borin2012korp,
  author = {Borin, Lars and Forsberg, Markus and Roxendal, Johan},
  booktitle = {Proceedings of the eighth international conference on {Language Resources and Evaluation} ({LREC})},
  title = {{Korp: The corpus infrastructure of Språkbanken}},
  editor = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Doğan, Mehmet Uğur and Maegaard, Bente and Mariani, Joseph and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios},
  pages = {474--478},
  publisher = {European Language Resources Association (ELRA)},
  year = {2012},
}

@book{Burger:Dobrovolskij:eds:2007,
  title = {{Phraseology: An international handbook of contemporary research}},
  editor = {Burger, Harald and Dobrovol'skij, Dmitri and Kühn, Peter and Norrick, Neal R.},
  publisher = {Walter de Gruyter},
  address = {Berlin},
  year = {2007},
}

@book{Kochova:Opavska:2016,
  title = {Kapitoly z koncepce: {Akademického} slovníku současné češtiny},
  editor = {Kochová, Pavla and Opavská, Zdeňka},
  publisher = {Ústav pro jazyk český AV ČR},
  address = {Praha},
  year = {2016},
}

@article{Osborne-et.-al-2012,
  author = {Osborne, Timothy and Putnam, Michael and Groß, Thomas},
  title = {Catenae: {Introducing} a Novel Unit of Syntactic Analysis},
  doi = {10.1111/j.1467-9612.2012.00172.x},
  number = {4},
  pages = {354--396},
  volume = {15},
  journal = {Syntax},
  publisher = {Blackwell Publishing Ltd},
  year = {2012},
}

@phdthesis{Evert, author = {Stefan Evert}, title = {The 
statistics of word cooccurrences: {Word} pairs and collocations}, school = {Institut für maschinelle Sprachverarbeitung, University of Stuttgart}, year = {2004}, }

@incollection{barbu-mititelu-etal-2019-hear,
  author = {Barbu Mititelu, Verginica and Stoyanova, Ivelina and Leseva, Svetlozara and Mitrofan, Maria and Dimitrova, Tsvetana and Todorova, Maria},
  booktitle = {{Proceedings of the joint workshop on Multiword Expressions and WordNet (MWE-WN 2019)}},
  title = {{Hear about verbal multiword expressions in the {Bulgarian} and the {Romanian} Wordnets straight from the horse's mouth}},
  doi = {10.18653/v1/W19-5102},
  pages = {2--12},
  publisher = {Association for Computational Linguistics},
  address = {Florence, Italy},
  year = {2019},
}

@techreport{tei-dict,
  author = {{Text Encoding Initiative}},
  title = {{P5: Guidelines for electronic text encoding and interchange, Chap. 9 Dictionaries}},
  note = {Version 4.4.0. Last updated on 19th April 2022, revision ff9cc28b0},
  url = {https://tei-c.org/release/doc/tei-p5-doc/en/html/DI.html},
  year = {2022},
}

@article{Schafroth2015,
  author = {Schafroth, Elmar},
  title = {Italian Phrasemes as Constructions: {How} to Understand and Use Them},
  doi = {10.3844/jssp.2015.317.337},
  number = {11},
  pages = {317--337},
  volume = {3},
  journal = {Journal of Social Sciences},
  year = {2015},
}

@article{Hnatkova:Petkevic:2017,
  author = {Hnátková, Milena and Petkevič, Vladimír},
  title = {Morphological disambiguation of multiword expressions and its impact on the disambiguation of their environment in a sentence},
  doi = {10.1515/jazcas-2017-0025},
  number = {2},
  pages = {145--155},
  volume = {68},
  journal = {Jazykovedný Časopis},
  year = {2017},
}

@Book{Siegel/Castellan:88, author = {Sidney Siegel and N. 
John Castellan}, title = {Nonparametric Statistics for the Behavioral Sciences}, publisher = {McGraw-Hill}, address = {Boston, MA}, year = {1988}, }

@article{volodina2022single,
  author = {Volodina, Elena and Alfter, David and Lindström Tiedemann, Therese},
  title = {Crowdsourcing ratings for single lexical items: {A} core vocabulary perspective},
  doi = {10.4312/slo2.0.2022.2.5-61},
  number = {2},
  pages = {5--61},
  volume = {10},
  journal = {Slovenščina 2.0},
  year = {2022},
}

@phdthesis{Mini2009,
  author = {Mini, Marianna},
  title = {Linguistic and psycholinguistic study of fixed verbal expressions with fixed subject in {Greek}: {A} morphosyntactic analysis, lexicosemantic gradation and processing by elementary school children},
  school = {University of Patras},
  year = {2009},
}

@incollection{Osenova2011,
  author = {Petya Osenova},
  booktitle = {The Languages of the new {EU} Member States},
  title = {Bulgarian},
  pages = {643--668},
  volume = {88},
  number = {3},
  series = {Revue Belge de Philologie et d’Histoire},
  year = {2010},
}

@incollection{Uresova:2009,
  author = {Urešová, Zdeňka},
  booktitle = {On-line proceedings of the fifth corpus linguistics conference},
  title = {Building the {PDT-VALLEX} valency lexicon},
  publisher = {University of Liverpool},
  url = {https://ufal.mff.cuni.cz/~uresova/web.pdf/2012-CLC-Building%20the%20PDT-VALLEX.pdf},
  year = {2009},
}

@book{vietri,
  author = {Simonetta Vietri},
  title = {Idiomatic Constructions in {Italian}: {A} Lexicon-Grammar Approach},
  publisher = {John Benjamins},
  address = {Amsterdam/Philadelphia},
  year = {2014},
}

@incollection{Koeva-et-al2016, author = {Svetla Koeva and Ivelina Stoyanova and Maria Todorova and Svetlozara Leseva}, booktitle = {{Proceedings of the GLOBALEX 2016 workshop: Lexicographic Resources for Human Language Technology, LREC}}, title = {Semi-automatic Compilation of the Dictionary of {Bulgarian} Multiword Expressions}, editor = {Nicoletta Calzolari and Khalid Choukri and Thierry Declerck and Sara Goggi and 
Marko Grobelnik and Bente Maegaard and Joseph Mariani and Helene Mazo and Asuncion Moreno and Jan Odijk and Stelios Piperidis}, pages = {86--95}, year = {2016}, publisher = {European Language Resources Association (ELRA)}, address = {Paris}, }

@article{meunier2012formulaic,
  author = {Meunier, Fanny},
  title = {Formulaic language and language teaching},
  pages = {111--129},
  volume = {32},
  journal = {Annual Review of Applied Linguistics},
  publisher = {Cambridge University Press},
  year = {2012},
}

% Initials are space-separated so each one is parsed as its own name token.
@book{ruppenhofer_etal_2016,
  author = {Ruppenhofer, Josef and Ellsworth, Michael and Petruck, Miriam R. L. and Johnson, Christopher R. and Scheffczyk, Jan},
  title = {{FrameNet} {II}: {Extended} Theory and Practice},
  url = {https://framenet2.icsi.berkeley.edu/docs/r1.7/book.pdf},
  year = {2016},
}

@incollection{fellbaum-1998-towards,
  author = {Fellbaum, Christiane},
  booktitle = {Usage of {WordNet} in Natural Language Processing Systems},
  title = {Towards a Representation of Idioms in {WordNet}},
  pages = {52--57},
  url = {https://aclanthology.org/W98-0707},
  year = {1998},
}

@incollection{barbu-mititelu-etal-2019-romanian,
  author = {Barbu Mititelu, Verginica and Cristescu, Mihaela and Onofrei, Mihaela},
  booktitle = {{Proceedings of the Joint Workshop on Multiword Expressions and WordNet (MWE-WN 2019)}},
  title = {The {Romanian} Corpus Annotated with Verbal Multiword Expressions},
  doi = {10.18653/v1/W19-5103},
  pages = {13--21},
  publisher = {Association for Computational Linguistics},
  address = {Florence, Italy},
  year = {2019},
}

@incollection{CapEtAl:15,
  author = {Fabienne Cap and Manju Nirmal and Marion Weller and Sabine {Schulte im Walde}},
  booktitle = {Proceedings of the 11th Workshop on Multiword Expressions},
  title = {How to Account for Idiomatic {German} Support Verb Constructions in Statistical Machine Translation},
  pages = {19--28},
  address = {Denver, CO},
  year = {2015},
}

@Article{Linden_etal_2017, author = {Krister Lindén and Heidi Haltia and Juha Luukkonen and Antti 
Olavi Laine and Henri Roivainen and Niina Väisänen}, title = {{FinnFN} 1.0: {The} {Finnish} frame semantic database}, number = {3}, pages = {287--311}, volume = {40}, journal = {Nordic Journal of Linguistics}, year = {2017}, }

@incollection{Carpuat/Diab:10,
  author = {Marine Carpuat and Mona Diab},
  booktitle = {Proceedings of the 11th Annual Conference of the {North American} Chapter of the {Association for Computational Linguistics}},
  title = {Task-based Evaluation of Multiword Expressions: {A} Pilot Study in Statistical Machine Translation},
  address = {Los Angeles, CA},
  year = {2010},
}

@incollection{yimam_etal_2013,
  author = {Yimam, Seid Muhie and Gurevych, Iryna and Eckart de Castilho, Richard and Biemann, Chris},
  booktitle = {Proceedings of the 51st Annual Meeting of the {Association} for {Computational} {Linguistics}: {System} Demonstrations},
  title = {{WebAnno}: {A} Flexible, Web-based and Visually Supported System for Distributed Annotations},
  pages = {1--6},
  publisher = {Association for Computational Linguistics},
  address = {Sofia, Bulgaria},
  year = {2013},
}

@incollection{Koehn:05,
  author = {Philipp Koehn},
  booktitle = {Proceedings of the 10th Machine Translation Summit},
  title = {{Europarl: A parallel corpus for statistical machine translation}},
  pages = {79--86},
  address = {Phuket, Thailand},
  ids = {koehn-2005-europarl},
  year = {2005},
}

@article{Alpino:2002,
  author = {Leonoor van der Beek and Gosse Bouma and Gertjan van Noord},
  title = {Een brede computationele grammatica voor het {Nederlands}},
  pages = {353--374},
  volume = {7},
  journal = {Nederlandse Taalkunde},
  year = {2002},
}

@incollection{granger2018formulaic,
  author = {Granger, Sylviane},
  booktitle = {{Understanding formulaic language: A second language acquisition perspective}},
  title = {Formulaic Sequences in Learner Corpora},
  editor = {Siyanova-Chanturia, Anna and Pellicer-Sanchez, Ana},
  pages = {228--247},
  publisher = {Routledge},
  year = {2018},
}

@InBook{bresnan, author = {Joan Bresnan}, 
booktitle = {Linguistic Theory and Psychological Reality}, title = {A realistic transformational grammar}, editor = {Morris Halle and Joan Bresnan and George A. Miller}, pages = {1--59}, publisher = {MIT Press}, year = {1978}, }

% number carries the numeric issue.
@article{bjorklund2007prep,
  author = {Björklund, Siv},
  title = {Reflexiva verb och infinitivfraser},
  number = {1},
  url = {https://www.sprakbruk.fi/-/reflexiva-verb-och-infinitivfraser},
  journal = {Språkbruk},
  year = {2007},
}

@incollection{Monti2014,
  author = {Monti, Johanna},
  booktitle = {{Proceedings of the first Italian conference on Computational Linguistics CLiC-it 2014 and of the fourth international workshop EVALITA}},
  title = {{An English-Italian MWE dictionary}},
  pages = {265--269},
  publisher = {Pisa University Press},
  address = {Pisa},
  year = {2014},
}

@incollection{klimek2019challenges,
  author = {Klimek, Bettina and McCrae, John Philip and Bosque-Gil, Julia and Ionov, Maxim and Tauber, James K. and Chiarcos, Christian},
  booktitle = {Proceedings of Sixth Biennial Conference on {Electronic Lexicography} ({eLex 2019})},
  title = {Challenges for the Representation of Morphology in Ontology Lexicons},
  year = {2019},
}

% Publisher is named as in alfter2016distributions, a paper from the same proceedings volume.
@incollection{volodina2016swellex,
  author = {Volodina, Elena and Pilán, Ildikó and Llozhi, Lorena and Degryse, Baptiste and François, Thomas},
  booktitle = {{Proceedings of the joint Workshop on NLP for Computer-Assisted Language Learning and NLP for Language Acquisition (NLP4CALL \& NLP4LA)}},
  title = {{SweLLex: Second language learners’ productive vocabulary}},
  editor = {Volodina, Elena and Grigonytė, Gintarė and Pilán, Ildikó and Nilsson Björkenstam, Kristina and Borin, Lars},
  pages = {76--84},
  publisher = {Linköping University Electronic Press},
  url = {https://aclanthology.org/W16-6500},
  location = {Umeå},
  year = {2016},
}

@Article{anward1976om, author = {Anward, Jan and Linell, Per}, title = {{Om lexikaliserade fraser i svenskan}}, pages = {77--119}, volume = {55--56}, journal = {Nysvenska Studier}, year = 
{1976},
}

@InCollection{Odijk:2013-382998,
  author = {Jan Odijk},
  booktitle = {{LMF}: {Lexical} Markup Framework},
  title = {{DUELME}: {Dutch} Electronic Lexicon of Multiword Expressions},
  editor = {Francopoulo, Gil},
  pages = {133--144},
  publisher = {ISTE / Wiley},
  address = {London, UK / Hoboken, US},
  year = {2013},
}

@Article{francopoulo2009multilingual,
  author = {Francopoulo, Gil and Bel, Nuria and George, Monte and Calzolari, Nicoletta and Monachini, Monica and Pet, Mandy and Soria, Claudia},
  title = {{Multilingual resources for NLP in the lexical markup framework (LMF)}},
  number = {1},
  pages = {57--70},
  volume = {43},
  journal = {Language Resources and Evaluation},
  publisher = {Springer},
  year = {2009},
}

@InBook{Odijk:2013-382996,
  author = {Jan Odijk},
  booktitle = {Essential Speech and Language Technology for {Dutch}: {R}esults by the {STEVIN}-programme},
  title = {Identification and Lexical Representation of Multiword Expressions},
  editor = {Spyns, P. and Odijk, J. E. J. M.},
  pages = {201--217},
  publisher = {Springer},
  series = {Theory and Applications of Natural Language Processing},
  address = {Berlin/Heidelberg},
  year = {2013},
}

@PhdThesis{Fotopoulou1993,
  author = {Fotopoulou, Aggeliki},
  title = {Une classification des phrases à compléments figés en grec moderne: étude morphosyntaxique des phrases figées},
  school = {Université Paris VIII},
  langid = {french},
  year = {1993},
}

@Misc{Mikolov:etal:2013,
  author = {Mikolov, Tomas and Chen, Kai and Corrado, Greg and Dean, Jeffrey},
  title = {{Efficient estimation of word representations in vector space}},
  doi = {10.48550/arxiv.1301.3781},
  year = {2013},
}

@InCollection{krimpas,
  author = {Panagiotis G.
Krimpas},
  booktitle = {{Οι Πομάκοι της Θράκης: πολυεπιστημονικές και διεπιστημονικές προσεγγίσεις}},
  title = {{Η} γλώσσα και η καταγωγή των {Πομάκων υπό το φως της Βαλκανικής Ζώνης Γλωσσικής Επαφής}},
  editor = {Manolis Varvounis and Antonis Bartsiokas and Nadia Macha-Bizoumi},
  pages = {167--204},
  series = {{Μελέτες Λαογραφίας και Κοινωνικής Ανθρωπολογίας 7}},
  year = {2020},
}

@Article{SchulteImWalde/Borgwaldt:15,
  author = {Sabine {Schulte im Walde} and Susanne Borgwaldt},
  title = {Association Norms for {German} Noun Compounds and their Constituents},
  number = {4},
  pages = {1199--1221},
  volume = {47},
  journal = {Behavior Research Methods},
  year = {2015},
}

@Book{rudebeck2021swell,
  author = {Rudebeck, Lisa and Sundberg, Gunlög and Wirén, Mats},
  title = {{SweLL normalization guidelines}},
  publisher = {University of Gothenburg},
  series = {GU-ISS Research report series},
  url = {http://hdl.handle.net/2077/69432},
  year = {2021},
}

@incollection{alfter2019legato,
  author = {Alfter, David and Lindström Tiedemann, Therese and Volodina, Elena},
  booktitle = {{22nd Nordic Conference on Computational Linguistics (NoDaLiDa)}},
  title = {{LEGATO: A flexible lexicographic annotation tool}},
  editor = {Hartmann, Mareike and Plank, Barbara},
  pages = {382--388},
  publisher = {Linköping University Electronic Press},
  year = {2019},
}

@Book{karlsson2017svenska,
  author = {Karlsson, Ola},
  title = {Svenska skrivregler},
  publisher = {Liber},
  year = {2017},
}

@Article{Hardie2012,
  author = {Andrew Hardie},
  title = {{CQPweb: Combining power, flexibility and usability in a corpus analysis tool}},
  number = {3},
  pages = {380--409},
  volume = {17},
  journal = {{International Journal of Corpus Linguistics}},
  year = {2012},
}

@incollection{Rychly2008,
  author = {Pavel Rychlý},
  booktitle = {{RASLAN 2008}},
  title = {A Lexicographer-Friendly Association Score},
  pages = {6--9},
  publisher = {Masarykova Univerzita},
  url = {https://nlp.fi.muni.cz/raslan/2008/papers/13.pdf},
  address = {Brno},
year = {2008},
}

@incollection{Haetty/SchulteImWalde:18b,
  author = {Hätty, Anna and {Schulte im Walde}, Sabine},
  booktitle = {Proceedings of the {COLING} Joint Workshop on Linguistic Annotation, Multiword Expressions and Constructions},
  title = {Fine-grained Termhood Prediction for {German} Compound Terms using Neural Networks},
  pages = {62--73},
  address = {Santa Fe, NM},
  year = {2018},
}

@incollection{Venturi2009,
  author = {Giulia Venturi and Alessandro Lenci and Simonetta Montemagni and Eva Maria Vecchi and Maria-Teresa Sagri and Daniela Tiscornia and Tommaso Agnoloni},
  booktitle = {Proceedings of the 3rd Workshop on {Legal Ontologies} and {Artificial} {Intelligence} {Techniques}, held in conjunction with the 2nd Workshop on {Semantic} {Processing} of {Legal} {Text}},
  title = {Towards a {FrameNet} Resource for the Legal Domain},
  pages = {67--76},
  address = {Barcelona, Spain},
  year = {2009},
  editor = {Núria Casellas and Enrico Francesconi and Rinke Hoekstra and Simonetta Montemagni},
  url = {https://ceur-ws.org/Vol-465/paper8.pdf},
  series = {CEUR Workshop Proceedings},
  number = {465},
}

@incollection{Torrent_etal_2018,
  author = {Timponi Torrent, Tiago and Michael Ellsworth and Collin Baker and Ely Edison da Silva Matos},
  booktitle = {Multilingual {FrameNets} and Constructions, {The} International {FrameNet} Workshop 2018},
  title = {The {Multilingual} {FrameNet} Shared Annotation Task: {A} Preliminary Report},
  year = {2018},
}

@incollection{SchulteImWaldeEtAl:13,
  author = {Sabine {Schulte im Walde} and Stefan Müller and Stephen Roller},
  booktitle = {Proceedings of the 2nd Joint Conference on {Lexical and Computational Semantics}},
  title = {Exploring Vector Space Models to Predict the Compositionality of {German} Noun-Noun {Compounds}},
  pages = {255--265},
  address = {Atlanta, GA},
  editor = {Mona Diab and Tim Baldwin and Marco Baroni},
  year = {2013},
  url = {https://aclanthology.org/S13-1038},
}

@Article{constant-etal-2017-survey,
  author = {Constant, Mathieu and
Eryiğit, Gülşen and Monti, Johanna and van der Plas, Lonneke and Ramisch, Carlos and Rosner, Michael and Todirascu, Amalia},
  title = {Multiword Expression Processing: {A} Survey},
  doi = {10.1162/COLI_a_00302},
  number = {4},
  pages = {837--892},
  volume = {43},
  address = {Cambridge, MA},
  journal = {Computational Linguistics},
  publisher = {MIT Press},
  year = {2017},
}

@incollection{Ma:etal:2018,
  author = {Ma, Xuezhe and Hu, Zecong and Liu, Jingzhou and Peng, Nanyun and Neubig, Graham and Hovy, Eduard},
  booktitle = {{Proceedings of the 56th annual meeting of the Association for Computational Linguistics}},
  title = {Stack-Pointer Networks for Dependency Parsing},
  doi = {10.18653/v1/P18-1130},
  pages = {1403--1414},
  publisher = {Association for Computational Linguistics},
  address = {Melbourne},
  year = {2018},
}

@InBook{helge_dyvik_2019_2579037,
  author = {Helge Dyvik and Gyri Smørdal Losnegaard and Victoria Rosén},
  booktitle = {Representation and parsing of multiword expressions: {Current} trends},
  title = {{Multiword expressions in an LFG grammar for Norwegian}},
  doi = {10.5281/zenodo.2579037},
  editor = {Yannick Parmentier and Jakub Waszczuk},
  pages = {69--108},
  publisher = {Language Science Press},
  year = {2019},
}

@incollection{chiarcos2022computational,
  author = {Chiarcos, Christian and Gkirtzou, Katerina and Khan, Fahad and Labropoulou, Penny and Passarotti, Marco and Pellegrini, Matteo},
  booktitle = {{Proceedings of the 8th workshop on Linked Data in Linguistics within the 13th Language Resources and Evaluation Conference}},
  editor = {Thierry Declerck and John P. McCrae and Elena Montiel and Christian Chiarcos and Maxim Ionov},
  title = {Computational Morphology with {OntoLex-Morph}},
  location = {Marseille},
  publisher = {European Language Resources Association},
  url = {https://aclanthology.org/2022.ldl-1.0},
  pages = {78--86},
  year = {2022},
}

@incollection{Bell/Schaefer:13,
  author = {Melanie J.
Bell and Martin Schäfer},
  booktitle = {Proceedings of the {IWCS 2013} Workshop on Formal Distributional Semantics},
  editor = {Aurelie Herbelot and Roberto Zamparelli and Gemma Boleda},
  title = {Semantic Transparency: {Challenges} for Distributional Semantics},
  pages = {1--10},
  address = {Potsdam, Germany},
  year = {2013},
}

@Article{Kilgarriff2014,
  author = {Kilgarriff, Adam and Baisa, Vít and Bušta, Jan and Jakubíček, Miloš and Kovář, Vojtěch and Michelfeit, Jan and Rychlý, Pavel and Suchomel, Vít},
  title = {The {Sketch} {Engine}: {Ten} years on},
  pages = {7--36},
  volume = {1},
  journal = {Lexicography},
  year = {2014},
}

@Article{capel2015english,
  author = {Capel, Annette},
  title = {{The English vocabulary profile}},
  pages = {9--27},
  volume = {5},
  journal = {English profile in practice},
  publisher = {Cambridge University Press},
  address = {Cambridge},
  year = {2015},
}

@Article{erman2007cognitive,
  author = {Erman, Britt},
  title = {{Cognitive processes as evidence of the idiom principle}},
  number = {1},
  pages = {25--53},
  volume = {12},
  address = {Amsterdam/Philadelphia},
  journal = {International Journal of Corpus Linguistics},
  publisher = {John Benjamins},
  year = {2007},
}

@Article{Giouli.2023,
  author = {Giouli, Voula},
  title = {A model for representing the semantics of {MWEs}: {From} lexical semantics to the semantic annotation of complex predicates},
  doi = {10.3389/frai.2023.802218},
  volume = {6},
  journal = {Frontiers in Artificial Intelligence},
  year = {2023},
}

@incollection{schmidt2012attention,
  author = {Schmidt, Richard},
  title = {Attention, awareness, and individual differences in language learning},
  pages = {27--50},
  booktitle = {Perspectives on individual characteristics and foreign language education},
  editor = {Wai Meng Chan and Kwee Nyet Chin and Sunil Kumar Bhatt and Izumi Walker},
  series = {SSFLE},
  number = {6},
  publisher = {De Gruyter Mouton},
  doi = {10.1515/9781614510932.27},
  year = {2012},
}

@Article{Wisniewski:96,
  author = {Edward J.
Wisniewski},
  title = {Construal and Similarity in Conceptual Combination},
  pages = {434--453},
  volume = {35},
  journal = {Journal of Memory and Language},
  year = {1996},
}

@incollection{Gyri2016,
  author = {Gyri Smørdal Losnegaard and Federico Sangati and Carla Parra Escartín and Agata Savary and Sascha Bargmann and Johanna Monti},
  booktitle = {{10th international conference on Language Resources and Evaluation (LREC 2016)}},
  title = {{PARSEME survey on MWE resources}},
  pages = {2299--2306},
  url = {https://hal.science/hal-01316351},
  address = {Portorož},
  year = {2016},
}

@incollection{leseva-etal-2020-takes,
  author = {Leseva, Svetlozara and Mititelu, Verginica Barbu and Stoyanova, Ivelina},
  booktitle = {{Proceedings of the 4th international conference on Computational Linguistics in Bulgaria (CLIB 2020)}},
  title = {It Takes Two to Tango: {Towards} a Multilingual {MWE} Resource},
  pages = {101--111},
  publisher = {Department of Computational Linguistics, IBL -- BAS},
  url = {https://aclanthology.org/2020.clib-1.11},
  address = {Sofia, Bulgaria},
  year = {2020},
}

@incollection{torrent-etal-2014-copa,
  author = {Timponi Torrent, Tiago and Salomão, Maria Margarida M. and Campos, Fernanda C. A. and Braga, Regina M. M. and Matos, Ely E. S. and Gamonal, Maucha A. and Gonçalves, Julia A. and Souza, Bruno C. P. and Gomes, Daniela S.
and Peron, Simone R.},
  booktitle = {Proceedings of {COLING} 2014, the 25th International Conference on {Computational} {Linguistics}: {System} Demonstrations},
  title = {Copa 2014 {FrameNet} {Brasil}: a frame-based trilingual electronic dictionary for the {Football} {World} {Cup}},
  pages = {10--14},
  publisher = {Dublin City University and Association for Computational Linguistics},
  address = {Dublin, Ireland},
  year = {2014},
}

@InCollection{borin2021multiword,
  author = {Borin, Lars},
  booktitle = {{The Swedish FrameNet++: harmonization, integration, method development and practical language technology applications}},
  title = {Multiword expressions: {A} tough typological nut for {Swedish} {FrameNet++}},
  editor = {Dannélls, Dana and Borin, Lars and Friberg Heppin, Karin},
  pages = {221--260},
  publisher = {John Benjamins},
  address = {Amsterdam/Philadelphia},
  year = {2021},
}

@Article{alfter2021mwe,
  author = {Alfter, David and Lindström Tiedemann, Therese and Volodina, Elena},
  title = {Crowdsourcing Relative Rankings of Multi-Word Expressions: {Experts} versus Non-Experts},
  number = {1},
  volume = {7},
  journal = {Northern European Journal of Language Technology},
  year = {2021},
}

@incollection{volodina2022annotation,
  author = {Volodina, Elena and Alfter, David and Lindström Tiedemann, Therese and Lauriala, Maisa and Piipponen, Daniela},
  booktitle = {{Selected papers from the {CLARIN} Annual Conference 2021}},
  title = {{Reliability of automatic linguistic annotation: {Native} vs non-native texts}},
  doi = {10.3384/9789179294441},
  editor = {Monachini, Monica and Eskevich, Maria},
  pages = {151--167},
  publisher = {Linköping Electronic Press},
  year = {2022},
}

@InCollection{Sheinfux:2019,
  author = {Sheinfux, Livnat Herzig and Greshler, Tali Arad and Melnik, Nurit and Wintner, Shuly},
  booktitle = {Representation and parsing of multiword expressions: {Current} trends},
  title = {Verbal Multiword Expressions: {I}diomaticity and flexibility},
  doi = {10.5281/zenodo.2579035},
  editor =
{Parmentier, Yannick and Waszczuk, Jakub},
  pages = {35--68},
  publisher = {Language Science Press},
  address = {Berlin},
  year = {2019},
}

@Article{MTT,
  author = {Mel’čuk, Igor},
  title = {Meaning-Text Models: {A} Recent Trend in {Soviet} Linguistics},
  pages = {27--62},
  volume = {10},
  journal = {Annual Review of Anthropology},
  year = {1981},
}

% NOTE(review): the page range below was stored inverted as 288--244;
% it is corrected to 208--244 here. Confirm against the printed volume.
@InCollection{cieslicka2015idiom,
  author = {Cieślicka, Anna B.},
  booktitle = {{Bilingual figurative language processing}},
  title = {{Idiom acquisition and processing by second/foreign language learners}},
  editor = {Heredia, Roberto R. and Cieślicka, Anna B.},
  pages = {208--244},
  publisher = {Cambridge University Press},
  year = {2015},
}

@incollection{Hnatkova:etal:2017,
  author = {Hnátková, Milena and Jelínek, Tomáš and Kopřivová, Marie and Petkevič, Vladimír and Rosen, Alexandr and Skoumalová, Hana and Vondřička, Pavel},
  booktitle = {{Computational and corpus-based phraseology}},
  title = {Eye of a Needle in a Haystack},
  doi = {10.1007/978-3-319-69805-2_12},
  editor = {Mitkov, Ruslan},
  pages = {160--175},
  publisher = {Springer},
  address = {Cham},
  year = {2017},
}

@incollection{Hnatkova:etal:2014,
  author = {Hnátková, Milena and Křen, Michal and Procházka, Pavel and Skoumalová, Hana},
  booktitle = {{Proceedings of the ninth international conference on Language Resources and Evaluation (LREC'14)}},
  title = {{The SYN-series corpora of written Czech}},
  pages = {160--164},
  publisher = {{ELRA}},
  url = {https://aclanthology.org/L14-1267/},
  address = {Reykjavík},
  year = {2014},
}

@PhdThesis{Gruen:2010,
  author = {Christian Grün},
  title = {Storing and Querying Large {XML} Instances},
  school = {University of {Konstanz}},
  year = {2010},
}

@Book{af2008finlandssvensk,
  author = {af Hällström, Charlotta and Reuter, Mikael},
  title = {{Finlandssvensk ordbok}},
  edition = {Electronic version of the 4th edition},
  publisher = {Schildts förlag and Forskningscentralen för de inhemska språken},
  url = {https://kaino.kotus.fi/fsob/},
  year = {2008},
}
@incollection{yamaguchi2022towards,
  author = {Yamaguchi, Nami and Alfter, David and Sugiyama, Kaori and François, Thomas},
  booktitle = {Proceedings of the 11th Workshop on {NLP} for Computer Assisted Language Learning},
  title = {Towards a Verb Profile: {Distribution} of verbal tenses in {FFL} textbooks and in learner productions},
  editor = {Alfter, David and Volodina, Elena and François, Thomas and Desmet, Piet and Cornillie, Frederik and Jönsson, Arne and Rennes, Evelina},
  pages = {123--142},
  publisher = {LiU Electronic Press},
  url = {https://aclanthology.org/2022.nlp4call-1.13},
  address = {Louvain-la-Neuve, Belgium},
  year = {2022},
}

@Article{gross_1982,
  author = {Gross, Maurice},
  title = {Une classification des phrases « figées » du français},
  langid = {french},
  number = {2},
  pages = {36--41},
  volume = {11},
  journal = {Revue québécoise de linguistique},
  year = {1982},
}

@Article{okeeffe2017english,
  author = {O’Keeffe, Anne and Mark, Geraldine},
  title = {The {English} Grammar Profile of learner competence: {Methodology} and key findings},
  number = {4},
  pages = {457--489},
  volume = {22},
  address = {Amsterdam/Philadelphia},
  journal = {International Journal of Corpus Linguistics},
  publisher = {John Benjamins},
  year = {2017},
}

@incollection{baker_etal_1998,
  author = {Baker, Collin F. and Fillmore, Charles J. and Lowe, John B.},
  booktitle = {36th Annual Meeting of the {Association} for {Computational} {Linguistics} and 17th {International} {Conference} on {Computational} {Linguistics}},
  title = {The {Berkeley} {FrameNet} Project},
  pages = {86--90},
  publisher = {Association for Computational Linguistics},
  volume = {1},
  address = {Montreal},
  year = {1998},
}

@Book{coe2020companion,
  author = {{Council of Europe}},
  title = {{Common European Framework of Reference for Languages: learning, teaching, assessment}},
  publisher = {Council of Europe Publishing},
  year = {2020},
}

@Article{deJongEtAl:02,
  author = {Nicole H. {de Jong} and Laurie B.
Feldman and Robert Schreuder and Michael Pastizzo and R. Harald Baayen},
  title = {The Processing and Representation of {Dutch} and {English} Compounds: {Peripheral} Morphological and Central Orthographic Effects},
  pages = {555--567},
  volume = {81},
  journal = {Brain and Language},
  year = {2002},
}

@Book{RamischHab,
  author = {Carlos Ramisch},
  title = {{Multiword expressions in computational linguistics: Down the rabbit hole and through the looking glass}},
  publisher = {Aix Marseille Université {(AMU)}},
  year = {2023},
  url = {https://theses.hal.science/tel-04216223},
}

@incollection{Martins:etal:2013,
  author = {Martins, André and Almeida, Miguel and Smith, Noah A.},
  booktitle = {{Proceedings of the 51st annual meeting of the Association for Computational Linguistics}},
  title = {Turning on the Turbo: {Fast} Third-Order Non-Projective Turbo Parsers},
  pages = {617--622},
  publisher = {Association for Computational Linguistics},
  url = {https://aclanthology.org/P13-2109/},
  address = {Sofia},
  year = {2013},
}

@incollection{chiarcos-etal-2022-lrec-morph,
  author = {Christian Chiarcos and Christian Fäth and Maxim Ionov},
  booktitle = {Proceedings of the 13th International Conference on Language Resources and Evaluation ({LREC-2022})},
  title = {Unifying Morphology Resources with {OntoLex-Morph}: {A} Case Study in {German}},
  address = {Marseille, France},
  year = {2022},
}

@Book{coe2009relating,
  author = {{Council of Europe}},
  title = {{Relating language examinations to the Common European Framework of Reference for Languages: Learning, teaching, assessment (CEFR)}},
  editor = {Figueras, Neus and North, Brian and Takala, Sauli and Van Avermaet, Piet and Verhelst, Norman},
  publisher = {Council of Europe, Language policy division},
  year = {2009},
}

@Book{Fellbaum1998,
  title = {{WordNet: An electronic lexical database}},
  editor = {Christiane Fellbaum},
  publisher = {The MIT Press},
  address = {Cambridge, MA},
  year = {1998},
}

@incollection{declerck2016towards,
  author = {Declerck, Thierry
and Lendvai, Piroska},
  booktitle = {{Proceedings of the 14th SIGMORPHON workshop on computational research in phonetics, phonology, and morphology}},
  editor = {Micha Elsner and Sandra Kuebler},
  title = {Towards a Formal Representation of Components of {German} Compounds},
  pages = {104--109},
  year = {2016},
  location = {Berlin},
  publisher = {ACL},
  doi = {10.18653/v1/W16-2017},
}

@Book{Müller2021,
  title = {{Head}-{Driven} {Phrase} {Structure} {Grammar}: {The} handbook},
  doi = {10.5281/zenodo.5543318},
  editor = {Müller, Stefan and Abeillé, Anne and Borsley, Robert D. and Koenig, Jean-Pierre},
  number = {9},
  publisher = {Language Science Press},
  series = {Empirically Oriented Theoretical Morphology and Syntax},
  address = {Berlin},
  year = {2021},
}

@incollection{Brouwer:etal:MTAS:2016,
  author = {Brouwer, Matthijs and Hennie Brugman and Marc Kemps-Snijders},
  booktitle = {Selected papers from the {CLARIN} Annual Conference 2016, 26--28 {October}, {Aix-en-Provence}},
  title = {A {SOLR / Lucene} based Multi Tier Annotation Search solution},
  pages = {29--37},
  publisher = {Linköping University Electronic Press},
  url = {https://ep.liu.se/ecp/article.asp?issue=136&article=002&volume=0},
  address = {Linköping, Sweden},
  keywords = {CMDI},
  year = {2016},
}

@Book{Anastasiadis-Symeonidis1986,
  author = {Anastasiadis-Symeonidis, Anna},
  title = {Η νεολογία στην κοινή νεοελληνική (`{Neology} in {Modern} {Greek}')},
  publisher = {Aristotle University of Thessaloniki},
  address = {Thessaloniki},
  year = {1986},
}

@Book{Sager1990,
  author = {Sager, Juan C.},
  title = {A Practical Course in Terminology Processing},
  publisher = {John Benjamins},
  address = {Amsterdam},
  year = {1990},
}

@TechReport{owl:2004,
  author = {Bechhofer, Sean and van Harmelen, Frank and Hendler, Jim and Horrocks, Ian and McGuinness, Deborah and Patel-Schneider, Peter and Stein, Lynn Andrea},
  institution = {{World Wide Web Consortium (W3C)}},
  title = {{OWL Web Ontology Language Reference}},
  url = {http://www.w3.org/TR/owl-ref/},
editor = {Dean, Mike and Schreiber, Guus},
  year = {2004},
}

@TechReport{lexicog-2019,
  author = {Julia Bosque-Gil and Jorge Gracia},
  institution = {W3C},
  title = {The {OntoLex Lemon} Lexicography Module ({Final} Community Group Report)},
  url = {https://www.w3.org/2019/09/lexicog/},
  year = {2019},
}

% NOTE(review): this entry previously carried doi 10.1007/978-3-642-30910-6_12.
% The 10.1007 prefix is Springer's, while this volume is published by the
% University of Białystok, so the DOI cannot belong here. It looks like it
% belongs to the Springer STEVIN volume (cf. entry Odijk:2013-382996).
% Verify and re-attach it there if confirmed.
@InBook{Autelli2020,
  author = {Autelli, Erica},
  booktitle = {Applied linguistics perspectives on reproducible multiword units: {Foreign} language teaching and lexicography},
  series = {Intercontinental Dialogue on Phraseology},
  number = {8},
  title = {Phrasemes in {Genoese} and {Genoese-Italian} lexicography},
  editor = {Szerszunowicz, Joanna and Gorlewska, Eva},
  pages = {101--127},
  publisher = {University of Białystok Publishing House},
  address = {Białystok},
  year = {2020},
}

@incollection{simov-osenova-2015-catena,
  author = {Simov, Kiril and Osenova, Petya},
  booktitle = {Proceedings of the Third International Conference on Dependency Linguistics (Depling 2015)},
  title = {Catena Operations for Unified Dependency Analysis},
  editor = {Nivre, Joakim and Hajičová, Eva},
  pages = {320--329},
  publisher = {Uppsala University},
  url = {https://aclanthology.org/W15-2135},
  address = {Uppsala, Sweden},
  year = {2015},
}

@incollection{suchanek2020case,
  author = {Suchánek, Marek and Pergl, Robert},
  booktitle = {{2020 IEEE 22nd Conference on Business Informatics (CBI)}},
  title = {Case-study-based review of approaches for transforming {UML} class diagrams to {OWL} and vice versa},
  organization = {IEEE},
  pages = {270--279},
  volume = {1},
  year = {2020},
}

@Article{ringbom2012country,
  author = {Ringbom, Håkan},
  title = {A country in focus: {Review} of recent applied linguistics research in {Finland} and {Sweden}, with specific reference to foreign language learning and teaching},
  number = {4},
  pages = {490--514},
  volume = {45},
  journal = {Language Teaching},
  year = {2012},
}

@incollection{przepiorkowski-etal-2014-walenty,
  author = {Przepiórkowski, Adam and
Hajnicz, Elżbieta and Patejuk, Agnieszka and Woliński, Marcin and Skwarski, Filip and Świdziński, Marek},
  booktitle = {Proceedings of the Ninth International Conference on {Language Resources and Evaluation} ({LREC}'14)},
  title = {{W}alenty: {Towards} a comprehensive valence dictionary of {P}olish},
  editor = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Loftsson, Hrafn and Maegaard, Bente and Mariani, Joseph and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios},
  pages = {2785--2792},
  publisher = {European Language Resources Association (ELRA)},
  url = {http://www.lrec-conf.org/proceedings/lrec2014/pdf/279_Paper.pdf},
  address = {Reykjavik, Iceland},
  year = {2014},
}

@incollection{savary-etal-2019-without,
  author = {Savary, Agata and Cordeiro, Silvio and Ramisch, Carlos},
  booktitle = {Proceedings of the Joint Workshop on {Multiword Expressions} and {WordNet} ({MWE-WN} 2019)},
  title = {Without lexicons, multiword expression identification will never fly: {A} position statement},
  doi = {10.18653/v1/W19-5110},
  pages = {79--91},
  address = {Florence},
  year = {2019},
}

@PhdThesis{Hermann:14,
  author = {Hermann, Karl Moritz},
  title = {Distributed Representations for Compositional Semantics},
  school = {University of Oxford},
  year = {2014},
}

@incollection{chiarcos2021embeddings,
  author = {Chiarcos, Christian and Declerck, Thierry and Ionov, Maxim},
  booktitle = {{Proceedings of the 6th Workshop on {Semantic Deep Learning} (SemDeep-6)}},
  editor = {Luis Espinosa-Anke and Dagmar Gromann and Thierry Declerck and Anna Breit and Jose Camacho-Collados and Mohammad Taher Pilehvar and Artem Revenko},
  title = {Embeddings for the Lexicon: {Modelling} and Representation},
  pages = {13--19},
  year = {2021},
}

@Article{fellbaum2005,
  author = {Fellbaum, Christiane and Geyken, Alexander},
  title = {{Transforming a corpus into a lexical resource: The Berlin Idiom Project}},
  doi = {10.3917/rfla.102.62},
  number = {2},
  pages = {49--62},
  volume = {10},
  journal = {Revue
française de linguistique appliquée},
  year = {2005},
}

@incollection{pedersen1998dependent,
  author = {Pedersen, Ted},
  booktitle = {{Proceedings of the 10th Conference on Innovative Applications of Artificial Intelligence (IAAI 1998)}},
  title = {Dependent Bigram Identification},
  location = {Madison, WI},
  publisher = {AAAI},
  year = {1998},
}

@incollection{Kovarikova:Kovarik:2019,
  author = {Kováříková, Dominika and Kovářík, Oleg},
  booktitle = {{Computational and corpus-based phraseology (EUROPHRAS 2019)}},
  title = {Automatic Identification of Academic Phrases for {Czech}},
  doi = {10.1007/978-3-030-30135-4_17},
  editor = {Corpas Pastor, Gloria and Mitkov, Ruslan},
  number = {11755},
  series = {Lecture Notes in Computer Science},
  publisher = {Springer},
  location = {Cham},
  year = {2019},
}

@Book{hpsg-1,
  author = {Carl Pollard and Ivan A. Sag},
  title = {Information-based syntax and semantics},
  volume = {1: {Fundamentals}},
  publisher = {CSLI Publications},
  address = {Stanford},
  year = {1987},
}

@Book{hpsg-2,
  author = {Carl Pollard and Ivan A.
Sag},
  title = {{Head-Driven Phrase Structure Grammar}},
  publisher = {University of Chicago Press},
  address = {Chicago},
  year = {1994},
}

@Article{Hnatkova:2002,
  author = {Hnátková, Milena},
  title = {{Značkování frazémů a idiomů v Českém národním korpusu s pomocí Slovníku české frazeologie a idiomatiky}},
  number = {2},
  pages = {117--126},
  url = {http://sas.ujc.cas.cz/archiv.php?art=4064},
  volume = {63},
  journal = {Slovo a Slovesnost},
  year = {2002},
}

@Article{boers2006formulaic,
  author = {Boers, Frank and Eyckmans, June and Kappel, Jenny and Stengers, Hélène and Demecheleer, Murielle},
  title = {Formulaic sequences and perceived oral proficiency: {Putting} a lexical approach to the test},
  number = {3},
  pages = {245--261},
  volume = {10},
  journal = {Language Teaching Research},
  publisher = {Sage Publications},
  address = {Thousand Oaks, CA},
  year = {2006},
}

@incollection{lion-bouton-etal-2023-mwe,
  author = {Lion-Bouton, Adam and Savary, Agata and Antoine, Jean-Yves},
  booktitle = {Proceedings of the 19th Workshop on Multiword Expressions ({MWE} 2023)},
  title = {A {MWE} lexicon formalism optimised for observational adequacy},
  editor = {Bhatia, Archna and Evang, Kilian and Garcia, Marcos and Giouli, Voula and Han, Lifeng and Taslimipoor, Shiva},
  pages = {121--130},
  publisher = {Association for Computational Linguistics},
  url = {https://aclanthology.org/2023.mwe-1.16},
  address = {Dubrovnik, Croatia},
  year = {2023},
}

@Book{Coulmas:ed:1981,
  title = {{Conversational routine: Explorations in standardized communication situations and prepatterned speech}},
  editor = {Coulmas, Florian},
  publisher = {Mouton},
  address = {The Hague},
  year = {1981},
}

@Book{wray2002formulaic,
  author = {Wray, Alison},
  title = {Formulaic language and the lexicon},
  publisher = {Cambridge University Press},
  address = {Cambridge, UK},
  year = {2002},
}

@incollection{savary_etal_2023,
  author = {Savary, Agata and Ben Khelil, Cherifa and Ramisch, Carlos and Giouli, Voula and Barbu Mititelu, Verginica and Hadj
Mohamed, Najet and Krstev, Cvetana and Liebeskind, Chaya and Xu, Hongzhi and Stymne, Sara and Güngör, Tunga and Pickard, Thomas and Guillaume, Bruno and Bejček, Eduard and Bhatia, Archna and Candito, Marie and Gantar, Polona and Iñurrieta, Uxoa and Gatt, Albert and Kovalevskaite, Jolanta and Lichte, Timm and Ljubešić, Nikola and Monti, Johanna and Parra Escartín, Carla and Shamsfard, Mehrnoush and Stoyanova, Ivelina and Vincze, Veronika and Walsh, Abigail},
  booktitle = {Proceedings of the 19th {Workshop} on {Multiword} {Expressions} ({MWE} 2023)},
  title = {{PARSEME} corpus release 1.3},
  pages = {24--35},
  publisher = {Association for Computational Linguistics},
  url = {https://aclanthology.org/2023.mwe-1.6},
  address = {Dubrovnik, Croatia},
  ids = {savary-etal-2023-parseme},
  year = {2023},
}

% NOTE(review): the issue number below was stored as 23; it is read here
% as the double issue 2--3 of volume 10. Confirm against the journal.
@Article{Harris:54,
  author = {Zellig Harris},
  title = {Distributional Structure},
  number = {2--3},
  pages = {146--162},
  volume = {10},
  journal = {Word},
  year = {1954},
}

@Book{lyons,
  author = {Lyons, John},
  title = {Semantics},
  doi = {10.1017/CBO9781139165693},
  publisher = {Cambridge University Press},
  volume = {1},
  address = {Cambridge},
  year = {1977},
}

@incollection{manfredstella,
  author = {Sailer, Manfred and Markantonatou, Stella},
  booktitle = {{Posters from the PARSEME 6th general meeting, 7–8 April 2016, Struga, North Macedonia}},
  title = {{Affectees in MWEs: German and Modern Greek}},
  url = {https://typo.uni-konstanz.de/parseme/images/Meeting/2016-04-07-Struga-meeting/WG1-MARKANTONATOU-SAILER-poster-1.pdf},
  year = {2016},
}

@incollection{chiarcos2022modelling,
  author = {Chiarcos, Christian and Apostol, Elena-Simona and Kabashi, Besim and Truică, Ciprian-Octavian},
  booktitle = {{Proceedings of the 29th International Conference on Computational Linguistics}},
  title = {Modelling Frequency, Attestation, and Corpus-Based Information with {OntoLex-FrAC}},
  pages = {4018--4027},
  year = {2022},
}

@incollection{Cholakov_Kordoni:14,
  author = {Kostadin Cholakov and Valia Kordoni},
  booktitle
= {Proceedings of the Conference on {Empirical Methods in Natural Language Processing}},
  title = {Better Statistical Machine Translation through Linguistic Treatment of Phrasal Verbs},
  pages = {196--201},
  address = {Doha, Qatar},
  year = {2014},
}

@Article{kipper_etal_2008,
  author = {Kipper, Karin and Korhonen, Anna and Ryant, Neville and Palmer, Martha},
  title = {A large-scale classification of {English} verbs},
  number = {1},
  pages = {21--40},
  volume = {42},
  journal = {Language Resources and Evaluation},
  year = {2008},
}

@TechReport{Hoekstra:etal:2003,
  author = {Heleen Hoekstra and Michael Moortgat and Bram Renmans and Machteld Schouppe and Ineke Schuurman and Ton van der Wouden},
  institution = {Utrecht University},
  title = {{CGN} {Syntactische} {Annotatie}},
  type = {{CGN} report},
  url = {http://lands.let.kun.nl/cgn/doc_Dutch/topics/version_1.0/annot/syntax/syn_prot.pdf},
  address = {Utrecht, the Netherlands},
  year = {2003},
}

@Article{Ellis:02,
  author = {Nick C. Ellis},
  title = {Frequency Effects in Language Processing: {A} Review with Implications for Theories of Implicit and Explicit Language Acquisition},
  number = {2},
  pages = {143--188},
  volume = {24},
  journal = {Studies in Second Language Acquisition},
  year = {2002},
}

@Article{cimiano2011lexinfo,
  author = {Cimiano, Philipp and Buitelaar, Paul and McCrae, John Philip and Sintek, Michael},
  title = {{LexInfo: A declarative model for the lexicon-ontology interface}},
  number = {1},
  pages = {29--51},
  volume = {9},
  journal = {Journal of Web Semantics},
  publisher = {Elsevier},
  year = {2011},
}

@incollection{DolbeyES06,
  author = {Andrew Dolbey and Michael Ellsworth and Jan Scheffczyk},
  booktitle = {{Formal} Biomedical Knowledge Representation: {Proceedings} of the Second International Workshop on {Formal} {Biomedical} {Knowledge} {Representation} ({KR-MED} 2006), Collocated with the 4th {International} {Conference} on {Formal} {Ontology} in {Information} {Systems} ({FOIS}-2006)},
  title = {{BioFrameNet}: {A}
Domain-Specific {FrameNet} Extension with Links to Biomedical Ontologies},
  editor = {Olivier Bodenreider},
  location = {{Baltimore}},
  publisher = {CEUR},
  series = {{CEUR} {Workshop} {Proceedings}},
  number = {222},
  year = {2006},
}

@incollection{Salehi/Cook:13,
  author = {Bahar Salehi and Paul Cook},
  booktitle = {Proceedings of the 2nd Joint Conference on Lexical and Computational Semantics},
  title = {Predicting the Compositionality of Multiword Expressions Using Translations in Multiple Languages},
  pages = {266--275},
  address = {Atlanta, GA},
  year = {2013},
}

@incollection{borin2016sparv,
  author = {Borin, Lars and Forsberg, Markus and Hammarstedt, Martin and Rosén, Dan and Schäfer, Roland and Schumacher, Anne},
  booktitle = {The Sixth {Swedish} Language Technology Conference ({SLTC})},
  title = {{Sparv: Språkbanken’s corpus annotation pipeline infrastructure}},
  address = {Umeå University},
  year = {2016},
}

@Book{Butterworth-vol:83,
  title = {Language Production},
  editor = {Brian Butterworth},
  publisher = {Academic Press},
  address = {London},
  year = {1983},
}