[{"id":362238,"last_updated":"2024-01-16 16:10:37","id_people":485252,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"An interface for linking ancient languages","year":2024,"authors_people":"Michele Mallia, Michela Bandini, Valeria Quochi","authors_cnr":["Mallia, Michele","Bandini, Michela","Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":[""],"authors":["Mallia, M.","Bandini, M.","Quochi, V."],"abstract":"The paper focuses on the linking potentials offered by the EpiLexO web-based front-end for the creation and editing of an ecosystem of digital resources for ancient languages, developed in the context of a project on the languages of fragmentary attestation of ancient Italy. The focus is particularly on mechanisms introduced for linking lexical information to other information bits either internally or externally, e.g. for creating attestations by linking lexical forms to their variants in relevant inscriptions, as well as for linking lexical data to external independent LOD datasets available on a remote endpoint. Finally, in the conclusions, we briefly introduce some future planned or desired enhancements as well as the final platform component, a parallel interface that constitutes the fruition application, which will be open to anyone on the web and will allow for browsing, searching, cross-querying and visualising the created set of interlinked resources.","keywords":["eLexicography","Ancient languages","Linguistic Linked Open Data","Digital historical linguistics"],"pages":"1-12","url":"https:\/\/publications.cnr.it\/doc\/485252","volume":"","doi":"","editors_people":"Kiril Simov and Petya Osenova","editors":["Simov, K.","Osenova, P."],"published":"Proceedings of the CLaDA-BG 2023 Conference: Language Technologies and Digital Humanities: Resources and Applications (LTaDH-RA), Sofia, Bulgaria, 10-12 May 2023","publisher":"CEUR-WS. 
org (Aachen, DEU)","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":366734,"last_updated":"2024-01-11 08:33:24","id_people":491319,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"EpiLexO-User Manual","year":2024,"authors_people":"Michela Bandini Valeria Quochi","authors_cnr":["Bandini, Michela","Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":[""],"authors":["Bandini, M.","Quochi, V."],"abstract":"This document contains a user manual for EpiLexO, a specialized web platform designed for the creation and editing of lexical resources, associated evidence, references, and relevant bibliography of fragmentary languages of ancient Italy such as Oscan, Faliscan, and Venetic in the context of the project: Languages and Cultures of Ancient Italy. Historical Linguistics and Digital Models (PRIN 2017XJLE8J). The platform, a single-page web application, includes several sections, each of which provides functionality for generating or editing lexical resources and establishing connections and links between their elements and different sets of internal and external resources. This User Manual aims to help users understand the interface by illustrating its functions with step-by-step instructions, examples, and troubleshooting guidance. 
Its target audience includes historical linguists, digital humanists and epigraphists whose research is based on linguistics and philology.","keywords":["Digital Epigraphy","Restsprachen","Lexicon Linking","Ancient Languages","eLexicography","User Manual","Interface"],"pages":"1-77","url":"https:\/\/doi.org\/10.5281\/zenodo.10475219","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":360065,"last_updated":"2023-08-09 13:04:35","id_people":485254,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Describing Inscriptions of Ancient Italy. The ItAnt Project and Its Information Encoding Process","year":2023,"authors_people":"Francesca Murano; Valeria Quochi; Angelo Mario Del Grosso; Luca Rigobianco; Mariarosaria Zinzi","authors_cnr":["Quochi, Valeria","Del Grosso, Angelo Mario"],"authors_cnr_id":["11893","17769"],"authors_cnr_institute":[""],"authors":["Murano, F.","Quochi, V.","Del Grosso, A. M.","Rigobianco, L.","Zinzi, M."],"abstract":"This paper discusses the challenges addressed in the digital scholarly encoding of the fragmentary texts of the languages of Ancient Italy according to the TEI\/EpiDoc Guidelines in XML format. This contribution describes the solutions and customisations that have been adopted for dealing with the peculiarities of our epigraphical documentation and with the formalisation of epigraphical information deemed interesting for data retrieval in a historical linguistic perspective. The making of a digital corpus consisting of new critical editions of selected inscriptions is a work carried out in the context of the project \"Languages and Cultures of Ancient Italy. 
Historical Linguistics and Digital Models\", which aims to investigate the languages of Ancient Italy by combining the traditional methods, proper to historical linguistics, with methods and technologies proper to the digital humanities and computational lexicography. More specifically, the purpose of the project is to create a collection of interrelated digital language resources which comprise: 1) the digital corpus of texts editions; 2) a computational lexicon compliant with the Web Semantic requirements; 3) a relevant bibliographic reference dataset encoded according to the FRBRoo\/LRMoo specifications. Additionally, selected textual data and scientific interpretations will be encoded by using CIDOC CRM and its extensions, namely CRMtex and CRMinf. The present contribution tackles one of the main aspects of the project, and proposes significant innovations in the encoding of critical editions for epigraphic texts of fragmentary languages, which will hopefully foster future interoperability and integration with other external datasets, a paramount concern of the project.","keywords":["text encoding","ancient languages","digital epigraphy","TEI\/EpiDoc"],"pages":"15","url":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3606703","volume":"16","doi":"10.1145\/3606703","editors_people":"","editors":[""],"published":"Journal on computing and cultural heritage (Online)","publisher":"Association for Computing Machinery (New York, NY, Stati Uniti d'America)","issn":"1556-4711","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":340477,"last_updated":"2023-07-07 11:25:29","id_people":469112,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Italian Language Resources. From CLARIN-IT to the VLO and Back: Sketching a Methodology for Monitoring LRs Visibility","year":2022,"authors_people":"Dario Del Fante, Francesca Frontini. 
Monica Monachini, Valeria Quochi","authors_cnr":["Del Fante, Dario","Monachini, Monica","Quochi, Valeria","Frontini, Francesca"],"authors_cnr_id":["8945","11893","15911"],"authors_cnr_institute":[""],"authors":["Del Fante, D.","Frontini, F.","Monachini, M.","Quochi, V."],"abstract":"This paper sketches a user-oriented, qualitative methodology for both (i) monitoring the existence and availability of language resources relevant for a given CLARIN national community and language and (ii) assessing the offering potential of CLARIN, in terms of Language Resources provided to national consortia. From the user perspective, the methodology has been applied to investigate the visibility of language resources available for Italian within the CLARIN central services, in particular the Virtual Language Observatory. As a proof-of-concept, the methodology has been tested on the resources available through the CLARIN-IT data centres, but, ideally, it could be applied by any national data centre aiming to assess the existence of LRs in CLARIN for any given languages and check their accessibility for the interested users. 
It is thus argued that such an assessment might be a useful instrument in the hands of national coordinators and centre managers for (i) bringing to the fore both strengths and critical issues about their data providing community and (ii) for planning targeted actions to improve and increase both visibility and accessibility of their LRs.","keywords":["Virtual Language Observatory","CLARIN-IT","CLARIN-ERIC","Qualitative Assessment Methodology","User Involvement"],"pages":"10-22","url":"https:\/\/ecp.ep.liu.se\/index.php\/clarin\/article\/view\/413\/371","volume":"","doi":"10.3384\/9789179294441","editors_people":"Monachini, Monica and Eskevich, Maria","editors":["Monachini","Monica","Eskevich","Maria"],"published":"Selected Papers from the CLARIN Annual Conference 2021","publisher":"","issn":"","isbn":"978-91-7929-444-1","conference_name":"","conference_place":"","conference_date":""},{"id":343148,"last_updated":"2022-10-21 15:19:30","id_people":472294,"institutes":["ILC","IGSG"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Making Italian Parliamentary Records Machine-Actionable: the Construction of the ParlaMint-IT corpus","year":2022,"authors_people":"Tommaso Agnoloni, Roberto Bartolini, Francesca Frontini, Simonetta Montemagni, Carlo Marchetti, Valeria Quochi, Manuela Ruisi, Giulia Venturi","authors_cnr":["Montemagni, Simonetta","Bartolini, Roberto","Agnoloni, Tommaso","Quochi, Valeria","Frontini, Francesca","Venturi, Giulia"],"authors_cnr_id":["5595","10441","11403","11893","15911","17692"],"authors_cnr_institute":[""],"authors":["Agnoloni, T.","Bartolini, R.","Frontini, F.","Montemagni, S.","Marchetti, C.","Quochi, V.","Ruisi, M.","Venturi, G."],"abstract":"This paper describes the process of acquisition, cleaning, interpretation, coding and linguistic annotation of a collection of parliamentary debates from the Senate of the Italian Republic covering the COVID-19 pandemic emergency period and a former period for 
reference and comparison according to the CLARIN ParlaMint prescriptions. The corpus contains 1199 sessions and 79,373 speeches for a total of about 31 million words, and was encoded according to the ParlaCLARIN TEI XML format. It includes extensive metadata about the speakers, sessions, political parties and parliamentary groups. As required by the ParlaMint initiative, the corpus was also linguistically annotated for sentences, tokens, POS tags, lemmas and dependency syntax according to the universal dependencies guidelines. Named entity annotation and classification is also included. All linguistic annotation was performed automatically using state-of-the-art NLP technology with no manual revision. The Italian dataset is freely available as part of the larger ParlaMint 2.1 corpus deposited and archived in CLARIN repository together with all other national corpora. It is also available for direct analysis and inspection via various CLARIN services and has already been used both for research and educational purposes.","keywords":["parliamentary debates","CLARIN ParlaMint","corpus creation","corpus annotation"],"pages":"117-124","url":"https:\/\/aclanthology.org\/2022.parlaclarin-1.17\/","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"","conference_name":"Workshop ParlaCLARIN III within the 13th Language Resources and Evaluation Conference","conference_place":"Marseille, France","conference_date":"20\/06\/2022"},{"id":340372,"last_updated":"2022-10-18 23:27:09","id_people":468964,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"CLARIN-IT: An Overview on the Italian Clarin Consortium After Six Years of Activity","year":2022,"authors_people":"Dario Del Fante, Francesca Frontini, Monica Monachini, Valeria Quochi","authors_cnr":["Del Fante, Dario","Monachini, Monica","Quochi, Valeria","Frontini, 
Francesca"],"authors_cnr_id":["8945","11893","15911"],"authors_cnr_institute":[""],"authors":["Del Fante, D.","Frontini, F.","Monachini, M.","Quochi, V."],"abstract":"This paper offers an overview of the Italian CLARIN consortium after six years since its establishment. The members, the centres and the repositories and the most important collections are described. Lastly, in order to showcase the visibility and the accessibility of Language Resources provided by CLARIN-IT from a user-perspective, we show how Italian resources are findable within CLARIN ERIC.","keywords":["Language Resources","Data Repositories and Archives","Research Infrastructures","CLARIN"],"pages":"8","url":"http:\/\/ceur-ws.org\/Vol-3160\/short21.pdf","volume":"","doi":"","editors_people":"Giorgio Maria Di Nunzio, Beatrice Portelli, Domenico Redavid, Gianmaria Silvello","editors":["Di Nunzio, G. M.","Portelli, B.","Redavid, D.","Silvello, G."],"published":"Proceedings of the 18th Italian Research Conference on Digital Libraries","publisher":"CEUR-WS. 
org (Aachen, DEU)","issn":"1613-0073","isbn":"","conference_name":"Italian Research Conference on Digital Libraries","conference_place":"Universit\u00e0 degli Studi di Padova","conference_date":"24\/02\/2022"},{"id":343201,"last_updated":"2023-07-10 10:33:07","id_people":472419,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"From Inscriptions to Lexica and Back: A Platform for Editing and Linking the Languages of Ancient Italy","year":2022,"authors_people":"Valeria Quochi, Andrea Bellandi, Fahad Khan, Michele Mallia, Francesca Murano, Silvia Piccini, Luca Rigobianco, Alessandro Tommasi, Cesare Zavattari","authors_cnr":["Mallia, Michele","Zavattari, Cesare","Quochi, Valeria","Bellandi, Andrea","Piccini, Silvia","Khan, Anas Fahad Aslam"],"authors_cnr_id":["11893","17627","17738","18790"],"authors_cnr_institute":[""],"authors":["Quochi, V.","Bellandi, A.","Khan, F.","Mallia, M.","Murano, F.","Piccini, S.","Rigobianco, L.","Tommasi, A.","Zavattari, C."],"abstract":"Available language technology is hardly applicable to scarcely attested ancient languages, yet their digital semantic representation, though challenging, is an asset for the purpose of sharing and preserving existing cultural knowledge. In the context of a project on the languages and cultures of ancient Italy, we took up this challenge. This paper thus describes the development of a user friendly web platform, EpiLexO, for the creation and editing of an integrated system of language resources for ancient fragmentary languages centered on the lexicon, in compliance with current digital humanities and Linked Open Data principles. EpiLexo allows for the editing of lexica with all relevant cross-references: for their linking to their testimonies, as well as to bibliographic information and other (external) resources and common vocabularies. 
The focus of the current implementation is on the languages of ancient Italy, in particular Oscan, Faliscan, Celtic and Venetic; however, the technological solutions are designed to be general enough to be potentially applicable to different contexts and scenarios.","keywords":["Digital Epigraphy","Restsprachen","Lexicon Editing and Linking","tools for DH"],"pages":"59-67","url":"https:\/\/aclanthology.org\/2022.lt4hala-1.0\/","volume":"","doi":"","editors_people":"Sprugnoli, Rachele; Passarotti, Marco","editors":["Sprugnoli, R.","Passarotti, M."],"published":"Proceedings of the Second Workshop on Language Technologies for Historical and Ancient Languages (LT4HALA 2022)","publisher":"European language resources association (ELRA) (Paris, FRA)","issn":"","isbn":"979-10-95546-78-8","conference_name":"Second Workshop on Language Technologies for Historical and Ancient Languages (LT4HALA 2022)","conference_place":"Marseille, France","conference_date":"25\/06\/2022"},{"id":343203,"last_updated":"2023-07-10 09:45:37","id_people":472422,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Supporting Ancient Historical Linguistics and Cultural Studies with EpiLexO","year":2022,"authors_people":"Valeria Quochi, Andrea Bellandi, Michele Mallia, Alessandro Tommasi and Cesare Zavattari","authors_cnr":["Mallia, Michele","Zavattari, Cesare","Quochi, Valeria","Bellandi, Andrea"],"authors_cnr_id":["11893","17627"],"authors_cnr_institute":[""],"authors":["Quochi, V.","Bellandi, A.","Mallia, M.","Tommasi, A.","Zavattari, C."],"abstract":"This contribution presents a system of independent software components meant to support the creation of ecosystems of interrelated language data (i.e. lexica linked to textual testimonies, concepts, metadata, bibliographic references, and other external lexical resources) according to the current state-of-the-art representational models for the semantic web. 
The system is implemented as a set of autonomous servers exposing Restful APIs that in principle can serve different frontend applications and use cases. In this work they serve the EpiLexO GUI application designed and geared to support scholars of ancient languages of fragmentary attestation in their studies. The development of both the back-ends and the front-end is still work-in progress, but a first version is ready for use.","keywords":["tools for DH","ancient languages","restsprachen","lexicon editor","corpus management","lexicon-text linking"],"pages":"39-43","url":"https:\/\/office.clarin.eu\/v\/CE-2022-2118-CLARIN2022_ConferenceProceedings.pdf","volume":"ISSN 2773-2177","doi":"","editors_people":"Erjavec, T.; Eskevich, M","editors":["Erjavec, T.","Eskevich, M."],"published":"CLARIN Annual Conference Proceedings 2022","publisher":"","issn":"","isbn":"","conference_name":"CLARIN Annual Conference 2022","conference_place":"Prague, Czechia","conference_date":"10-12\/10\/2022"},{"id":355806,"last_updated":"2023-07-12 11:52:47","id_people":479194,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Challenges in Encoding Fragmentary Attested Languages","year":2022,"authors_people":"Anna Marinetti; Francesca Murano; Valeria Quochi; Monica Ballerini, Federico Boschetti, Angelo Mario Del Grosso, Silvia Piccini, Luca Rigobianco, Patrizia Solinas, Mariarosaria Zinzi; Michele Mallia; Edoardo Middei","authors_cnr":["Mallia, Michele","Quochi, Valeria","Boschetti, Federico","Piccini, Silvia","Del Grosso, Angelo Mario"],"authors_cnr_id":["11893","14630","17738","17769"],"authors_cnr_institute":[""],"authors":["Marinetti, A.","Murano, F.","Quochi, V.","Ballerini, M.","Boschetti, F.","Del Grosso, A. 
M.","Piccini, S.","Rigobianco, L.","Solinas, P.","Zinzi, M.","Mallia, M.","Middei, E."],"abstract":"The ItAnt project investigates the languages of ancient Italy, whose only attestation consists in epigraphic evidence, focusing on Venetic, Oscan, Faliscan and Celtic languages. For this purpose, the project combines the traditional method proper to historical linguistics with the setting up of digital technologies, developing computational tools specifically designed to create a digital set of interrelated resources.","keywords":["digital epigraphy","eLexicography","Linguistic Linked Open Data","Text Encoding"],"pages":"","url":"https:\/\/ciegl2022.sciencesconf.org\/resource\/page\/id\/30","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"XVI Congresso Internazionale di Epigrafia greca e latina","conference_place":"Bordeaux","conference_date":"29 agosto-settembre 2022"},{"id":343202,"last_updated":"2022-11-10 11:00:10","id_people":472421,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"D3. 
8 Lexical-semantic analytics for NLP","year":2022,"authors_people":"Federico Martelli, Marco Maru, Cesare Campagnano, Roberto Navigli, Paola Velardi, Rafael-J Ure\u00f1a-Ruiz, Francesca Frontini, Valeria Quochi, Jelena Kallas, Kristina Koppel, Margit Langemets, Jesse de Does, Rob Tempelaars, Carole Tiberius, Rute Costa, Ana Salgado, Simon Krek, Jaka \u010cibej, Kaja Dobrovoljc, Polona Gantar, Tina Munda","authors_cnr":["Quochi, Valeria","Frontini, Francesca"],"authors_cnr_id":["11893","15911"],"authors_cnr_institute":[""],"authors":["Martelli, F.","Maru, M.","Campagnano, C.","Navigli, R.","Velardi, P.","Ure\u00f1a Ruiz, R.","Frontini, F.","Quochi, V.","Kallas, J.","Koppel, K.","Langemets, M.","De Does, J.","Tempelaars, R.","Tiberius, C.","Costa, R.","Salgado, A.","Krek, S.","\u010cibej, J.","Dobrovoljc, K.","Gantar, P.","Munda, T."],"abstract":"The present document illustrates the work carried out in task 3.3 (work package 3) focused on lexical-semantic analytics for Natural Language Processing (NLP). This task aims at computing analytics for lexical-semantic information such as words, senses and domains in the available resources, investigating their role in NLP applications. Specifically, this task concentrates on three research directions, namely i) sense clustering, in which grouping senses based on their semantic similarity improves the performance of NLP tasks such as Word Sense Disambiguation (WSD), ii) domain labeling of text, in which the lexicographic resources made available by the ELEXIS project for research purposes allow better performances to be achieved, and finally iii) analysing the diachronic distribution of senses, for which a software package is made available. In this deliverable, we illustrate the research activities aimed at achieving the aforementioned goals and put forward suggestions for future works. 
Importantly, we stress the crucial role played by high-quality lexical-semantic resources when investigating such linguistic aspects and their impact on NLP applications. To this end, as an additional contribution, we address the paucity of manually annotated data in the lexical-semantic research field and introduce the ELEXIS parallel sense-annotated dataset, a novel entirely manually annotated dataset available in 10 European languages and featuring 5 annotation layers.","keywords":["research infrastructures","lexicography","lexical resources","word-sense disambiguation","WSD","sense-annotated language data","multilinguality"],"pages":"67","url":"https:\/\/elex.is\/wp-content\/uploads\/ELEXIS_D3_8_Lexical-Semantic_Analytics_for_NLP_final_report.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132494,"last_updated":"2022-05-05 11:42:29","id_people":463877,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"D5.3 Overview of Online Tutorials and Instruction Manuals","year":2022,"authors_people":"Toma Tasovac, Carole Tiberius, Claudia Bamberg, Andrea Bellandi, Thomas Burch, Rute Costa, Matej \u010eur\u010do, Francesca Frontini, Julia Hennemann, Kris Heylen, Milo\u0161 Jakub\u00ed\u010dek, Fahad Khan, Anne Klee, Iztok Kosem, Vojt\u011bch Kov\u00e1\u0159, Ond\u0159ej Matu\u0161ka, John McCrae, Monica Monachini, Karlheinz M\u00f6rth, Tina Munda, Valeria Quochi, Andra\u017e 
Repar, Christophe Roche, Ana Salgado, Henrike Sievers, Tam\u00e1s V\u00e1radi, Sandra Weyand, Anna Woldrich, Susanne Zhanial","authors_cnr":["Monachini, Monica","Quochi, Valeria","Frontini, Francesca","Bellandi, Andrea","Khan, Anas Fahad Aslam"],"authors_cnr_id":["8945","11893","15911","17627","18790"],"authors_cnr_institute":[""],"authors":["Tasovac, T.","Tiberius, C.","Bamberg, C.","Bellandi, A.","Burch, T.","Costa, R.","\u010eur\u010do, M.","Frontini, F.","Hennemann, J.","Heylen, K.","Jakub\u00ed\u010dek, M.","Khan, F.","Klee, A.","Kosem, I.","Kov\u00e1\u0159, V.","Matu\u0161ka, O.","McCrae, J.","Monachini, M.","M\u00f6rth, K.","Munda, T.","Quochi, V.","Repar, A.","Roche, C.","Salgado, A.","Sievers, H.","V\u00e1radi, T.","Weyand, S.","Woldrich, A.","Zhanial, S."],"abstract":"The ELEXIS Curriculum is an integrated set of training materials which contextualizes ELEXIS tools and services inside a broader, systematic pedagogic narrative. This means that the goal of the ELEXIS Curriculum is not simply to inform users about the functionalities of particular tools and services developed within the project, but to show how such tools and services are a) embedded in both lexicographic theory and practice; and b) representative of and contributing to the development of digital skills among lexicographers. The scope and rationale of the curriculum are described in more detail in the Deliverable D5.2 Guidelines for Producing ELEXIS Tutorials and Instruction Manuals. 
The goal of this deliverable, as stated in the project DOW, is to provide \"a clear, structured overview of tutorials and instruction manuals developed within the project.\"","keywords":["ELEXIS","lexicography","training materials"],"pages":"31","url":"https:\/\/elex.is\/wp-content\/uploads\/ELEXIS_D5_3_Overview-of-Online-Tutorials-and-Instruction-Manuals.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132483,"last_updated":"2022-07-29 11:50:57","id_people":463506,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"CLARIN Tools and Resources for Lexicographic Work","year":2022,"authors_people":"Francesca Frontini Andrea Bellandi Valeria Quochi Monica Monachini Karlheinz M\u00f6rth Susanne Zhanial Matej \u010eur\u010do Anna Woldrich","authors_cnr":["Quochi, Valeria","Monachini, Monica","Frontini, Francesca","Bellandi, Andrea"],"authors_cnr_id":["8945","15911","17627"],"authors_cnr_institute":[""],"authors":["Frontini, F.","Bellandi, A.","Quochi, V.","Monachini, M.","M\u00f6rth, K.","Zhanial, S.","\u010eur\u010do, M.","Woldrich, A."],"abstract":"This course introduces lexicographers to the CLARIN Research Infrastructure and highlights language resources and tools useful for lexicographic practices. The course consists of two parts. In Part 1, you will learn about CLARIN, its technical and knowledge infrastructure, and about how to deposit and find lexical resources in CLARIN. 
In Part 2, you will become acquainted with CLARIN tools that can be used to create lexical resources.","keywords":["CLARIN","lexicography"],"pages":"","url":"https:\/\/elexis.humanistika.org\/id\/UnwYPq70Dewbn7XDEjsMM","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":343122,"last_updated":"2022-10-20 17:20:56","id_people":472295,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Parallel sense-annotated corpus ELEXIS-WSD 1.0","year":2022,"authors_people":"Federico Martelli, Roberto Navigli, Simon Krek, Jelena Kallas, Polona Gantar, Svetla Koeva, Sanni Nimb, Bolette Sandford Pedersen, Sussi Olsen, Margit Langemets, Kristina Koppel, Tiiu \u00dcksik, Kaja Dobrovoljc, Rafael Ure\u00f1a-Ruiz, Jos\u00e9-Luis Sancho-S\u00e1nchez, Veronika Lipp, Tam\u00e1s V\u00e1radi, Andr\u00e1s Gy\u0151rffy, Simon L\u00e1szl\u00f3, Valeria Quochi, Monica Monachini, Francesca Frontini, Carole Tiberius, Rob Tempelaars, Rute Costa, Ana Salgado, Jaka \u010cibej, Tina Munda","authors_cnr":["Monachini, Monica","Quochi, Valeria","Frontini, Francesca"],"authors_cnr_id":["8945","11893","15911"],"authors_cnr_institute":[""],"authors":["Martelli, F.","Navigli, R.","Krek, S.","Kallas, J.","Gantar, P.","Koeva, S.","Nimb, S.","Pedersen, B. S.","Olsen, S.","Langemets, M.","Koppel, K.","\u00dcksik, T.","Dobrovoljc, K.","Ure\u00f1a Ruiz, R.","Sancho S\u00e1nchez, J.","Lipp, V.","V\u00e1radi, T.","Gy\u0151rffy, A.","L\u00e1szl\u00f3, S.","Quochi, V.","Monachini, M.","Frontini, F.","Tiberius, C.","Tempelaars, R.","Costa, R.","Salgado, A.","\u010cibej, J.","Munda, T."],"abstract":"ELEXIS-WSD is a parallel sense-annotated corpus in which content words (nouns, adjectives, verbs, and adverbs) have been assigned senses. 
Version 1.0 contains sentences for 10 languages: Bulgarian, Danish, English, Spanish, Estonian, Hungarian, Italian, Dutch, Portuguese, and Slovene. The corpus was compiled by automatically extracting a set of sentences from WikiMatrix (Schwenk et al., 2019), a large open-access collection of parallel sentences derived from Wikipedia, using an automatic approach based on multilingual sentence embeddings. The sentences were manually validated according to specific formal, lexical and semantic criteria (e.g. by removing incorrect punctuation, morphological errors, notes in square brackets and etymological information typically provided in Wikipedia pages). To obtain a satisfying semantic coverage, sentences with fewer than 5 words and fewer than 2 polysemous words were filtered out. Subsequently, in order to obtain datasets in the other nine target languages, for each selected sentence in English, the corresponding WikiMatrix translation into each of the other languages was retrieved. If no translation was available, the English sentence was translated manually. 
The resulting corpus is comprised of 2,024 sentences for each language.","keywords":["Word Sense Disambiguation","corpus parallelo","disambiguazione automatica del senso","annotazione semantica multilingue"],"pages":"","url":"http:\/\/hdl.handle.net\/11356\/1674","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132488,"last_updated":"2022-02-11 06:36:56","id_people":463856,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"LexO editor: the basics-video tutorial","year":2022,"authors_people":"Valeria Quochi, Andrea Bellandi","authors_cnr":["Quochi, Valeria","Bellandi, Andrea"],"authors_cnr_id":["11893","17627"],"authors_cnr_institute":[""],"authors":["Quochi, V.","Bellandi, A."],"abstract":"Video tutorial sull'uso di LexO, un editor di lessici secondo il modello Ontolex-lemon. Il tutorial \u00e8 parte dell'ELEXIS training programme disponibile sulla piattaforma DARIAH-teach.","keywords":["lexicon editor","video tutorial","training material","lexO","online web application"],"pages":"","url":"https:\/\/www.youtube.com\/watch?v=9KE0laMaTAs&list=PLoD829qNERpYKq8JRkY4EIGgZCdi0QHOd","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132472,"last_updated":"2022-02-16 15:49:26","id_people":461705,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Designing the ELEXIS Parallel Sense-Annotated Dataset in 10 European Languages","year":2021,"authors_people":"Martelli, Federico and Navigli, Roberto and Krek, Simon and Tiberius, Carole and Kallas, Jelena and Gantar, Polona and Koeva, Svetla and Nimb, Sanni and Pedersen, Bolette Sandford and Olsen, Sussi and Langements, Margit and Koppel, Kristina and \u00dcksik, Tiiu and Dobrovolijc, Kaja and 
Ure\u00f1a-Ruiz, Rafael-J. and Sancho-S\u00e1nchez, Jos\u00e9-Luis and Lipp, Veronika and Varadi, Tamas and Gy\u0151rffy, Andr\u00e1s and L\u00e1szl\u00f3, Simon and Quochi, Valeria and Monachini, Monica and Frontini, Francesca and Tempelaars, Rob and Costa, Rute and Salgado, Ana and \u010cibej, Jaka and Munda, Tina","authors_cnr":["Monachini, Monica","Quochi, Valeria","Frontini, Francesca"],"authors_cnr_id":["8945","11893","15911"],"authors_cnr_institute":[""],"authors":["Martelli, F.","Navigli, R.","Krek, S.","Tiberius, C.","Kallas, J.","Gantar, P.","Koeva, S.","Nimb, S.","Pedersen, B. S.","Olsen, S.","Langements, M.","Koppel, K.","\u00dcksik, T.","Dobrovolijc, K.","Ure\u00f1a Ruiz, R.","Sancho S\u00e1nchez, J.","Lipp, V.","Varadi, T.","Gy\u0151rffy, A.","L\u00e1szl\u00f3, S.","Quochi, V.","Monachini, M.","Frontini, F.","Tempelaars, R.","Costa, R.","Salgado, A.","\u010cibej, J.","Munda, T."],"abstract":"Over the course of the last few years, lexicography has witnessed the burgeoning of increasingly reliable automatic approaches supporting the creation of lexicographic resources such as dictionaries, lexical knowledge bases and annotated datasets. In fact, recent achievements in the field of Natural Language Processing and particularly in Word Sense Disambiguation have widely demonstrated their effectiveness not only for the creation of lexicographic resources, but also for enabling a deeper analysis of lexical-semantic data both within and across languages. Nevertheless, we argue that the potential derived from the connections between the two fields is far from exhausted. In this work, we address a serious limitation affecting both lexicography and Word Sense Disambiguation, i.e. the lack of high-quality sense-annotated data and describe our efforts aimed at constructing a novel entirely manually annotated parallel dataset in 10 European languages. For the purposes of the present paper, we concentrate on the annotation of morpho-syntactic features. 
Finally, unlike many of the currently available sense-annotated datasets, we will annotate semantically by using senses derived from high-quality lexicographic repositories.","keywords":["Digital lexicography","Natural Language Processing","Computational Linguistics","Corpus Linguistics","Word Sense Disambiguation"],"pages":"377-396","url":"https:\/\/static-curis.ku.dk\/portal\/files\/279888836\/eLex_2021_22_pp377_395.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of the eLex 2021 conference","publisher":"","issn":"","isbn":"","conference_name":"eLex 2021","conference_place":"","conference_date":"05\/07\/2021-07\/07\/2021"},{"id":132468,"last_updated":"2022-06-08 16:07:54","id_people":461529,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Languages and Cultures of Ancient Italy. Historical Linguistics and Digital Models","year":2021,"authors_people":"A. Marinetti, F. Murano, V. Quochi, M. Ballerini, F. Boschetti, A.M. Del Grosso, S. Piccini, L. Rigobianco, P. Solinas","authors_cnr":["Quochi, Valeria","Boschetti, Federico","Piccini, Silvia","Del Grosso, Angelo Mario"],"authors_cnr_id":["11893","14630","17738","17769"],"authors_cnr_institute":[""],"authors":["Marinetti, A.","Murano, F.","Quochi, V.","Ballerini, M.","Boschetti, F.","Del Grosso, A. M.","Piccini, S.","Rigobianco, L.","Solinas, P."],"abstract":"The abstract accompanies a poster presenting an overview of the project \"Languages and cultures of Ancient Italy\", which had just started. The project brings together competences from Historical Linguistics, Computational Lexicography and Digital Humanities. The main objective of the project is to investigate the cultures of ancient Italy on the basis of their linguistic documentation (7th - 1st c. B.C.) 
by means of digital tools specifically tailored for their peculiarities.","keywords":["digital epigraphy","computational lexicons","text-lexicon linking","restsprachen","digital models","digital humanities"],"pages":"528-532","url":"https:\/\/aiucd2021.labcd.unipi.it\/en\/book-of-abstracts-conference\/","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"10th National Conference of Associazione per l'Informatica Umanistica e la Cultura Digitale","conference_place":"Pisa (Virtuale)","conference_date":"19-22 gennaio 2021"},{"id":132489,"last_updated":"2022-05-05 11:44:08","id_people":463861,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Linguistically annotated multilingual comparable corpora of parliamentary debates ParlaMint.ana 2.1","year":2021,"authors_people":"Toma\u017e Erjavec, Maciej Ogrodniczuk, Petya Osenova, Nikola Ljube\u0161i\u0107, Kiril Simov, Vladislava Grigorova, Micha\u0142 Rudolf, Andrej Pan\u010dur, Maty\u00e1\u0161 Kopp, Starka\u00f0ur Barkarson, Stein\u00feor Steingr\u00edmsson, Henk van der Pol, Griet Depoorter, Jesse de Does, Bart Jongejan, Dorte Haltrup Hansen, Costanza Navarretta, Mar\u00eda Calzada P\u00e9rez, Luciana D. de Macedo, Ruben van Heusden, Maarten Marx, \u00c7a\u011fr\u0131 
\u00c7\u00f6ltekin, Matthew Coole, Tommaso Agnoloni, Francesca Frontini, Simonetta Montemagni, Valeria Quochi, Giulia Venturi, Manuela Ruisi, Carlo Marchetti, Roberto Battistoni, Mikl\u00f3s Seb\u0151k, Orsolya Ring, Roberts Dar\u0123is, Andrius Utka, Mindaugas Petkevi\u010dius, Monika Briedien\u0117, Tomas Krilavi\u010dius, Vaidas Morkevi\u010dius, Roberto Bartolini, Andrea Cimino, Sascha Diwersy, Giancarlo Luxardo, Paul Rayson","authors_cnr":["Cimino, Andrea","Montemagni, Simonetta","Bartolini, Roberto","Agnoloni, Tommaso","Quochi, Valeria","Frontini, Francesca","Venturi, Giulia"],"authors_cnr_id":["5595","10441","11403","11893","15911","17692"],"authors_cnr_institute":[""],"authors":["Erjavec, T.","Ogrodniczuk, M.","Osenova, P.","Ljube\u0161i\u0107, N.","Simov, K.","Grigorova, V.","Rudolf, M.","Pan\u010dur, A.","Kopp, M.","Barkarson, S.","Steingr\u00edmsson, S.","Van Der Pol, H.","Depoorter, G.","De Does, J.","Jongejan, B.","Haltrup Hansen, D.","Navarretta, C.","Calzada P\u00e9rez, M.","De Macedo, L. D.","Van Heusden, R.","Marx, M.","\u00c7\u00f6ltekin, \u00c7.","Coole, M.","Agnoloni, T.","Frontini, F.","Montemagni, S.","Quochi, V.","Venturi, G.","Ruisi, M.","Marchetti, C.","Battistoni, R.","Seb\u0151k, M.","Ring, O.","Dar\u0123is, R.","Utka, A.","Petkevi\u010dius, M.","Briedien\u0117, M.","Krilavi\u010dius, T.","Morkevi\u010dius, V.","Diwersy, S.","Luxardo, G.","Rayson, P."],"abstract":"ParlaMint 2.1 is a multilingual set of 17 comparable corpora containing parliamentary debates mostly starting in 2015 and extending to mid-2020, with each corpus being about 20 million words in size. The sessions in the corpora are marked as belonging to the COVID-19 period (from November 1st 2019), or being \"reference\" (before that date). 
The corpora have extensive metadata, including aspects of the parliament; the speakers (name, gender, MP status, party affiliation, party coalition\/opposition); are structured into time-stamped terms, sessions and meetings; with speeches being marked by the speaker and their role (e.g. chair, regular speaker). The speeches also contain marked-up transcriber comments, such as gaps in the transcription, interruptions, applause, etc. Note that some corpora have further information, e.g. the year of birth of the speakers, links to their Wikipedia articles, their membership in various committees, etc. The corpora are encoded according to the Parla-CLARIN TEI recommendation (https:\/\/clarin-eric.github.io\/parla-clarin\/), but have been validated against the compatible, but much stricter ParlaMint schemas. This entry contains the linguistically marked-up version of the corpus, while the text version is available at http:\/\/hdl.handle.net\/11356\/1432. The ParlaMint.ana linguistic annotation includes tokenization, sentence segmentation, lemmatisation, Universal Dependencies part-of-speech, morphological features, and syntactic dependencies, and the 4-class CoNLL-2003 named entities. 
Some corpora also have further linguistic annotations, such as PoS tagging or named entities according to language-specific schemes, with their corpus TEI headers giving further details on the annotation vocabularies and tools.","keywords":["dibattiti parlamentari","covid-19","ParlaCLARIN","parlamenti","discorso politico","CLARIN","linguistic annotation","pos-tagging","ner","linguistic dependency annotation","UD"],"pages":"","url":"http:\/\/hdl.handle.net\/11356\/1431","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132490,"last_updated":"2022-05-05 11:44:28","id_people":463865,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Multilingual comparable corpora of parliamentary debates ParlaMint 2.1","year":2021,"authors_people":"Toma\u017e Erjavec, Maciej Ogrodniczuk, Petya Osenova, Nikola Ljube\u0161i\u0107, Kiril Simov, Vladislava Grigorova, Micha\u0142 Rudolf, Andrej Pan\u010dur, Maty\u00e1\u0161 Kopp, Starka\u00f0ur Barkarson, Stein\u00feor Steingr\u00edmsson, Henk van der Pol, Griet Depoorter, Jesse de Does, Bart Jongejan, Dorte Haltrup Hansen, Costanza Navarretta, Mar\u00eda Calzada P\u00e9rez, Luciana D. de Macedo, Ruben van Heusden, Maarten Marx, \u00c7a\u011fr\u0131 
\u00c7\u00f6ltekin, Matthew Coole, Tommaso Agnoloni, Francesca Frontini, Simonetta Montemagni, Valeria Quochi, Giulia Venturi, Manuela Ruisi, Carlo Marchetti, Roberto Battistoni, Mikl\u00f3s Seb\u0151k, Orsolya Ring, Roberts Dar\u0123is, Andrius Utka, Mindaugas Petkevi\u010dius, Monika Briedien\u0117, Tomas Krilavi\u010dius, Vaidas Morkevi\u010dius, Roberto Bartolini, Andrea Cimino, Sascha Diwersy, Giancarlo Luxardo, Paul Rayson","authors_cnr":["Montemagni, Simonetta","Agnoloni, Tommaso","Quochi, Valeria","Frontini, Francesca","Venturi, Giulia"],"authors_cnr_id":["5595","11403","11893","15911","17692"],"authors_cnr_institute":[""],"authors":["Erjavec, T.","Ogrodniczuk, M.","Osenova, P.","Ljube\u0161i\u0107, N.","Simov, K.","Grigorova, V.","Rudolf, M.","Pan\u010dur, A.","Kopp, M.","Barkarson, S.","Steingr\u00edmsson, S.","Van Der Pol, H.","Depoorter, G.","De Does, J.","Jongejan, B.","Haltrup Hansen, D.","Navarretta, C.","Calzada P\u00e9rez, M.","De Macedo, L. D.","Van Heusden, R.","Marx, M.","\u00c7\u00f6ltekin, \u00c7.","Coole, M.","Agnoloni, T.","Frontini, F.","Montemagni, S.","Quochi, V.","Venturi, G.","Ruisi, M.","Marchetti, C.","Battistoni, R.","Seb\u0151k, M.","Ring, O.","Dar\u0123is, R.","Utka, A.","Petkevi\u010dius, M.","Briedien\u0117, M.","Krilavi\u010dius, T.","Morkevi\u010dius, V.","Diwersy, S.","Luxardo, G.","Rayson, P."],"abstract":"ParlaMint 2.1 is a multilingual set of 17 comparable corpora containing parliamentary debates mostly starting in 2015 and extending to mid-2020, with each corpus being about 20 million words in size. The sessions in the corpora are marked as belonging to the COVID-19 period (after November 1st 2019), or being \"reference\" (before that date). The corpora have extensive metadata, including aspects of the parliament; the speakers (name, gender, MP status, party affiliation, party coalition\/opposition); are structured into time-stamped terms, sessions and meetings; with speeches being marked by the speaker and their role (e.g. 
chair, regular speaker). The speeches also contain marked-up transcriber comments, such as gaps in the transcription, interruptions, applause, etc. Note that some corpora have further information, e.g. the year of birth of the speakers, links to their Wikipedia articles, their membership in various committees, etc. The corpora are encoded according to the Parla-CLARIN TEI recommendation (https:\/\/clarin-eric.github.io\/parla-clarin\/), but have been validated against the compatible, but much stricter ParlaMint schemas. This entry contains the ParlaMint TEI-encoded corpora with the derived plain text version of the corpus along with TSV metadata on the speeches. Also included is the 2.0 release of the data and scripts available at the GitHub repository of the ParlaMint project. Note that there also exists the linguistically marked-up version of the corpus, which is available at http:\/\/hdl.handle.net\/11356\/1431.","keywords":["dibattiti parlamentari","covid-19","discorso politico","CLARIN","parlamenti","ParlaCLARIN"],"pages":"","url":"http:\/\/hdl.handle.net\/11356\/1432","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132444,"last_updated":"2022-02-16 15:50:32","id_people":453502,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Relazione di fine progetto \"PIM-Piattaforma Integrata Monitoraggio\"","year":2020,"authors_people":"Roberto Bartolini, Valeria Quochi, Monica Monachini, Fabio Aff\u00e9","authors_cnr":["Monachini, Monica","Bartolini, Roberto","Quochi, Valeria"],"authors_cnr_id":["8945","10441","11893"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Quochi, V.","Monachini, M.","Aff\u00e9, F."],"abstract":"Il documento presenta l'attivit\u00e0 svolta dal CNR-ILC nel ruolo di subcontraente di COMDATA per la realizzazione di moduli di trattamento automatico del linguaggio e la 
consulenza per l'integrazione di metodi di clustering automatico di documenti nella Digital Library del progetto PIM.","keywords":["accesso intelligente al testo","digital library","natural language processing"],"pages":"156","url":"https:\/\/publications.cnr.it\/doc\/453502","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132265,"last_updated":"2019-06-03 17:01:00","id_people":387361,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"CLARIN-IT: State of Affairs, Challenges and Opportunities","year":2018,"authors_people":"Lionel Nicolas, Alexander K\u00f6nig, Monica Monachini, Riccardo Del Gratta, Silvia Calamai, Andrea Abel, Alessandro Enea, Francesca Biliotti, Valeria Quochi, Francesco Vincenzo Stella","authors_cnr":["Enea, Alessandro","Monachini, Monica","Quochi, Valeria","Del Gratta, Riccardo"],"authors_cnr_id":["8533","8945","11893","11933"],"authors_cnr_institute":[""],"authors":["Nicolas, L.","K\u00f6nig, A.","Monachini, M.","Del Gratta, R.","Calamai, S.","Abel, A.","Enea, A.","Biliotti, F.","Quochi, V.","Stella, F. V."],"abstract":"This paper gives an overview on the Italian national CLARIN consortium as it currently stands two years after its creation at the end of 2015. It thus discusses the current state of affairs of the consortium on several aspects, especially with regards to members. It also discusses the events and initiatives that have been undertaken, as well as the ones that are planned in the close future. 
It finally outlines the conclusions of a user survey performed to understand the expectations of a targeted user population and provides indications regarding the next steps planned.","keywords":["CLARIN-IT Consortium Pisa Bolzano Siena"],"pages":"1-14","url":"http:\/\/www.ep.liu.se\/ecp\/contents.asp?issue=147","volume":"147","doi":"","editors_people":"","editors":[""],"published":"Selected papers from the CLARIN Annual Conference 2017, Budapest, 18-20 September 2017","publisher":"","issn":"","isbn":"978-91-7685-273-6","conference_name":"CLARIN Annual Conference 2017","conference_place":"Budapest, Hungary","conference_date":"18-20 September, 2017"},{"id":132266,"last_updated":"2019-09-25 11:49:40","id_people":387362,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"The DLDP Survey on Digital Use and Usability of EU Regional and Minority Languages","year":2018,"authors_people":"Claudia Soria, Valeria Quochi, Irene Russo","authors_cnr":["Soria, Claudia","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11893","17442"],"authors_cnr_institute":[""],"authors":["Soria, C.","Quochi, V.","Russo, I."],"abstract":"This paper reports about the design, the results and the key findings of a survey launched by the Digital Language Diversity Project about the digital use and usability of regional and minority languages. The aim of the survey - the first of this kind - was to investigate the real needs and expectations of European minority language speakers regarding digital opportunities. 
The focus on four languages (Basque, Breton, Karelian and Sardinian) at different stages of digital development offers a starting point to develop strategies for assessing digital vitality of these languages and overcoming specific difficulties.","keywords":["minority languages","digital survival","electronic communication"],"pages":"4155-4160","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2018\/pdf\/684.pdf","volume":"","doi":"","editors_people":"Nicoletta Calzolari (Conference chair), Khalid Choukri, Christopher Cieri, Thierry Declerck, Sara Goggi, Koiti Hasida, Hitoshi Isahara, Bente Maegaard, Joseph Mariani, H\u00e9l\u00e8ne Mazo, Asuncion Moreno, Jan Odijk, Stelios Piperidis, Takenobu Tokunaga","editors":["Calzolari, N.","Choukri, K.","Cieri, C.","Declerck, T.","Goggi, S.","Hasida, K.","Isahara, H.","Maegaard, B.","Mariani, J.","Mazo, H.","Moreno, A.","Odijk, J.","Piperidis, S.","Tokunaga, T."],"published":"Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018)","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"979-10-95546-00-9","conference_name":"Eleventh International Conference on Language Resources and Evaluation (LREC 2018)","conference_place":"Miyazaki, Japan","conference_date":"7-12\/05\/2018"},{"id":358734,"last_updated":"2023-07-06 11:41:14","id_people":483257,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Kit per la sopravvivenza digitale della lingua sarda-Le raccomandazioni del progetto DLDP per migliorare la vitalit\u00e0 digitale della lingua sarda","year":2018,"authors_people":"Baroni P., Quochi V., Russo I., Soria C., Ceberio Berger K., Gurrutxaga Hernaiz A., Hicks D., Kruse E., Salonen T., Sarhimaa A.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Baroni, P.","Quochi, V.","Russo, 
I.","Soria, C.","Ceberio, B. K.","Gurrutxaga, H. A.","Hicks, D.","Kruse, E.","Salonen, T.","Sarhimaa, A."],"abstract":"Le raccomandazioni del progetto DLDP per migliorare la vitalit\u00e0 digitale della lingua sarda (versione italiana)","keywords":["digital vitality","digital diversity","digital language survival","recommendations","Sardinian"],"pages":"12","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP_Digital-Language-Survival-Kit-for-Sardinian_IT.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358723,"last_updated":"2023-07-06 12:00:30","id_people":443050,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Euskarak Mundu Digitalean Bizirauteko Kita-DLDPren gomendioak, euskararen bizitasun digitala hobetu dadin","year":2018,"authors_people":"Ceberio Berger K., Gurrutxaga Hernaiz A., Baroni P., Hicks D.,Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Ceberio, B. K.","Gurrutxaga, H. 
A.","Baroni, P.","Hicks, D.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP per la sopravvivenza digitale della lingua basca (versione basca)","keywords":["digital vitality","digital diversity","digital language survival","recommendations","Basque"],"pages":"27","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP_Digital-Language-Survival-Kit-for-Basque_EU.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358724,"last_updated":"2023-07-06 11:48:32","id_people":443051,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Kit de Supervivencia Ling\u00fc\u00edstica Digital del Euskera-Recomendaciones del DLDP para mejorar la Vitalidad Digital del euskera","year":2018,"authors_people":"Ceberio Berger K., Gurrutxaga Hernaiz A., Baroni P., Hicks D.,Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Ceberio, B. K.","Gurrutxaga, H. 
A.","Baroni, P.","Hicks, D.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP per la sopravvivenza digitale del basco (versione spagnola)","keywords":["digital diversity","digital vitality","recommendations","Basque","digital survival"],"pages":"28","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP_Digital-Language-Survival-Kit-for-Basque_ES.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358728,"last_updated":"2023-07-05 11:09:45","id_people":443020,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"The DLDP Digital Language Survival Kit","year":2018,"authors_people":"Ceberio Berger K., Gurrutxaga Hernaiz A., Baroni P., Hicks D., Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Ceberio, B. K.","Gurrutxaga, H. 
A.","Baroni, P.","Hicks, D.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP per la sopravvivenza digitale delle lingue (versione inglese integrale)","keywords":["sopravvivenza digitale","lingue minoritarie","less-resourced languages"],"pages":"38","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP_Digital-Language-Survival-Kit.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358722,"last_updated":"2023-07-06 12:09:45","id_people":443047,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"The DLDP Roadmap","year":2018,"authors_people":"Hicks D., Baroni P., Ceberio Berger K., Gurrutxaga Hernaiz A., Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Hicks, D.","Baroni, P.","Ceberio, B. K.","Gurrutxaga, H. 
A.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione inglese integrale)","keywords":["digital vitality","digital diversity","recommendations"],"pages":"19","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP_Roadmap.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358729,"last_updated":"2023-07-05 11:03:24","id_people":483247,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"The DLDP Roadmap-Policy Recommendations & Timeline","year":2018,"authors_people":"Hicks D., Baroni P., Ceberio Berger K., Gurrutxaga Hernaiz A., Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Hicks, D.","Baroni, P.","Ceberio, B. K.","Gurrutxaga, H. 
A.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione inglese sintetica)","keywords":["digital vitality","digital diversity","recommendations"],"pages":"6","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP-Roadmap_Short-Version_EN.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358730,"last_updated":"2023-07-06 12:02:45","id_people":483251,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"DLDP etenemissuunnitelma-Toimenpidesuunnitelmat ja aikajana","year":2018,"authors_people":"Hicks D., Baroni P., Ceberio Berger K., Gurrutxaga Hernaiz A., Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Hicks, D.","Baroni, P.","Ceberio, B. K.","Gurrutxaga, H. 
A.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione finlandese sintetica)","keywords":["digital vitality","digital diversity","recommendations"],"pages":"6","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP-Roadmap_Short-Version_FI.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358731,"last_updated":"2023-07-06 11:37:13","id_people":483254,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"La DLDP Hoja de Ruta-Pol\u00edticas recomendadas & Cronograma","year":2018,"authors_people":"Hicks D., Baroni P., Ceberio Berger K., Gurrutxaga Hernaiz A., Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Hicks, D.","Baroni, P.","Ceberio, B. K.","Gurrutxaga, H. 
A.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione spagnola sintetica)","keywords":["digital vitality","digital diversity","recommendations"],"pages":"6","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP-Roadmap_Short-Version_ES.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358732,"last_updated":"2023-07-06 12:16:41","id_people":483255,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Diversit\u00e0 Linguistica Digitale: la Roadmap-Raccomandazioni strategiche & Sequenza","year":2018,"authors_people":"Hicks D., Baroni P., Ceberio Berger K., Gurrutxaga Hernaiz A., Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Hicks, D.","Baroni, P.","Ceberio, B. K.","Gurrutxaga, H. 
A.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione italiana sintetica)","keywords":["digital vitality","digital diversity","recommendations"],"pages":"6","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP-Roadmap_Short-Version_IT.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358733,"last_updated":"2023-07-06 12:15:30","id_people":483256,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"DLDP Bide Orria-Gomendatutako politikak & Kronograma","year":2018,"authors_people":"Hicks D., Baroni P., Ceberio Berger K., Gurrutxaga Hernaiz A., Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Hicks, D.","Baroni, P.","Ceberio, B. K.","Gurrutxaga, H. 
A.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione basca sintetica)","keywords":["digital vitality","digital diversity","recommendations"],"pages":"6","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP-Roadmap_Short-Version_EU.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358736,"last_updated":"2023-07-06 12:18:02","id_people":483262,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Die DLDP Roadmap-Strategieempfehlungen & Zeitplan","year":2018,"authors_people":"Hicks D., Baroni P., Ceberio Berger K., Gurrutxaga Hernaiz A., Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Hicks, D.","Baroni, P.","Ceberio, B. K.","Gurrutxaga, H. 
A.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione tedesca sintetica)","keywords":["digital vitality","digital diversity","recommendations"],"pages":"6","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP-Roadmap_Short-Version_DE.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358737,"last_updated":"2023-07-05 11:19:34","id_people":483263,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"La Roadmap DLDP-Recommandations de politique et calendrier","year":2018,"authors_people":"Hicks D., Baroni P., Ceberio Berger K., Gurrutxaga Hernaiz A., Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Hicks, D.","Baroni, P.","Ceberio, B. K.","Gurrutxaga, H. 
A.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione francese sintetica)","keywords":["digital vitality","digital diversity","recommendations"],"pages":"6","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP-Roadmap_Short-Version_FR.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132422,"last_updated":"2023-07-05 11:14:17","id_people":443354,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Pak treuzvevi\u00f1 ar Brezhoneg niverel-Erbedo\u00f9 an DLDP evit gwellaat buhezegezh niverel ar brezhoneg","year":2018,"authors_people":"Hicks D., Soria C., Baroni P., Ceberio Berger K., Gurrutxaga Hernaiz A., Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Hicks, D.","Soria, C.","Baroni, P.","Ceberio, B. K.","Gurrutxaga, H. 
A.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A."],"abstract":"Le raccomandazioni del progetto DLDP per la sopravvivenza digitale del bretone (versione bretone)","keywords":["digital vitality","digital diversity","recommendations"],"pages":"","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP_Digital-Language-Survival-Kit-for-Breton_BR.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358725,"last_updated":"2023-07-06 11:43:38","id_people":443359,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Kit de survie numerique pour la langue bretonne-Les recommandations du DLDP pour am\u00e9liorer la vitalit\u00e9 num\u00e9rique du Breton","year":2018,"authors_people":"Hicks D., Soria C., Baroni P., Ceberio Berger K., Gurrutxaga Hernaiz A., Kruse E., Quochi V., Russo I., Salonen T., Sarhimaa A.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Hicks, D.","Soria, C.","Baroni, P.","Ceberio, B. K.","Gurrutxaga, H. 
A.","Kruse, E.","Quochi, V.","Russo, I.","Salonen, T.","Sarhimaa, A."],"abstract":"Le raccomandazioni del progetto DLDP per la sopravvivenza digitale del bretone (versione francese)","keywords":["digital vitality","digital diversity","recommendations"],"pages":"","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP_Digital-Language-Survival-Kit-for-Breton_FR.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358726,"last_updated":"2023-07-06 11:57:28","id_people":443365,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Karjalan digitaalinen kielenselviytymispakkaus-DLDP-suositukset karjalan kielen digitaalisen elinvoimaisuuden parantamiseksi","year":2018,"authors_people":"Salonen T., Baroni P., Ceberio Berger K., Gurrutxaga Hernaiz A., Hicks D., Kruse E., Quochi V., Russo I., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Salonen, T.","Baroni, P.","Ceberio, B. K.","Gurrutxaga, H. 
A.","Hicks, D.","Kruse, E.","Quochi, V.","Russo, I.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP per la sopravvivenza digitale della lingua careliana (versione finlandese)","keywords":["digital vitality","digital diversity","digital language survival","recommendations","Karelian"],"pages":"","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP_Digital-Language-Survival-Kit-for-Karelian_FI.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":358735,"last_updated":"2023-07-06 11:50:55","id_people":483261,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Karjalan digitualine hengihji\u00e4mispakkavus-DLDP-rekomendatsiet karjalan kielen digitualizen elinvoimazuon kohendamizeh","year":2018,"authors_people":"Salonen T., Baroni P., Ceberio Berger K., Gurrutxaga Hernaiz A., Hicks D., Kruse E., Quochi V., Russo I., Sarhimaa A., Soria C.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11332","11893","17442"],"authors_cnr_institute":[""],"authors":["Salonen, T.","Baroni, P.","Ceberio, B. K.","Gurrutxaga, H. 
A.","Hicks, D.","Kruse, E.","Quochi, V.","Russo, I.","Sarhimaa, A.","Soria, C."],"abstract":"Le raccomandazioni del progetto DLDP per migliorare la vitalit\u00e0 digitale della lingua careliana (versione careliana)","keywords":["digital vitality","digital diversity","digital language survival","recommendations","Karelian"],"pages":"12","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP_Digital-Language-Survival-Kit-for-Karelian_KRL.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132408,"last_updated":"2021-01-26 12:01:49","id_people":440548,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"How to Use the Digital Language Vitality Scale","year":2018,"authors_people":"Klara Ceberio, Antton Gurrutxaga, Claudia Soria, Irene Russo, Valeria Quochi","authors_cnr":["Soria, Claudia","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11893","17442"],"authors_cnr_institute":[""],"authors":["Ceberio, K.","Gurrutxaga, A.","Soria, C.","Russo, I.","Quochi, V."],"abstract":"The Digital Language Vitality Scale is an instrument developed within the framework of the Digital Language Diversity Project (www.dldp.eu) for estimating the degree of digital vitality of any given language. It aims to be an instrument for self-assessment of the digital vitality of any language, although it is aimed in particular at identifying current gaps, needs and requirements regarding the extent to which a language community is active\/vital on digital media and devices so that adequate digital language planning can be done. 
This document instructs prospective adopters on how to best use it.","keywords":["Diversit\u00e0 Linguistica","BLARK","Sopravvivenza linguistica digitale"],"pages":"18","url":"http:\/\/www.dldp.eu\/sites\/default\/files\/documents\/DLDP_Digital-Language-Vitality-Scale.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132239,"last_updated":"2018-03-23 17:15:01","id_people":382301,"institutes":["ILC"],"type":"edited_volume","type_order":3,"type_people":"book","title":"Reports on Digital Language Diversity in Europe","year":2017,"authors_people":"Soria Claudia, Russo Irene, Quochi Valeria","authors_cnr":["Soria, Claudia","Quochi, Valeria","Russo, Irene"],"authors_cnr_id":["9887","11893","17442"],"authors_cnr_institute":[""],"authors":["Soria, C.","Russo, I.","Quochi, V."],"abstract":"In these reports we present the results of the first survey about the actual needs of European minority languages speakers in terms of digital opportunities","keywords":["regional languages","minority languages","digital vitality","digital use"],"pages":"","url":"http:\/\/www.dldp.eu\/content\/reports-digital-language-diversity-europe","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132196,"last_updated":"2018-05-18 14:01:13","id_people":375984,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"CLARIN-IT: State of Affairs, Challenges and Opportunities","year":2017,"authors_people":"Lionel Nicolas, Alexander Konig, Monica Monachini, Riccardo Del Gratta, Silvia Calamai, Andrea Abel, Alessandro Enea, Francesca Biliotti, Valeria Quochi","authors_cnr":["Enea, Alessandro","Monachini, Monica","Quochi, Valeria","Del Gratta, 
Riccardo"],"authors_cnr_id":["8533","8945","11893","11933"],"authors_cnr_institute":[""],"authors":["Nicolas, L.","Konig, A.","Monachini, M.","Del Gratta, R.","Calamai, S.","Abel, A.","Enea, A.","Biliotti, F.","Quochi, V."],"abstract":"This paper provides an overview on the Italian national CLARIN consortium and the status of CLARIN-IT in general. It thus discusses the current state of affairs of the consortium and provides information on the members, especially with regards to what they offer to CLARIN in terms of resources, services and expertise, and what CLARIN offers them to further their own research.","keywords":["Italian CLARIN consortium","CLARIN-IT"],"pages":"4","url":"https:\/\/www.clarin.eu\/event\/2017\/clarin-annual-conference-2017-budapest-hungary","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"CLARIN Annual Conference 2017","conference_place":"Budapest, Hungary","conference_date":"18-20 September, 2017"},{"id":132132,"last_updated":"2023-07-09 20:21:37","id_people":358123,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Development and representation of Italian light-fare constructions","year":2016,"authors_people":"Valeria Quochi","authors_cnr":["Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":[""],"authors":["Quochi, V."],"abstract":"The essay describes the study of the development and use of light fare 'do' constructions in Child-directed Speech and in Child Language with the twofold goal of showing that a Construction Grammar approach is viable, and of providing support to usage-based, functional predictions on language acquisition. 
The analysis of naturalistic data derived from the CHILDES database lead to two main findings: first, a representation of fare Light Verb Constructions as a family of constructions organized like a radial category is not only possible but more explicative, second, there exists a 'fare' pivot schema that children generalize at an early stage because it serves the purpose of naming new events, activities or situations.","keywords":["Corpus linguistics Language Acquisition Construction Grammar","phraseology"],"pages":"39-64","url":"https:\/\/benjamins.com\/#catalog\/books\/cal.19.03quo\/details","volume":"19","doi":"10.1075\/cal.19.03quo","editors_people":"Yoon, Jiyoung ; Th. Gries, Stefan","editors":["Yoon, J.","Th Gries, S."],"published":"Corpus-based Approaches to Construction Grammar","publisher":"John Benjamins Publishing Company (Amsterdam\/Philadelphia, USA)","issn":"","isbn":"9789027204417","conference_name":"","conference_place":"","conference_date":""},{"id":132120,"last_updated":"2016-09-07 10:05:16","id_people":355526,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Fostering digital representation of EU regional and minority languages: the Digital Language Diversity Project","year":2016,"authors_people":"Claudia Soria, Irene Russo, Valeria Quochi, Davyth Hicks, Antton Gurrutxaga, Anneli Sarhimaa, Matti Tuomisto","authors_cnr":["Russo, Irene","Soria, Claudia","Quochi, Valeria"],"authors_cnr_id":["9887","11893"],"authors_cnr_institute":["048","048","048"],"authors":["Soria, C.","Russo, I.","Quochi, V.","Hicks, D.","Gurrutxaga, A.","Sarhimaa, A.","Tuomisto, M."],"abstract":"Poor digital representation of minority languages further prevents their usability on digital media and devices. 
The Digital Language Diversity Project, a three-year project funded under the Erasmus+ programme, aims at addressing the problem of low digital representation of EU regional and minority languages by giving their speakers the intellectual and practical skills to create, share, and reuse online digital content. Availability of digital content and technical support to use it are essential prerequisites for the development of language-based digital applications, which in turn can boost digital usage of these languages. In this paper we introduce the project, its aims, objectives and current activities for sustaining digital usability of minority languages through adult education.","keywords":["Less-resourced languages","Language Technology","digital language vitality","digital language diversity"],"pages":"3256-3260","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2016\/index.html","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"978-2-9517408-9-1","conference_name":"Tenth International Conference on Language Resources and Evaluation (LREC 2016)","conference_place":"Portoroz, Slovenia","conference_date":"23-28 may"},{"id":132093,"last_updated":"2021-04-08 08:30:49","id_people":342213,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Visualising Italian Language Resources: a Snapshot","year":2015,"authors_people":"Riccardo Del Gratta, Francesca Frontini, Monica Monachini, Gabriella Pardelli, Irene Russo, Roberto Bartolini, Sara Goggi, Fahad Khan, Valeria Quochi, Claudia Soria, Nicoletta Calzolari","authors_cnr":["Del Gratta, Riccardo","Russo, Irene","Khan, Anas Fahad","Monachini, Monica","Soria, Claudia","Goggi, Sara","Bartolini, Roberto","Quochi, Valeria","Frontini, Francesca","Pardelli, Gabriella","Zamorani, 
Nicoletta"],"authors_cnr_id":["8945","9887","10172","10441","11893","15911","16333","26123"],"authors_cnr_institute":[""],"authors":["Del Gratta, R.","Frontini, F.","Monachini, M.","Pardelli, G.","Russo, I.","Bartolini, R.","Goggi, S.","Khan, F.","Quochi, V.","Soria, C.","Calzolari, N."],"abstract":"This paper aims to provide a first snapshot of Italian Language Resources (LRs) and their uses by the community, as documented by the papers presented at two different conferences, LREC2014 and CLiC-it 2014. The data of the former were drawn from the LOD version of the LRE Map, while those of the latter come from manually analyzing the proceedings. The results are presented in the form of visual graphs and confirm the initial hypothesis that Italian LRs require concrete actions to enhance their visibility.","keywords":["Italian Language Resources"],"pages":"100-104","url":"https:\/\/books.openedition.org\/aaccademia\/1277?lang=it","volume":"","doi":"","editors_people":"Cristina Bosco, Sara Tonelli, Fabio Massimo Zanzotto","editors":["Bosco, C.","Tonelli, S.","Zanzotto, F. 
M."],"published":"Proceedings of the Second Italian Conference on Computational Linguistics CLiC-it 2015","publisher":"","issn":"","isbn":"978-88-99200-62-6","conference_name":"Second Italian Conference on Computational Linguistics CLiC-it 2015","conference_place":"Trento","conference_date":"3-4 December 2015"},{"id":131997,"last_updated":"2021-04-08 08:39:25","id_people":304304,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Generative Lexicon and polysemy: inducing logical alternations","year":2015,"authors_people":"Francesca Frontini, Valeria Quochi, Monica Monachini","authors_cnr":["Quochi, Valeria","Frontini, Francesca","Monachini, Monica"],"authors_cnr_id":["8945"],"authors_cnr_institute":[""],"authors":["Frontini, F.","Quochi, V.","Monachini, M."],"abstract":"The current paper brings together the results of a series of experiments for inducing regular sense alternations, or regular\/ logical polysemy, from a computational lexicon based on the Generative Lexicon theory. 
The results are discussed in light of the potential benefits and uses of the amended algorithm.","keywords":["Polysemy","Generative Lexicon","Logical Alternations"],"pages":"7","url":"https:\/\/publications.cnr.it\/doc\/304304","volume":"","doi":"","editors_people":"Shu-Kai Hsieh and Kyoko Kanzaki (eds.)","editors":["Hsieh, S.","Kanzaki, K."],"published":"","publisher":"MAPLEX2015 Multiple Approaches to Lexicon Conference (Yamagata, JPN)","issn":"","isbn":"","conference_name":"MAPLEX2015 Multiple Approaches to Lexicon Conference","conference_place":"Yamagata, Japan","conference_date":"February 9-10, 2015"},{"id":131880,"last_updated":"2016-03-16 15:13:49","id_people":285553,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"The language resource Strategic Agenda: the FLaReNet synthesis of community recommendations","year":2014,"authors_people":"Claudia Soria, Nicoletta Calzolari, Monica Monachini, Valeria Quochi, Nuria Bel, Khalid Choukri, Joseph Mariani, Jan Odijk, Stelios Piperidis","authors_cnr":["Monachini, Monica","Soria, Claudia","Quochi, Valeria","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","11893","26123"],"authors_cnr_institute":["048","048","048","048"],"authors":["Soria, C.","Calzolari, N.","Monachini, M.","Quochi, V.","Bel, N.","Choukri, K.","Mariani, J.","Odijk, J.","Piperidis, S."],"abstract":"The main purpose of this paper is to serve as a landmark for future research and in particular for future strategic, infrastructural and coordination initiatives. It presents a preliminary plan for actions and infrastructures that could become the basis for future initiatives in the sector of Language Resources and Technologies (LRTs). The FLaReNet Language Resource Strategic Agenda presents a set of recommendations for the development and progress of LRT in Europe, as issued from a three-year consultation of the FLaReNet European project. 
Recommendations cover a broad range of topics and activities, spanning over production and use of language resources, licensing, maintenance and preservation issues, infrastructures for language resources, resource identification and sharing, evaluation and validation, interoperability and policy issues. The intended recipients belong to a large set of players and stakeholders in LRT, ranging from individuals to research and education institutions, to policy-makers, funding agencies, SMEs and large companies, service and media providers","keywords":["Strategic agenda","Language resources planning","Recommended priority actions"],"pages":"753-775","url":"https:\/\/publications.cnr.it\/doc\/285553","volume":"48","doi":"10.1007\/s10579-014-9279-y","editors_people":"","editors":[""],"published":"Language resources and evaluation (Print)","publisher":"Springer (Dordrecht, Paesi Bassi)","issn":"1574-020X","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131892,"last_updated":"2018-01-30 12:46:58","id_people":286868,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Lexicons, Terminologies, Ontologies: Reflections from Experiences in Resource Construction","year":2014,"authors_people":"Calzolari Nicoletta, Monachini Monica, Quochi Valeria, Soria Claudia, Toral Antonio","authors_cnr":["Monachini, Monica","Soria, Claudia","Quochi, Valeria","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","11893","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Monachini, M.","Quochi, V.","Soria, C.","Toral, A."],"abstract":"This contribution aims at highlighting the strong interconnection between lexicons, terminologies and ontologies and especially the fundamental role that ontologies and lexica mutually play. Our view is that lexical resources are evolving in nature, from ontologically based lexicons we are going towards lexically based ontologies. 
We explore different instantiations of the current trend of using formal ontologies as a core module of computational lexicons, presenting the advantages especially in multilingual and terminological contexts. We present work showing that the lexical knowledge already present in non formal computational lexicons can be exploited to derive or enrich a formal ontology without much manual effort. In the terminology domain, we describe the construction of a resource for biology, directly linked to a parallel domain-ontology, that combines characteristics of both lexicons and terminologies, so that it can allow for intelligent access to content. Finally, we describe our experience in two projects in which formal ontologies play a central role in the context of multilingual computational lexicons, where the ontology is what acts as the glue among the different monolingual lexicons and what provides cross-lingual reasoning capabilities.","keywords":["Computational Lexicons","Ontology","Terminology","Interoperability","Standards"],"pages":"103-121","url":"http:\/\/www.springer.com\/computer\/ai\/book\/978-3-642-45326-7","volume":"8003","doi":"10.1007\/978-3-642-45327-4_7","editors_people":"Nachum Dershowitz and Ephraim Nissan","editors":["Dershowitz, N.","Nissan, E."],"published":"Language, Culture, Computation. Computational Linguistics and Linguistics. 
Essays Dedicated to Yaacov Choueka on the Occasion of His 75th Birthday, Part III","publisher":"Springer (Berlin Heidelberg, DEU)","issn":"","isbn":"978-3-642-45326-7","conference_name":"","conference_place":"","conference_date":""},{"id":128886,"last_updated":"2016-01-13 15:30:58","id_people":286882,"institutes":["IIT","ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Marrying Technical Writing with LRT","year":2014,"authors_people":"Antico Giovanni, Valeria Quochi, Monica Monachini, Maurizio Martinelli","authors_cnr":["Quochi, Valeria","Martinelli, Maurizio","Monachini, Monica"],"authors_cnr_id":["5126","8945"],"authors_cnr_institute":["048","044","048"],"authors":["Antico, G.","Quochi, V.","Monachini, M.","Martinelli, M."],"abstract":"In the last years the Technical Writer operational scenarios and the workflow sensibly changed; specifically,\"free style\" writing - or manual writing - has become outdated and technical writing is now much more concerned with structured management of content than in the past. Technical writing has become more demanding due to a number of factors among which the rise and spread of mobile devices usage. This paper discusses the new needs of technical writing and content management business and how LRT can help it improve quality and productivity.","keywords":["controlled language","technical writing","content management systems"],"pages":"19-25","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2014\/index.html","volume":"","doi":"","editors_people":"Hitoshi Isahara, Key-Sun Choi. Shinhoi Lee, Sejin Nam","editors":["Isahara, H.","Lee, K. C. 
S.","Nam, S."],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"978-2-9517408-8-4","conference_name":"9th International Conference on Language Resources and Evaluation (LREC)","conference_place":"Reykjavik, Iceland","conference_date":"26-31 may 2014"},{"id":131894,"last_updated":"2016-03-29 15:25:08","id_people":286944,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"From Synsets to Videos: Enriching ItalWordNet Multimodally","year":2014,"authors_people":"Bartolini R., Quochi V., De Felice, I., Russo I., Monachini M.","authors_cnr":["Quochi, Valeria","Russo, Irene","De Felice, Irene","Monachini, Monica","Bartolini, Roberto"],"authors_cnr_id":["8945","10441"],"authors_cnr_institute":["048","048","048","048","048"],"authors":["Bartolini, R.","Quochi, V.","De Felice, I.","Russo, I.","Monachini, M."],"abstract":"The paper describes the multimodal enrichment of ItalWordNet action verbs' entries by means of an automatic mapping with a conceptual ontology of action types instantiated by video scenes (ImagAct). The two resources present significative differences as well as interesting complementary features, such that a mapping of these two resources can lead to an enrichment of IWN, through the connection between synsets and videos apt to illustrate the meaning described by glosses. Here, we describe an approach inspired by ontology matching methods for the automatic mapping of ImagAct video scenes onto ItalWordNet. The experiments described in the paper are conducted on Italian, but the same methodology can be extended to other languages for which WordNets have been created, since ImagAct is available also for English, Chinese and Spanish. 
This source of multimodal information can be exploited to design second language learning tools, as well as for language grounding in action recognition in video sources and potentially for robotics.","keywords":["Action ontology","Multimodality","WordNet"],"pages":"3110-3117","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2014\/index.html","volume":"","doi":"","editors_people":"N. Calzolari, K. Choukri, T. Declerck, H. Loftsson, B. Maegaard, J. Mariani, A. Moreno, J. Odijk, S. Piperidis","editors":["Calzolari, N.","Choukri, K.","Declerck, T.","Loftsson, H.","Maegaard, B.","Mariani, J.","Moreno, A.","Odijk, J.","Piperidis, S."],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"978-2-9517408-8-4","conference_name":"LREC 2014. European Language Resources Association ELRA: Paris (Francia)","conference_place":"Reykjavik, Iceland","conference_date":"26-31 may"},{"id":131983,"last_updated":"2016-03-29 15:24:09","id_people":291282,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Evaluating ImagAct-WordNet mapping for English and Italian through videos","year":2014,"authors_people":"De Felice I., Bartolini R., Russo I., Quochi V., Monachini M.","authors_cnr":["Quochi, Valeria","Russo, Irene","De Felice, Irene","Monachini, Monica","Bartolini, Roberto"],"authors_cnr_id":["8945","10441"],"authors_cnr_institute":["048","048","","048","048"],"authors":["De Felice, I.","Bartolini, R.","Russo, I.","Quochi, V.","Monachini, M."],"abstract":"In this paper we present the results of the evaluation of an automatic mapping between two lexical resources, WordNet\/ItalWordNet and ImagAct, a conceptual ontology of action types instantiated by video scenes. Results are compared with those obtained from a previous experiment performed only on Italian data. 
Differences between the two evaluation strategies, as well as between the quality of the mappings for the two languages considered in this paper, are discussed.","keywords":["Language Resources (LRs)"],"pages":"128-131","url":"http:\/\/clic.humnet.unipi.it\/proceedings\/Proceedings-CLICit-2014.pdf","volume":"","doi":"10.12871\/CLICIT2014126","editors_people":"Roberto Basili, Alessandro Lenci, Bernardo Magnini","editors":["Basili, R.","Lenci, A.","Magnini, B."],"published":"","publisher":"Pisa University Press srl (Pisa, ITA)","issn":"","isbn":"978-88-67-41472-7","conference_name":"Proceedings of the First Italian Conference on Computational Linguistics CLiC-it 2014 & the Fourth International Workshop EVALITA 2014. Pisa University Press srl: Pisa (Italia)","conference_place":"Pisa","conference_date":"9-11 December 2014, Pisa"},{"id":131985,"last_updated":"2014-12-15 17:12:36","id_people":291452,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Polysemy alternations extraction using the PAROLE SIMPLE CLIPS Italian lexicon","year":2014,"authors_people":"Frontini F., Quochi V., Monachini M.","authors_cnr":["Frontini, Francesca","Monachini, Monica","Quochi, Valeria"],"authors_cnr_id":["8945","11893"],"authors_cnr_institute":["048","048","048"],"authors":["Frontini, F.","Quochi, V.","Monachini, M."],"abstract":"This paper presents the results of an experiment of polysemy alternations induction from a lexicon (Utt and Pad\u00f3, 2011; Frontini et al., 2014), discussing the results and proposing an amendment in the original algorithm.","keywords":["Language Resources and Technologies"],"pages":"175-179","url":"http:\/\/clic.humnet.unipi.it\/proceedings\/Proceedings-CLICit-2014.pdf","volume":"","doi":"10.12871\/CLICIT2014134","editors_people":"Roberto Basili, Alessandro Lenci, Bernardo Magnini","editors":["Basili, R.","Lenci, A.","Magnini, B."],"published":"","publisher":"Pisa University Press srl (Pisa, 
ITA)","issn":"","isbn":"978-88-67-41472-7","conference_name":"Proceedings of the First Italian Conference on Computational Linguistics CLiC-it 2014 & the Fourth International Workshop EVALITA 2014","conference_place":"Pisa","conference_date":"9-11 December 2014, Pisa"},{"id":131896,"last_updated":"2016-03-29 10:00:21","id_people":286984,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Polysemy Index for Nouns: an Experiment on Italian using the PAROLE SIMPLE CLIPS Lexical Database","year":2014,"authors_people":"Frontini Francesca, Valeria Quochi, Sebastian Pad\u00f3, Jason Utt, Monica Monachini","authors_cnr":["Quochi, Valeria","Frontini, Francesca","Monachini, Monica"],"authors_cnr_id":["8945"],"authors_cnr_institute":["048","048","048"],"authors":["Frontini, F.","Quochi, V.","Pad\u00f3, S.","Utt, J.","Monachini, M."],"abstract":"An experiment is presented to induce a set of polysemous basic type alternations (such as ANIMAL-FOOD, or BUILDING-INSTITUTION) by deriving them from the sense alternations found in an existing lexical resource. The paper builds on previous work and applies those results to the Italian lexicon PAROLE SIMPLE CLIPS. The new results show how the set of frequent type alternations that can be induced from the lexicon is partly different from the set of polysemy relations selected and explicitly applied by lexicographers when building it. The analysis of mismatches shows that frequent type alternations do not always correspond to prototypical polysemy relations, nevertheless the proposed methodology represents a useful tool offered to lexicographers to systematically check for possible gaps in their resource.","keywords":["Polysemy","lexical resources","semantics"],"pages":"2955-2963","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2014\/index.html","volume":"","doi":"","editors_people":"N. Calzolari, K. Choukri, T. Declerck, H. Loftsson, B. Maegaard, J. Mariani, A. Moreno, J. 
Odijk, S. Piperidis","editors":["Calzolari, N.","Choukri, K.","Declerck, T.","Loftsson, H.","Maegaard, B.","Mariani, J.","Moreno, A.","Odijk, J.","Piperidis, S."],"published":"LREC 2014 Ninth International Conference on Language Resources and Evaluation Proceedings","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"978-2-9517408-8-4","conference_name":"9th International Conference on Language Resources and Evaluation, LREC 2014","conference_place":"Reykjavik, Iceland","conference_date":"26-31 may"},{"id":131863,"last_updated":"2014-12-17 14:57:40","id_people":285381,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Translating action verbs using a dictionary of images: the IMAGACT ontology","year":2014,"authors_people":"Alessandro Panunzi, Irene De Felice, Lorenzo Gregori, Stefano Jacoviello, Monica Monachini, Massimo Moneglia, Valeria Quochi, Irene Russo","authors_cnr":["Russo, Irene","De Felice, Irene","Monachini, Monica","Quochi, Valeria"],"authors_cnr_id":["8945","11893"],"authors_cnr_institute":[""],"authors":["Panunzi, A.","De Felice, I.","Gregori, L.","Jacoviello, S.","Monachini, M.","Moneglia, M.","Quochi, V.","Russo, I."],"abstract":"Action verbs have many meanings, covering actions in different ontological types. Moreover, each language categorizes action in its own way. One verb can refer to many different actions and one action can be identified by more than one verb. The range of variations within and across languages is largely unknown, causing trouble in all translation tasks. IMAGACT is a corpus-based ontology of action concepts, derived from English and Italian spontaneous speech corpora, which makes use of the universal language of images to identify the different action types extended by verbs referring to action in English, Italian, Chinese and Spanish. 
This paper presents the IMAGACT search interface and the various kinds of linguistic information the user can derive from it. IMAGACT makes explicit the variation of meaning of action verbs within one language and allows comparisons of verb variations within and across languages. Because the action concepts are represented with videos, extension into new languages beyond those presently implemented in IMAGACT is done using competence-based judgments by mother-tongue informants, without intense lexicographic work involving underdetermined semantic descriptions.","keywords":["Action verbs","Image ontology","Multilingual dictionary","Computer-aided translation"],"pages":"1163-1170","url":"http:\/\/euralex2014.eurac.edu\/en\/callforpapers\/Documents\/EURALEX%202014_gesamt.pdf","volume":"","doi":"10.13140\/2.1.3719.2320","editors_people":"Abel Andrea, Vettori Chiara, Ralli Natascia","editors":["Abel, A.","Vettori, C.","Ralli, N."],"published":"Proceedings of the XVI EURALEX International Congress: The User in Focus","publisher":"EURAC (Bolzano, ITA)","issn":"","isbn":"978-88-88906-97-3","conference_name":"XVI EURALEX International Congress: The User in Focus","conference_place":"Bolzano","conference_date":"15-19\/07\/2014"},{"id":132018,"last_updated":"2015-02-20 17:23:21","id_people":287038,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Flexible Acquisition of Subcategorization Frames in Italian","year":2012,"authors_people":"Caselli, Tommaso; Frontini, Francesca; Quochi, Valeria; Rubino, Francesco and Russo, Irene","authors_cnr":["Caselli, Tommaso","Russo, Irene","Frontini, Francesca","Rubino, Francesco","Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":["048","048","048","048","048"],"authors":["Caselli, T.","Frontini, F.","Quochi, V.","Rubino, F.","Russo, I."],"abstract":"Lexica of predicate-argument structures constitute a useful tool for several tasks in NLP. 
This paper describes a web-service system for automatic acquisition of verb subcategorization frames (SCFs) from parsed data in Italian. The system acquires SCFs in an unsupervised manner. We created two gold standards for the evaluation of the system, the first by mixing together information from two lexica (one manually created and the second automatically acquired) and manual exploration of corpus data and the other annotating data extracted from a specialized corpus (environmental domain). Data filtering is accomplished by means of the maximum likelihood estimate (MLE). The evaluation phase has allowed us to identify the best empirical MLE threshold for the creation of a lexicon (P=0.653, R=0.557, F1=0.601). In addition to this, we assigned to the extracted entries of the lexicon a confidence score based on the relative frequency and evaluated the extractor on domain specific data. The confidence score will allow the final user to easily select the entries of the lexicon in terms of their reliability: one of the most interesting features of this work is the possibility the final users have to customize the results of the SCF extractor, obtaining different SCF lexica in terms of size and accuracy.","keywords":["lexicon","automatic acquisition","subcategorisation frames"],"pages":"2842-2848","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2012\/summaries\/390.html","volume":"","doi":"","editors_people":"Nicoletta Calzolari, Khalid Choukri, Thierry Declerck, Mehmet U\u011fur Do\u011fan, Bente Maegaard, Joseph Mariani, Jan Odijk, Stelios Piperidis","editors":["Calzolari, N.","Choukri, K.","Declerck, T.","Do\u011fan, M. 
U.","Maegaard, B.","Mariani, J.","Odijk, J.","Piperidis, S."],"published":"Proceedings of the Eight International Conference on Language Resources and Evaluation (LREC'12)","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"9782951740877","conference_name":"Eight International Conference on Language Resources and Evaluation (LREC'12)","conference_place":"Istanbul, Turkey","conference_date":"23-25 Maggio 2012"},{"id":128425,"last_updated":"2022-08-24 00:43:28","id_people":223098,"institutes":["IIT","ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"L-LEME: an Automatic Lexical Merger based on the LMF Standard","year":2012,"authors_people":"Riccardo Del Gratta, Francesca Frontini, Monica Monachini, Valeria Quochi, Francesco Rubino, Matteo Abrate, Angelica Lo Duca","authors_cnr":["Abrate, Matteo","Frontini, Francesca","Rubino, Francesco","Lo Duca, Angelica","Monachini, Monica","Quochi, Valeria","Del Gratta, Riccardo"],"authors_cnr_id":["8945","11893","11933"],"authors_cnr_institute":["044","048","048","044","048","048","048"],"authors":["Del Gratta, R.","Frontini, F.","Monachini, M.","Quochi, V.","Rubino, F.","Abrate, M.","Lo Duca, A."],"abstract":"The present paper describes LMF LExical MErger (L-LEME), an architecture to combine two lexicons in order to obtain new resource(s). L-LEME relies on standards, thus exploiting the benefits of the ISO Lexical Markup Framework (LMF) to ensure interoperability. L-LEME is meant to be dynamic and heavily adaptable: it allows the users to configure it to meet their specific needs. The L-LEME architecture is composed of two main modules: the Mapper, which takes in input two lexicons A and B and a set of user-defined rules and instructions to guide the mapping process (Directives D) and gives in output all matching entries. The algorithm also calculates a cosine similarity score. 
The Builder takes in input the previous results, a set of Directives D1 and produces a new LMF lexicon C. The Directives allow the user to define its own building rules and different merging scenarios. L-LEME is applied to a specific concrete task within the PANACEA project, namely the merging of two Italian SubCategorization Frame (SCF) lexicons. The experiment is interesting in that A and B have different philosophies behind, being A built by human introspection and B automatically extracted. Ultimately, L-LEME has interesting repercussions in many language technology applications","keywords":["LMF","Lexicon mapping","similarity score"],"pages":"31-40","url":"https:\/\/publications.cnr.it\/doc\/223098","volume":"","doi":"","editors_people":"Bel N. , Gavrilidou M. , Monachini M., Quochi V., Rimell L.","editors":["Bel, N.","Gavrilidou, M.","Monachini, M.","Quochi, V.","Rimell, L."],"published":"Proceedings of the LREC 2012 Workshop on Language Resource Merging","publisher":"","issn":"","isbn":"978-2-9517408-7-7","conference_name":"The Eight International Conference on Language Resources and Evaluation (LREC) 2012","conference_place":"Istanbul, Turkey","conference_date":"2012"},{"id":131773,"last_updated":"2014-10-23 10:53:31","id_people":220785,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Automatic Creation of Quality Multi-Word Lexica from Noisy Text Data","year":2012,"authors_people":"Francesca Frontini, Valeria Quochi, Francesco Rubino","authors_cnr":["Frontini, Francesca","Rubino, Francesco","Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":["048","048","048"],"authors":["Frontini, F.","Quochi, V.","Rubino, F."],"abstract":"This paper describes the design of a tool for the automatic creation of multi-word lexica that is deployed as a web service and runs on automatically web-crawled data within the framework of the PANACEA platform. 
The main purpose of our task is to provide a (computationally \"light\") tool that creates a full high quality lexical resource of multi-word items. Within the platform, this tool is typically inserted in a work flow whose first step is automatic web-crawling. Therefore, the input data of our lexical extractor is intrinsically noisy. The paper evaluates the capacity of the tool to deal with noisy data, and in particular with texts containing a significant amount of duplicated paragraphs. The accuracy of the extraction of multi-word expressions from the original crawled corpus is compared to the accuracy of the extraction from a later \"de-duplicated\" version of the corpus. The paper shows how our method can extract with sufficiently good precision also from the original, noisy crawled data. The output of our tool is a multi-word lexicon formatted and encoded in XML according to the Lexical Mark-up Framework.","keywords":["Lexical induction","multi-word extraction","web-based distributed platform","noisy data"],"pages":"","url":"http:\/\/www.kde.cs.tut.ac.jp\/~aono\/pdf\/COLING2012\/AND\/pdf\/AND04.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of the Sixth Workshop on Analytics for Noisy Unstructured Text Data","publisher":"ACM, Association for computing machinery (New York, USA)","issn":"","isbn":"978-1-4503-1919-5","conference_name":"AND 2012","conference_place":"Mumbai, India","conference_date":"December 9, 2012"},{"id":131893,"last_updated":"2014-11-11 15:43:07","id_people":286877,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Towards a User-Friendly Platform for Building Language Resources based on Web Services","year":2012,"authors_people":"Poch, Marc; Toral, Antonio; Hamon, Olivier; Quochi, Valeria; Bel, Nuria","authors_cnr":["Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":["048"],"authors":["Poch, M.","Toral, A.","Hamon, O.","Quochi, 
V.","Bel, N."],"abstract":"This paper presents the platform developed in the PANACEA project, a distributed factory that automates the stages involved in the acquisition, production, updating and maintenance of Language Resources required by Machine Translation and other Language Technologies. We adopt a set of tools that have been successfully used in the Bioinformatics field, they are adapted to the needs of our field and used to deploy web services, which can be combined to build more complex processing chains (workflows). This paper describes the platform and its different components (web services, registry, workflows, social network and interoperability). We demonstrate the scalability of the platform by carrying out a set of massive data experiments. Finally, a validation of the platform across a set of required criteria proves its usability for different types of users (non-technical users and providers).","keywords":["service platform","workflow","interoperability"],"pages":"1156-1163","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2012\/pdf\/543_Paper.pdf","volume":"","doi":"","editors_people":"Nicoletta Calzolari, Khalid Choukri, Thierry Declerck, Mehmet U\u011fur Do\u011fan, Bente Maegaard, Joseph Mariani, Asuncion Moreno, Jan Odijk, Stelios Piperidis","editors":["Calzolari, N.","Choukri, K.","Declerck, T.","Do\u011fan, M. 
U.","Maegaard, B.","Mariani, J.","Moreno, A.","Odijk, J.","Piperidis, S."],"published":"Proceedings of the Eighth International Conference on Language Resources and Evaluation, LREC 2012","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"978-2-9517408-7-7","conference_name":"Eighth International Conference on Language Resources and Evaluation","conference_place":"Istanbul, Turchia","conference_date":"23-25\/05\/2012"},{"id":131772,"last_updated":"2023-08-21 19:57:38","id_people":220778,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"A MWE Acquisition and Lexicon Builder Web Service","year":2012,"authors_people":"Quochi, Valeria; Frontini, Francesca; Rubino, Francesco","authors_cnr":["Frontini, Francesca","Rubino, Francesco","Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":["048","048","048"],"authors":["Quochi, V.","Frontini, F.","Rubino, F."],"abstract":"This paper describes the development of a web-service tool for the automatic extraction of Multi-word expressions lexicons, which has been integrated in a distributed platform for the automatic creation of linguistic resources. The main purpose of the work described is thus to provide a (computationally \"light\") tool that produces a full lexical resource: multi-word terms\/items with relevant and useful attached information that can be used for more complex processing tasks and applications (e.g. parsing, MT, IE, query expansion, etc.). The output of our tool is a MW lexicon formatted and encoded in XML according to the Lexical Mark-up Framework. The tool is already functional and available as a service. 
Evaluation experiments show that the tool precision is of about 80%.","keywords":["Multiword extraction","lexical resources","LMF","web services"],"pages":"2291-2306","url":"http:\/\/aclweb.org\/anthology\/C\/C12\/C12-1140.pdf","volume":"","doi":"","editors_people":"Martin Kay and Christian Boitet","editors":["Kay, M.","Boitet, C."],"published":"Proceedings of COLING 2012: Technical Papers","publisher":"Curran Associates (Red Hook, NY 12571, USA)","issn":"","isbn":"9781627483896","conference_name":"International Conference on Computational Linguistics (COLING)","conference_place":"Mumbai, India","conference_date":"December 2012"},{"id":131771,"last_updated":"2016-03-15 15:50:21","id_people":220773,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Integrating NLP Tools in a Distributed Environment: A Case Study Chaining a Tagger with a Dependency Parser","year":2012,"authors_people":"Rubino, Francesco; Frontini, Francesca; Quochi, Valeria","authors_cnr":["Frontini, Francesca","Rubino, Francesco","Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":["048","048","048"],"authors":["Rubino, F.","Frontini, F.","Quochi, V."],"abstract":"The present paper tackles the issue of PoS tag conversion within the framework of a distributed web service platform for the automatic creation of language resources. PoS tagging is now considered a \"solved problem\"; yet, because of the differences in the tagsets, interchange of the various PoS taggers available is still hampered. In this paper we describe the implementation of a PoS-tagged-corpus converter, which is needed for chaining together in a workflow the FreeLing PoS tagger for Italian and the DESR dependency parser, given that these two tools have been developed independently. 
The conversion problems experienced during the implementation, related to the properties of the different tagsets and of tagset conversion in general, are discussed together with the solutions adopted. Finally, the converter is evaluated by assessing the impact of conversion on the performance of the dependency parser by comparing with the outcome of the native pipeline. From this we learn that in most cases parsing errors are due to actual tagging errors, and not to conversion itself. Besides, information on accuracy loss is an important feature in a distributed environment of (NLP) services, where users need to decide which services best suit their needs","keywords":["PoS tag conversion","interoperability","NLP pipelines"],"pages":"2125-2131","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2012\/summaries\/726.html","volume":"","doi":"","editors_people":"Nicoletta Calzolari, Khalid Choukri, Thierry Declerck, Mehmet U\u011fur Do\u011fan, Bente Maegaard, Joseph Mariani, Jan Odijk, Stelios Piperidis","editors":["Calzolari, N.","Choukri, K.","Declerck, T.","Do\u011fan, M. 
U.","Maegaard, B.","Mariani, J.","Odijk, J.","Piperidis, S."],"published":"Proceedings of the Eight International Conference on Language Resources and Evaluation (LREC'12)","publisher":"European language resources association (ELRA) (Paris, FRA)","issn":"","isbn":"9782951740877","conference_name":"Language Resources and Evaluation Conference 2012","conference_place":"Istanbul, Turchia","conference_date":"23-25 Maggio 2012"},{"id":131752,"last_updated":"2015-02-26 14:38:14","id_people":219679,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"The FLaReNet Strategic Language Resource Agenda","year":2012,"authors_people":"Soria, Claudia [1]; Bel, N\u00faria [2]; Choukri, Khalid [3]; Mariani, Joseph [4]; Monachini, Monica [1]; Odijk, Jan [5]; Piperidis, Stelios [6]; Quochi, Valeria [1]; Calzolari, Nicoletta [1]","authors_cnr":["Monachini, Monica","Soria, Claudia","Quochi, Valeria","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","11893","26123"],"authors_cnr_institute":["048","048","048","048"],"authors":["Soria, C.","Bel, N.","Choukri, K.","Mariani, J.","Monachini, M.","Odijk, J.","Piperidis, S.","Quochi, V.","Calzolari, N."],"abstract":"The FLaReNet Strategic Agenda highlights the most pressing needs for the sector of Language Resources and Technologies and presents a set of recommendations for its development and progress in Europe, as issued from a three-year consultation of the FLaReNet European project. The FLaReNet recommendations are organised around nine dimensions: a) documentation b) interoperability c) availability, sharing and distribution d) coverage, quality and adequacy e) sustainability f) recognition g) development h) infrastructure and i) international cooperation. 
As such, they cover a broad range of topics and activities, spanning over production and use of language resources, licensing, maintenance and preservation issues, infrastructures for language resources, resource identification and sharing, evaluation and validation, interoperability and policy issues. The intended recipients belong to a large set of players and stakeholders in Language Resources and Technology, ranging from individuals to research and education institutions, to policy-makers, funding agencies, SMEs and large companies, service and media providers. The main goal of these recommendations is to serve as an instrument to support stakeholders in planning for and addressing the urgencies of the Language Resources and Technologies of the future.","keywords":["strategic agenda","language resources planning","recommended priority actions"],"pages":"1379-1386","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2012\/index.html","volume":"","doi":"","editors_people":"N. Calzolari, K. Choukri, T. Declerck, M. Ugur Dogan, B. Maegaard, J. Mariani, J. Odijk, S. Piperidis","editors":["Calzolari, N.","Choukri, K.","Declerck, T.","Dogan, M. U.","Maegaard, B.","Mariani, J.","Odijk, J.","Piperidis, S."],"published":"Proceedings of the 8th international conference on Language Resources and Evaluation (LREC2012)","publisher":"","issn":"","isbn":"978-2-9517408-7-7","conference_name":"The Eight International Conference on Language Resources and Evaluation (LREC'12)","conference_place":"Istanbul, Turkey","conference_date":"23-25 may 2012"},{"id":131776,"last_updated":"2015-02-25 17:57:07","id_people":220828,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"How predictive are grammatical constructions in Italian? 
The case of the caused-motion construction","year":2012,"authors_people":"Quochi, Valeria","authors_cnr":["Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":["048"],"authors":["Quochi, V."],"abstract":"Differently from English, Italian has a rich morphological system and a relative free word-order. For these reasons, the suitability of a \"full-scope\" constructional approach to Italian is not given. Although Goldberg's (1995, 2006) version of Construction grammar language is constructions all the way down (or up), one could still argue that in Italian, i.e. a language rich in morphology, abstract, grammatical constructions do not play a role, thus weakening the constructionist view. One of the strong points in favour of Goldberg's approach is that argument structure constructions in English have been found to be highly predictive of sentence meaning (Goldberg et al. 2005), which provides a motivation for their early acquisition by children. Many of such studies and evidences are still missing for Italian. This contribution will therefore attempt to start filling this gap by testing the predictive power of the Italian Caused Motion Construction. Data is taken from the CHILDES database (MacWhinney 2000) and annotated according to constructional properties and verb meaning. The annotation is then used to calculate the Cue and Category Validity (Murphy 2002) of both the Construction and the main verbs, which measures their predictive power (i.e. respectively their reliability and availability) in relation to the overall sentence meaning. 
Results show that the Italian Caused Motion Construction is not only more reliable than verbs as a predictor of overall sentence meaning, but it is also more available.","keywords":["Construction Grammar Psicolinguistica Linguistica del corpus"],"pages":"265-265","url":"http:\/\/www.sle2012.eu\/downloads\/Book_abstracts_SLE2012_23aug_final.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"45th Annual Meeting of the Societas Linguistica Europaea (SLE2012)","conference_place":"Stoccolma, Svezia","conference_date":"29\/8-1\/9 2012"},{"id":131785,"last_updated":"2014-12-09 15:55:06","id_people":221573,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"D3. 4 Third version (v4) of the integrated platform and documentation","year":2012,"authors_people":"Poch, Marc; Hamon, Olivier; Quochi, Valeria; Del Gratta, Riccardo; Toral, Antonio; Thurmair, Gregor; Prokopidis, Prokopis; Bel, Nuria","authors_cnr":["Quochi, Valeria","Del Gratta, Riccardo"],"authors_cnr_id":["11893","11933"],"authors_cnr_institute":["048","048"],"authors":["Poch, M.","Hamon, O.","Quochi, V.","Del Gratta, R.","Toral, A.","Thurmair, G.","Prokopidis, P.","Bel, N."],"abstract":"The deliverable describes the third and final version of the PANACEA platform.","keywords":["infrastrutture Trattamento del linguaggio naturale"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/221573","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131787,"last_updated":"2020-09-12 01:47:14","id_people":221616,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"D7. 4 Third evaluation report. 
Evaluation of PANACEA v3 and produced resources","year":2012,"authors_people":"Quochi, Valeria; Frontini, Francesca; Bartolini, Roberto; Hamon, Olivier; Poch Riera, Marc; Padro, Muntsa; Bel, Nuria; Thurmair, Gregor; Toral, Antonio; Kamran, Amir","authors_cnr":["Frontini, Francesca","Bartolini, Roberto","Quochi, Valeria"],"authors_cnr_id":["10441","11893"],"authors_cnr_institute":[""],"authors":["Quochi, V.","Frontini, F.","Bartolini, R.","Hamon, O.","Poch Riera, M.","Padro, M.","Bel, N.","Thurmair, G.","Toral, A.","Kamran, A."],"abstract":"D7.4 reports on the evaluation of the different components integrated in the PANACEA third cycle of development as well as the final validation of the platform itself. All validation and evaluation experiments follow the evaluation criteria already described in D7.1. The main goal of WP7 tasks was to test the (technical) functionalities and capabilities of the middleware that allows the integration of the various resource-creation components into an interoperable distributed environment (WP3) and to evaluate the quality of the components developed in WP5 and WP6. The content of this deliverable is thus complementary to D8.2 and D8.3 that tackle advantages and usability in industrial scenarios. It has to be noted that the PANACEA third cycle of development addressed many components that are still under research. The main goal for this evaluation cycle thus is to assess the methods experimented with and their potentials for becoming actual production tools to be exploited outside research labs. For most of the technologies, an attempt was made to re-interpret standard evaluation measures, usually in terms of accuracy, precision and recall, as measures related to a reduction of costs (time and human resources) in the current practices based on the manual production of resources. 
In order to do so, the different tools had to be tuned and adapted to maximize precision and for some tools the possibility to offer confidence measures that could allow a separation of the resources that still needed manual revision has been attempted. Furthermore, the extension to other languages in addition to English, also a PANACEA objective, has been evaluated. The main facts about the evaluation results are now summarized.","keywords":["PANACEA","evaluation","machine translation"],"pages":"","url":"http:\/\/hdl.handle.net\/10230\/22533","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131788,"last_updated":"2015-02-24 18:27:38","id_people":221631,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"D6. 2 Integrated Final Version of the Components for Lexical Acquisition","year":2012,"authors_people":"Rimell, Laura; Bel, N\u00faria; Padr\u00f3, Muntsa; Frontini, Francesca; Monachini, Monica; Quochi, Valeria","authors_cnr":["Frontini, Francesca","Monachini, Monica","Quochi, Valeria"],"authors_cnr_id":["8945","11893"],"authors_cnr_institute":["048","048","048"],"authors":["Rimell, L.","Bel, N.","Padr\u00f3, M.","Frontini, F.","Monachini, M.","Quochi, V."],"abstract":"The PANACEA project has addressed one of the most critical bottlenecks that threaten the development of technologies to support multilingualism in Europe, and to process the huge quantity of multilingual data produced annually. Any attempt at automated language processing, particularly Machine Translation (MT), depends on the availability of language-specific resources. Such Language Resources (LR) contain information about the language's lexicon, i.e. the words of the language and the characteristics of their use. 
In Natural Language Processing (NLP), LRs contribute information about the syntactic and semantic behaviour of words - i.e. their grammar and their meaning - which inform downstream applications such as MT. To date, many LRs have been generated by hand, requiring significant manual labour from linguistic experts. However, proceeding manually, it is impossible to supply LRs for every possible pair of European languages, textual domain, and genre, which are needed by MT developers. Moreover, an LR for a given language can never be considered complete nor final because of the characteristics of natural language, which continually undergoes changes, especially spurred on by the emergence of new knowledge domains and new technologies. PANACEA has addressed this challenge by building a factory of LRs that progressively automates the stages involved in the acquisition, production, updating and maintenance of LRs required by MT systems. The existence of such a factory will significantly cut down the cost, time and human effort required to build LRs. WP6 has addressed the lexical acquisition component of the LR factory, that is, the techniques for automated extraction of key lexical information from texts, and the automatic collation of lexical information into LRs in a standardized format. The goal of WP6 has been to take existing techniques capable of acquiring syntactic and semantic information from corpus data, improving upon them, adapting and applying them to multiple languages, and turning them into powerful and flexible techniques capable of supporting massive applications. One focus for improving the scalability and portability of lexical acquisition techniques has been to extend existing techniques with more powerful, less \"supervised\" methods. In NLP, the amount of supervision refers to the amount of manual annotation which must be applied to a text corpus before machine learning or other techniques are applied to the data to compile a lexicon. 
More manual annotation means more accurate training data, and thus a more accurate LR. However, given that it is impractical from a cost and time perspective to manually annotate the vast amounts of data required for multilingual MT across domains, it is important to develop techniques which can learn from corpora with less supervision. Less supervised methods are capable of supporting both large-scale acquisition and efficient domain adaptation, even in the domains where data is scarce. Another focus of lexical acquisition in PANACEA has been the need of LR users to tune the accuracy level of LRs. Some applications may require increased precision, or accuracy, where the application requires a high degree of confidence in the lexical information used. At other times a greater level of coverage may be required, with information about more words at the expense of some degree of accuracy. Lexical acquisition in PANACEA has investigated confidence thresholds for lexical acquisition to ensure that the ultimate users of LRs can generate lexical data from the PANACEA factory at the desired level of accuracy.","keywords":["Lexical Acquisition"],"pages":"","url":"http:\/\/www.panacea-lr.eu\/system\/deliverables\/PANACEA_D6.2.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131789,"last_updated":"2015-03-06 13:23:12","id_people":221650,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"D6. 
5 Merged dictionaries","year":2012,"authors_people":"Rimell, Laura; Bel, N\u00faria; Padr\u00f3, Muntsa; Frontini, Francesca; Monachini, Monica; Quochi, Valeria; Del Gratta, Riccardo","authors_cnr":["Frontini, Francesca","Monachini, Monica","Quochi, Valeria","Del Gratta, Riccardo"],"authors_cnr_id":["8945","11893","11933"],"authors_cnr_institute":["048","048","048","048"],"authors":["Rimell, L.","Bel, N.","Padr\u00f3, M.","Frontini, F.","Monachini, M.","Quochi, V.","Del Gratta, R."],"abstract":"This document presents the merged dictionaries delivered in PANACEA. Those dictionaries result from merging already existing lexica, generally for general domain, with domain specific lexica acquired using PANACEA platform. The domain specific lexica are presented and delivered in D6.3 and the merging repository that allowed the multilevel merging in D6.4.","keywords":["merged dictionaries","computational lexicon"],"pages":"","url":"http:\/\/www.panacea-lr.eu\/\/en\/deliverables\/list","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131794,"last_updated":"2015-02-24 18:30:12","id_people":221755,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"D6. 
3 Monolingual lexica for English, Spanish and Italian tuned for a particular domain (LAB and ENV)","year":2012,"authors_people":"Rimell, Laura; Bel, Nuria; Padr\u00f2, Muntsa; Frontini, Francesca; Monachini, Monica; Quochi, Valeria; Del Gratta, Riccardo","authors_cnr":["Frontini, Francesca","Monachini, Monica","Quochi, Valeria","Del Gratta, Riccardo"],"authors_cnr_id":["8945","11893","11933"],"authors_cnr_institute":["048","048","048","048"],"authors":["Rimell, L.","Bel, N.","Padr\u00f2, M.","Frontini, F.","Monachini, M.","Quochi, V.","Del Gratta, R."],"abstract":"This document presents the lexica acquired using PANACEA platform for Labour and Environment domains. The languages of the lexica are English, Spanish and Italian. The lexical information acquired depends on the language, according to the available tools in the platform.","keywords":["Lexicon Acquisition"],"pages":"","url":"http:\/\/www.panacea-lr.eu\/system\/deliverables\/PANACEA_D6.3.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131669,"last_updated":"2016-03-18 14:44:40","id_people":205232,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"The BioLexicon: a large-scale terminological resource for biomedical text mining","year":2011,"authors_people":"Paul Thompson, John McNaught, Simonetta Montemagni, Nicoletta Calzolari, Riccardo del Gratta, Vivian Lee, Simone Marchi, Monica Monachini, Piotr Pezik, Valeria Quochi, CJ Rupp, Yutaka Sasaki, Giulia Venturi, Dietrich Rebholz-Schuhmann, Sophia Ananiadou","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Monachini, Monica","Marchi, Simone","Quochi, Valeria","Del Gratta, Riccardo","Zamorani, Nicoletta"],"authors_cnr_id":["5595","8945","10442","11893","11933","26123"],"authors_cnr_institute":["048","048","048","048","048","048","048"],"authors":["Thompson, P.","McNaught, 
J.","Montemagni, S.","Calzolari, N.","Del Gratta, R.","Lee, V.","Marchi, S.","Monachini, M.","Pezik, P.","Quochi, V.","Rupp, C.","Sasaki, Y.","Venturi, G.","Rebholz Schuhmann, D.","Ananiadou, S."],"abstract":"Background Due to the rapidly expanding body of biomedical literature, biologists require increasingly sophisticated and efficient systems to help them to search for relevant information. Such systems should account for the multiple written variants used to represent biomedical concepts, and allow the user to search for specific pieces of knowledge (or events) involving these concepts, e.g., protein-protein interactions. Such functionality requires access to detailed information about words used in the biomedical literature. Existing databases and ontologies often have a specific focus and are oriented towards human use. Consequently, biological knowledge is dispersed amongst many resources, which often do not attempt to account for the large and frequently changing set of variants that appear in the literature. Additionally, such resources typically do not provide information about how terms relate to each other in texts to describe events. Results This article provides an overview of the design, construction and evaluation of a large-scale lexical and conceptual resource for the biomedical domain, the BioLexicon. The resource can be exploited by text mining tools at several levels, e.g., part-of-speech tagging, recognition of biomedical entities, and the extraction of events in which they are involved. As such, the BioLexicon must account for real usage of words in biomedical texts. In particular, the BioLexicon gathers together different types of terms from several existing data resources into a single, unified repository, and augments them with new term variants automatically extracted from biomedical literature. 
Extraction of events is facilitated through the inclusion of biologically pertinent verbs (around which events are typically organized) together with information about typical patterns of grammatical and semantic behaviour, which are acquired from domain-specific texts. In order to foster interoperability, the BioLexicon is modelled using the Lexical Markup Framework, an ISO standard. Conclusions The BioLexicon contains over 2.2 M lexical entries and over 1.8 M terminological variants, as well as over 3.3 M semantic relations, including over 2 M synonymy relations. Its exploitation can benefit both application developers and users. We demonstrate some such benefits by describing integration of the resource into a number of different tools, and evaluating improvements in performance that this can bring.","keywords":["Text Mining","Information Extraction","Computational Lexicon"],"pages":"1-29","url":"http:\/\/www.biomedcentral.com\/1471-2105\/12\/397","volume":"12","doi":"10.1186\/1471-2105-12-397","editors_people":"","editors":[""],"published":"BMC bioinformatics","publisher":"BioMed Central ([London], Regno Unito)","issn":"1471-2105","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131710,"last_updated":"2023-06-26 21:29:25","id_people":206410,"institutes":["ILC"],"type":"edited_volume","type_order":3,"type_people":"book","title":"Proceedings of the 3rd European Language Resources and Technologies Forum: Language Resources in the Sharing Age-the Strategic Agenda","year":2011,"authors_people":"Nicoletta Calzolari, Paola Baroni, Claudia Soria, Sara Goggi, Monica Monachini, Valeria Quochi","authors_cnr":["Monachini, Monica","Soria, Claudia","Goggi, Sara","Baroni, Paola","Quochi, Valeria","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10172","11332","11893","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Baroni, P.","Soria, C.","Goggi, S.","Monachini, M.","Quochi, V."],"abstract":"Proceedings of the third 
FLaReNet forum on the European Language Resources and Technologies, held in Venezia, at the Auditorium Santa Margherita of the Universit\u00e0 Ca' Foscari, on 26-27 May 2011.","keywords":["Language Resources","Language Technologies"],"pages":"86","url":"http:\/\/www.flarenet.eu\/sites\/default\/files\/FLaReNet_Forum_2011_Proceedings.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131686,"last_updated":"2013-02-27 11:57:04","id_people":205719,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Interoperability Framework: The FLaReNet action plan proposal","year":2011,"authors_people":"Nicoletta Calzolari, Monica Monachini, Valeria Quochi","authors_cnr":["Monachini, Monica","Quochi, Valeria"],"authors_cnr_id":["8945","11893"],"authors_cnr_institute":["048","048"],"authors":["Calzolari, N.","Monachini, M.","Quochi, V."],"abstract":"Standards are fundamental to ex-change, preserve, maintain and integrate data and language resources, and as an essential basis of any language resource infrastructure. This paper promotes an Interoperability Framework as a dynamic environment of standards and guidelines, also intended to support the provision of language-(web)service interoperability. In the past two decades, the need to define common practices and formats for linguistic resources has been increasingly recognized and sought. Today open, collaborative, shared data is at the core of a sound language strategy, and standardisation is actively on the move. 
This paper first describes the current landscape of standards, and presents the major barriers to their adoption; then, it describes those scenarios that critically involve the use of standards and provide a strong motivation for their adoption; lastly, a series of actions and steps needed to operationalise standards and achieve a full interoperability for Language Resources and Technologies are proposed.","keywords":["Language Resources","standards"],"pages":"41-49","url":"https:\/\/publications.cnr.it\/doc\/205719","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-974-466-564-5","conference_name":"Workshop on Language Resources, Technology and Services in the Sharing Paradigm","conference_place":"Chiang Mai","conference_date":"12 Novembre 2011"},{"id":131902,"last_updated":"2014-11-14 17:37:42","id_people":287125,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"The development of Light-'do' Verb Constructions in Italian","year":2011,"authors_people":"Quochi Valeria","authors_cnr":["Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":["048"],"authors":["Quochi, V."],"abstract":"This contribution presents the results of a study of the development of Light 'do' Verb Constructions in Italian based on naturalistic data. The claim is that there exists a Light Verb pivot schema that accounts for new productive formations and that this pattern is learnt by young children because it constitutes a labeling technique for naming new events, activities and situations. The findings of this research support two hypotheses of language acquisition. 
The results are based on analysis of longitudinal transcriptions of adult children interactions contained in the CHILDES databank (MacWhinney 2000).","keywords":["child language","construction grammar","light verb constructions"],"pages":"256-257","url":"http:\/\/sle2011.cilap.es\/downloads\/book_abstracts.pdf","volume":"","doi":"","editors_people":"Javier Mart\u00edn Arista","editors":["Arista, J. M."],"published":"SLE 2011-44TH ANNUAL MEETING BOOK OF ABSTRACT","publisher":"","issn":"","isbn":"","conference_name":"SLE 2011-44 TH ANNUAL MEETING","conference_place":"Logro\u00f1o, Spain","conference_date":"8-11 Settembre 2011"},{"id":131982,"last_updated":"2015-02-26 13:23:59","id_people":290606,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"The FLaReNet Databook","year":2011,"authors_people":"Arranz V., Bel N., Budin G., Caselli T., Choukri K., Del Gratta R., Frontini F., Goggi S., Monachini M., Quochi V., Rubino F., Russo I. et alii","authors_cnr":["Del Gratta, Riccardo","Caselli, Tommaso","Russo, Irene","Frontini, Francesca","Rubino, Francesco","Monachini, Monica","Goggi, Sara","Quochi, Valeria"],"authors_cnr_id":["8945","10172","11893"],"authors_cnr_institute":["048","048","048","048","048","048","048","048"],"authors":["Arranz, V.","Bel, N.","Budin, G.","Caselli, T.","Choukri, K.","Del Gratta, R.","Frontini, F.","Goggi, S.","Monachini, M.","Quochi, V.","Rubino, F.","Russo, I."],"abstract":"The FLaReNet Databook is not only the collection of all the factual material collected during the activities of the project, but also a set on innovative initiatives and instruments that will remain in place for the continuous collection of such \"facts\". 
The purpose of the Databook is in fact, on one side, to consolidate the analyses carried out in the project and, at the same time, to set up the proper mechanisms that will enable the provision of a continuous stream of relevant factual material, also after the end of the project.","keywords":["Language Resources (LRs)"],"pages":"1-8","url":"http:\/\/www.flarenet.eu\/?q=FLaReNet_Databook","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131708,"last_updated":"2015-02-26 10:47:02","id_people":206397,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Final FLaReNet deliverable: Language Resources for the Future-The Future of Language Resources","year":2011,"authors_people":"Nicoletta Calzolari, Nuria Bel, Khalid Choukri, Joseph Mariani, Monica Monachini, Jan Odijk, Stelios Piperidis, Valeria Quochi, Claudia Soria","authors_cnr":["Monachini, Monica","Soria, Claudia","Quochi, Valeria","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","11893","26123"],"authors_cnr_institute":["048","048","048"],"authors":["Calzolari, N.","Bel, N.","Choukri, K.","Mariani, J.","Monachini, M.","Odijk, J.","Piperidis, S.","Quochi, V.","Soria, C."],"abstract":"Language Technologies (LT), together with their backbone, Language Resources (LR), provide an essential support to the challenge of Multilingualism and ICT of the future. The main task of language technologies is to bridge language barriers and to help creating a new environment where information flows smoothly across frontiers and languages, no matter the country, and the language, of origin. To achieve this goal, all players involved need to act as a community able to join forces on a set of shared priorities. 
However, until now the field of Language Resources and Technology has long suffered from an excess of individuality and fragmentation, with a lack of coherence concerning the priorities for the field, the direction to move, not to mention a common timeframe. The context encountered by the FLaReNet project was thus represented by an active field needing a coherence that can only be given by sharing common priorities and endeavours. FLaReNet has contributed to the creation of this coherence by gathering a wide community of experts and making them participate in the definition of an exhaustive set of recommendations.","keywords":["language resources and technologies","infrastructures"],"pages":"97","url":"https:\/\/publications.cnr.it\/doc\/206397","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131712,"last_updated":"2013-03-12 12:20:30","id_people":206420,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"FLaReNet Strategic Language Resource Agenda","year":2011,"authors_people":"Nicoletta Calzolari, Valeria Quochi, Claudia Soria","authors_cnr":["Soria, Claudia","Quochi, Valeria"],"authors_cnr_id":["9887","11893"],"authors_cnr_institute":["048","048"],"authors":["Calzolari, N.","Quochi, V.","Soria, C."],"abstract":"Despite the complexity of handling its languages, the European Union has established that cultural and language differences are a unique asset to be preserved. Europe needs to find means - such as technological ones - to overcome the language barriers to support citizens and industry in a multilingual globalised world. The large majority of industrial technological applications that handle natural language, i.e. 
Machine Translation, Crosslingual Information Retrieval, Multilingual Information Extraction, Automatic Document Indexing, Question Answering, Natural Language Interfaces, etc., include Language Resources as critical components. Although Language Technologies may consist of language independent engines, they depend on the availability of language-dependent knowledge under the form of Language Resources for their real-life implementation. At the same time, it is proved that a critical mass of Language Resources can make advancement in research and technology development possible and quicker, making Europe the leader of the market related to multilingualism. Companies such as Google or Microsoft play a dominant role in this framework, as they have access to a huge amount of data in many different languages, devote considerable resources to Language Technologies, have massive computing power and a direct research-to-application pipeline using a new business model based on so-called \"free\" services. 
The fact that a US company like Google is delivering some of the most comprehensive Language Technology solutions to support multilingualism should raise concern among EU officials.","keywords":["Language resources","infrastructures"],"pages":"23","url":"https:\/\/publications.cnr.it\/doc\/206420","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131721,"last_updated":"2013-03-13 10:26:59","id_people":206507,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"The Standards' Landscape Towards an Interoperability Framework","year":2011,"authors_people":"Monica Monachini, Valeria Quochi, Nicoletta Calzolari, N\u00faria Bel, Gerhard Budin, Tommaso Caselli, Khalid Choukri, Gil Francopoulo, Erhard Hinrichs, Steven Krauwer, Lothar Lemnitzer, Joseph Mariani, Jan Odijk, Stelios Piperidis, Adam Przepiorkowski, Laurent Romary, Helmut Schmidt, Hans Uszkoreit, Peter Wittenburg","authors_cnr":["Caselli, Tommaso","Monachini, Monica","Quochi, Valeria"],"authors_cnr_id":["8945","11893"],"authors_cnr_institute":["048","048","048"],"authors":["Monachini, M.","Quochi, V.","Calzolari, N.","Bel, N.","Budin, G.","Caselli, T.","Choukri, K.","Francopoulo, G.","Hinrichs, E.","Krauwer, S.","Lemnitzer, L.","Mariani, J.","Odijk, J.","Piperidis, S.","Przepiorkowski, A.","Romary, L.","Schmidt, H.","Uszkoreit, H.","Wittenburg, P."],"abstract":"This document proposes an overview of the current scene towards an Interoperability Framework and acts as a reference point for the current standards that the community fosters and encourages to adopt\/improve. This initiative is in close synchronization with other relevant initiatives such as CLARIN, ELRA, ISO and TEI and META-Share. 
The document builds on the CLARIN Standardisation Action Plan and adapts and extends it to the needs of the broader LT Community, beyond the SSH research areas including the industry. The main goal of this document is to give a practical orientation for various LT players, both commercial and academic; the main message being that a harmonized domain of language resources and technology can be achieved stepwise, but that an effort to adopt standards is necessary to overcome fragmentation. NB: This is to be intended by no means as a static, closed document, rather a dynamic one which needs to be constantly\/periodically revised and updated by the community itself.","keywords":["Standards","interoperability"],"pages":"23","url":"https:\/\/publications.cnr.it\/doc\/206507","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131250,"last_updated":"2012-06-05 10:38:01","id_people":84809,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"The LREC Map of Language Resources and Technologies","year":2010,"authors_people":"Calzolari N.; Soria C.; Del Gratta R.; Goggi S.; Quochi V.; Russo I.; Choukri K.; Mariani J.; Piperidis S.","authors_cnr":["Russo, Irene","Soria, Claudia","Goggi, Sara","Quochi, Valeria","Del Gratta, Riccardo"],"authors_cnr_id":["9887","10172","11893","11933"],"authors_cnr_institute":["048","048","048","048","048"],"authors":["Calzolari, N.","Soria, C.","Del Gratta, R.","Goggi, S.","Quochi, V.","Russo, I.","Choukri, K.","Mariani, J.","Piperidis, S."],"abstract":"In this paper we present the LREC Map of Language Resources (data and tools), an innovative feature introduced in conjunction with the LREC 2010 Conference. 
The purpose of the Map is to shed light on the vast amount of resources that represent the background of the research presented at LREC, in the attempt to fill in a gap in the community knowledge about the resources that are used or created worldwide. It also aims at a change of culture in the field, actively engaging each researcher in the documentation task about resources. The Map has been developed on the basis of the information provided by LREC authors during the submission of papers to the LREC 2010 conference and the LREC workshops, and contains information about almost 2000 resources. The paper illustrates the motivation behind this initiative, its main characteristics, its relevance and future impact in the field, the metadata used to describe the resources, and finally presents some of the most relevant findings.","keywords":["LR national\/international projects","organizational\/policy issues"],"pages":"949-956","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2010\/index.html","volume":"","doi":"","editors_people":"Nicoletta Calzolari (Conference Chair); Khalid Choukri; Bente Maegaard; Joseph Mariani; Jan Odjik; Stelios Piperidis; Mike Rosner; Daniel Tapias","editors":["Calzolari, N.","Choukri, K.","Maegaard, B.","Mariani, J.","Odjik, J.","Piperidis, S.","Rosner, M.","Tapias, D."],"published":"LREC'10-Seventh International Conference on Language Resources and Evaluation. 
Proceedings","publisher":"European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)","issn":"","isbn":"2-9517408-6-7","conference_name":"LREC 2010 Seventh International Conference on Language Resources and Evaluation","conference_place":"Valletta, Malta","conference_date":"17-23 May 2010"},{"id":131225,"last_updated":"2012-06-08 12:07:42","id_people":84782,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"A Web-based Architecture for Interoperability of Lexical Resources","year":2010,"authors_people":"Del Gratta R.; D'Onofrio L.; Bartolini R.; Caselli T.; Enea A.; Monachini M.; Quochi V.; Soria C.; Toral A.; Calzolari N.","authors_cnr":["Caselli, Tommaso","Enea, Alessandro","Monachini, Monica","Soria, Claudia","Bartolini, Roberto","Quochi, Valeria","Del Gratta, Riccardo","Zamorani, Nicoletta"],"authors_cnr_id":["8533","8945","9887","10441","11893","11933","26123"],"authors_cnr_institute":["048","048","048","048","048","048","048"],"authors":["Del Gratta, R.","D'Onofrio, L.","Bartolini, R.","Caselli, T.","Enea, A.","Monachini, M.","Quochi, V.","Soria, C.","Toral, A.","Calzolari, N."],"abstract":"In this paper we present aWeb Service Architecture for managing high level interoperability of Language Resources (LRs) by means of a Service Oriented Architecture (SOA) and the use of ISO standards, such as ISO LMF. We propose a layered architecture which separates the management of legacy resources (data collection) from data aggregation (workflow) and data access (user requests). 
We provide a case study to demonstrate how the proposed architecture is capable of managing data exchange among different lexical services in a coherent way and show how the use of a lexical standard becomes of primary importance when a protocol of interoperability is defined.","keywords":["Interoperability","Web sercives","Lexical resources"],"pages":"53-62","url":"http:\/\/weblab.iit.cnr.it\/kyoto\/www2.let.vu.nl\/twiki\/pub\/Kyoto\/Publications\/icgl2010_DOnofrioetal.pdf","volume":"","doi":"","editors_people":"A. Chengyu Fang; N. Ide; J. Webster","editors":["Fang, A. C.","Ide, N.","Webster, J."],"published":"2nd International Conference on Global Interoperability for Language Resources, ICGL 2010","publisher":"City university of Hong Kong press (Hong Kong, CHN)","issn":"","isbn":"978-962-442-323-5","conference_name":"2nd International Conference on Global Interoperability for Language Resources","conference_place":"Hong Kong","conference_date":"18-20 January 2010"},{"id":131226,"last_updated":"2016-01-14 15:24:41","id_people":84783,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Capturing Coercions in Texts: a First Annotation Exercise","year":2010,"authors_people":"Jezek E.; Quochi V.","authors_cnr":["Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":["048"],"authors":["Jezek, E.","Quochi, V."],"abstract":"In this paper we report the first results of an annotation exercise of argument coercion phenomena performed on Italian texts. Our corpus consists of ca 4000 sentences from the PAROLE sottoinsieme corpus (Bindi et al. 2000) annotated with Selection and Coercion relations among verb-noun pairs formatted in XML according to the Generative Lexicon Mark-up Language (GLML) format (Pustejovsky et al., 2008). For the purposes of coercion annotation, we selected 26 Italian verbs that impose semantic typing on their arguments in either Subject, Direct Object or Complement position. 
Every sentence of the corpus is annotated with the source type for the noun arguments by two annotators plus a judge. An overall agreement of 0.87 kappa indicates that the annotation methodology is reliable. A qualitative analysis of the results allows us to outline some suggestions for improvement of the task: 1) a different account of complex types for nouns has to be devised and 2) a more comprehensive account of coercion mechanisms requires annotation of the deeper meaning dimensions that are targeted in coercion operations, such as those captured by Qualia relations.","keywords":["Corpus (creation","annotation","etc.)","Knowledge Discovery\/Representation","Semantics"],"pages":"1464-1471","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2010\/summaries\/713.html","volume":"","doi":"","editors_people":"Nicoletta Calzolari, Khalid Choukri, Bente Maegaard, Joseph Mariani, Jan Odjik, Stelios Piperidis, Mike Rosner, Daniel Tapias","editors":["Calzolari, N.","Choukri, K.","Maegaard, B.","Mariani, J.","Odjik, J.","Piperidis, S.","Rosner, M.","Tapias, D."],"published":"Proceedings of the Seventh International Conference on Language Resources and Evaluation-LREC'10","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"2-9517408-6-7","conference_name":"Seventh International Conference on Language Resources and Evaluation","conference_place":"Valletta, Malta","conference_date":"17-23 Maggio 2010"},{"id":131217,"last_updated":"2015-02-25 18:21:02","id_people":84771,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"SemEval-2010 Task 7: Argument Selection and Coercion","year":2010,"authors_people":"Pustejovsky J.; Rumshisky A.; Plotnick A.; Jezek E.; Batiukova O.; Quochi V.","authors_cnr":["Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":[""],"authors":["Pustejovsky, J.","Rumshisky, A.","Plotnick, A.","Jezek, E.","Batiukova, O.","Quochi, V."],"abstract":"The 
paper describes the Argument Selection and Coercion task for the SemEval-2010 evaluation exercise, which involves characterizing the type of compositional operation that exists between a predicate and the arguments it selects. Specifically, the goal is to identify whether the type that a verb selects is satisfied directly by the argument, or whether the argument must change type to satisfy the verb typing.","keywords":["semantic annotation","verb coercion"],"pages":"","url":"http:\/\/www.aclweb.org\/anthology\/S10-1005","volume":"","doi":"","editors_people":"Erk, Katrin; Strapparava, Carlo","editors":["Erk, K.","Strapparava, C."],"published":"Proceedings of the 5th International Workshop on Semantic Evaluation","publisher":"Association for Computational Linguistics (Stroudsburg, USA)","issn":"","isbn":"978-1-932432-70-1","conference_name":"Fifth International Workshop on Semantic Evaluation (SemEval 2010)","conference_place":"Uppsala","conference_date":"15-16 Luglio 2010"},{"id":131618,"last_updated":"2015-04-21 11:32:18","id_people":157488,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ECP-2007-LANG-617001 FLaReNet: Progress Report No. 
4","year":2010,"authors_people":"Calzolari N.; Soria C.; Baroni P.; Quochi V.; Bel N.; Budin G.; Choukri K.; Mariani J.; Odijk J.; Piperidis S.","authors_cnr":["Soria, Claudia","Baroni, Paola","Quochi, Valeria"],"authors_cnr_id":["9887","11332","11893"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Soria, C.","Baroni, P.","Quochi, V.","Bel, N.","Budin, G.","Choukri, K.","Mariani, J.","Odijk, J.","Piperidis, S."],"abstract":"","keywords":["Language Resources"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157488","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131976,"last_updated":"2014-11-28 19:10:25","id_people":288752,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Usage scenarios and basic workflows","year":2009,"authors_people":"Valeria Quochi","authors_cnr":["Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":["048"],"authors":["Quochi, V."],"abstract":"","keywords":[""],"pages":"5-5","url":"http:\/\/www.clarin.eu\/sites\/default\/files\/CLARIN_Newsletter_no_6.pdf","volume":"6","doi":"","editors_people":"","editors":[""],"published":"CLARIN Newsletter","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":130900,"last_updated":"2012-06-28 13:49:59","id_people":30876,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"A Standard Lexical-Terminological Resource for the Bio Domain","year":2009,"authors_people":"Quochi V.; Del Gratta R.; Sassolini E.; Bartolini R.; Monachini M.; Calzolari N.","authors_cnr":["Quochi, Valeria","Del Gratta, Riccardo","Monachini, Monica","Bartolini, Roberto","Sassolini, Eva","Zamorani, Nicoletta"],"authors_cnr_id":["8945","10441","11032","26123"],"authors_cnr_institute":[""],"authors":["Quochi, V.","Del Gratta, R.","Sassolini, 
E.","Bartolini, R.","Monachini, M.","Calzolari, N."],"abstract":"The present paper describes a large-scale lexical resource for the biology domain designed both for human and for machine use. This lexicon aims at semantic interoperability and extendability, through the adoption of ISO-LMF standard for lexical representation and through a granular and distributed encoding of relevant information. The first part of this contribution focuses on three aspects of the model that are of particular interest to the biology community: the treatment of term variants, the representation on bio events and the alignment with a domain ontology. The second part of the paper describes the physical implementation of the model: a relational database equipped with a set of automatic uploading procedures. Peculiarity of the BioLexicon is that it combines features of both terminologies and lexicons. A set verbs relevant for the domain is also represented with full details on their syntactic and semantic argument structure.","keywords":["Lexical representation model","Lexical Database","Computational Lexicography","Special Domains","Standards"],"pages":"325-335","url":"https:\/\/publications.cnr.it\/doc\/30876","volume":"5603","doi":"10.1007\/978-3-642-04235-5_28","editors_people":"","editors":[""],"published":"Lecture notes in computer science","publisher":"Springer (Berlin, Germania)","issn":"0302-9743","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131647,"last_updated":"2023-06-26 21:27:07","id_people":183877,"institutes":["ILC"],"type":"edited_volume","type_order":3,"type_people":"book","title":"Proceedings of the 1st European Language Resources and Technologies Forum: Shaping the Future of the Multilingual Digital Europe","year":2009,"authors_people":"Calzolari N.; Baroni P.; Bel N.; Budin G.; Choukri K.; Goggi S.; Mariani J.; Monachini M.; Odijk J.; Piperidis S.; Quochi V.; Soria C.; Toral A.","authors_cnr":["Toral Ruiz, Antonio","Monachini, 
Monica","Soria, Claudia","Goggi, Sara","Baroni, Paola","Quochi, Valeria","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10172","11332","11893","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Baroni, P.","Bel, N.","Budin, G.","Choukri, K.","Goggi, S.","Mariani, J.","Monachini, M.","Odijk, J.","Piperidis, S.","Quochi, V.","Soria, C.","Toral, A."],"abstract":"Proceedings of the first FLaReNet Forum on the European Language Resources and Technologies, held in Vienna, at the Austrian Academy of Science, on 12-13 February 2009.","keywords":["Language Resources","Language Technologies","Multilingual","Digital"],"pages":"105","url":"http:\/\/www.flarenet.eu\/sites\/default\/files\/Vienna09_Proceedings.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131201,"last_updated":"1970-01-01 01:00:00","id_people":84752,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Relevance of Qualia Relations in Coercive Contexts","year":2009,"authors_people":"Jezek E.; Quochi V.; Calzolari N.","authors_cnr":["Quochi, Valeria","Zamorani, Nicoletta"],"authors_cnr_id":["26123"],"authors_cnr_institute":[""],"authors":["Jezek, E.","Quochi, V.","Calzolari, N."],"abstract":"","keywords":["annotation","annotation scheme","semantics","type shift"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84752","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"5th International Conference on Generative Approaches to the Lexicon","conference_place":"Pisa","conference_date":"2009"},{"id":131595,"last_updated":"2010-11-20 00:00:00","id_people":157465,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ECP-2007-LANG-617001 FLaReNet: Dissemination 
Plan","year":2009,"authors_people":"Calzolari N.; Baroni P.; Goggi S.; Monachini M.; Quochi V.; Soria C.; Toral A.","authors_cnr":["Quochi, Valeria","Monachini, Monica","Soria, Claudia","Goggi, Sara","Baroni, Paola","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10172","11332","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Baroni, P.","Goggi, S.","Monachini, M.","Quochi, V.","Soria, C.","Toral, A."],"abstract":"","keywords":["Language Resources"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157465","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131598,"last_updated":"2015-04-21 11:32:34","id_people":157468,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ECP-2007-LANG-617001 FLaReNet: Progress Report No. 1","year":2009,"authors_people":"Calzolari N.; Baroni P.; Goggi S.; Monachini M.; Quochi V.; Soria C.; Toral A.","authors_cnr":["Quochi, Valeria","Monachini, Monica","Soria, Claudia","Goggi, Sara","Baroni, Paola","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10172","11332","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Baroni, P.","Goggi, S.","Monachini, M.","Quochi, V.","Soria, C.","Toral, A."],"abstract":"","keywords":["Language Resources"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157468","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131597,"last_updated":"2015-04-21 11:32:49","id_people":157467,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ECP-2007-LANG-617001 FLaReNet: Progress Report No. 
2","year":2009,"authors_people":"Calzolari N.; Monachini M.; Soria C.; Baroni P.; Goggi S.; Quochi V.; Toral A.","authors_cnr":["Quochi, Valeria","Monachini, Monica","Soria, Claudia","Goggi, Sara","Baroni, Paola","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10172","11332","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Monachini, M.","Soria, C.","Baroni, P.","Goggi, S.","Quochi, V.","Toral, A."],"abstract":"","keywords":["Language Resources"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157467","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131592,"last_updated":"2010-11-20 00:00:00","id_people":157462,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ECP-2007-LANG-617001 FLaReNet: Action Plan","year":2009,"authors_people":"Calzolari N.; Soria C.; Baroni P.; Caselli T.; Goggi S.; Monachini M.; Quochi V.; Toral A.; Bel N.; Budin G.; Choukri K.; Mariani J.; Odijk J.; Piperidis S.","authors_cnr":["Quochi, Valeria","Caselli, Tommaso","Monachini, Monica","Soria, Claudia","Goggi, Sara","Baroni, Paola","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10172","11332","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Soria, C.","Baroni, P.","Caselli, T.","Goggi, S.","Monachini, M.","Quochi, V.","Toral, A.","Bel, N.","Budin, G.","Choukri, K.","Mariani, J.","Odijk, J.","Piperidis, S."],"abstract":"","keywords":["Language Resources"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157462","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131596,"last_updated":"2010-11-20 00:00:00","id_people":157466,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ECP-2007-LANG-617001 
FLaReNet: Evaluation Plan for the functioning of the Network","year":2009,"authors_people":"Calzolari N.; Soria C.; Baroni P.; Goggi S.; Monachini M.; Quochi V.; Toral A.","authors_cnr":["Quochi, Valeria","Monachini, Monica","Soria, Claudia","Goggi, Sara","Baroni, Paola","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10172","11332","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Soria, C.","Baroni, P.","Goggi, S.","Monachini, M.","Quochi, V.","Toral, A."],"abstract":"","keywords":["Language Resources"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157466","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131593,"last_updated":"2010-11-20 00:00:00","id_people":157463,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ECP-2007-LANG-617001 FLaReNet: Annual Report No. 1","year":2009,"authors_people":"Calzolari N.; Soria C.; Baroni P.; Monachini M.; Quochi V.","authors_cnr":["Quochi, Valeria","Monachini, Monica","Soria, Claudia","Baroni, Paola","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","11332","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Soria, C.","Baroni, P.","Monachini, M.","Quochi, V."],"abstract":"","keywords":["Language Resources"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157463","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131599,"last_updated":"2010-11-20 00:00:00","id_people":157469,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ECP-2007-LANG-617001 FLaReNet: Project Presentation","year":2009,"authors_people":"Calzolari N.; Soria C.; Baroni P.; Monachini M.; Quochi V.; Toral A.","authors_cnr":["Quochi, Valeria","Monachini, Monica","Soria, 
Claudia","Baroni, Paola","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","11332","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Soria, C.","Baroni, P.","Monachini, M.","Quochi, V.","Toral, A."],"abstract":"","keywords":["Language Resources"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157469","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131594,"last_updated":"2015-02-26 11:35:48","id_people":157464,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ECP-2007-LANG-617001 FLaReNet: Blueprint of actions and infrastructures No. 1","year":2009,"authors_people":"Calzolari N.; Soria C.; Bel N.; Budin G.; Caselli T.; Choukri K.; Mariani J.; Monachini M.; Odijk J.; Piperidis S.; Quochi V.; Toral A.","authors_cnr":["Quochi, Valeria","Caselli, Tommaso","Monachini, Monica","Soria, Claudia","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","26123"],"authors_cnr_institute":["048","","048","048","048"],"authors":["Calzolari, N.","Soria, C.","Bel, N.","Budin, G.","Caselli, T.","Choukri, K.","Mariani, J.","Monachini, M.","Odijk, J.","Piperidis, S.","Quochi, V.","Toral, A."],"abstract":"","keywords":["Language Resources","Infrastructures","Recommendations"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157464","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131601,"last_updated":"2023-07-05 06:28:56","id_people":157471,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"The European Language Resources and Technologies Forum: Shaping the Future of the Multilingual Digital Europe","year":2009,"authors_people":"Calzolari N.; Baroni P.; Bel N.; Budin G.; Choukri K.; Goggi S.; Mariani J.; Monachini M.; Odijk J.; 
Piperidis S.; Quochi V.; Soria C.; Toral A.","authors_cnr":["Quochi, Valeria","Monachini, Monica","Soria, Claudia","Goggi, Sara","Baroni, Paola","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10172","11332","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Baroni, P.","Bel, N.","Budin, G.","Choukri, K.","Goggi, S.","Mariani, J.","Monachini, M.","Odijk, J.","Piperidis, S.","Quochi, V.","Soria, C.","Toral, A."],"abstract":"","keywords":["Language Resources","Language Technologies"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157471","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131587,"last_updated":"2010-11-20 00:00:00","id_people":157457,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Extended Report of: The European Language Resources and Technologies Forum: Shaping the Future of the Multilingual Digital Europe","year":2009,"authors_people":"Calzolari N.; Bel N.; Budin G.; Choukri K.; Mariani J.; Odijk J.; Piperidis S.; Baroni P.; Goggi S.; Monachini M.; Quochi V.; Soria C.; Toral A.","authors_cnr":["Quochi, Valeria","Monachini, Monica","Soria, Claudia","Goggi, Sara","Baroni, Paola","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10172","11332","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Bel, N.","Budin, G.","Choukri, K.","Mariani, J.","Odijk, J.","Piperidis, S.","Baroni, P.","Goggi, S.","Monachini, M.","Quochi, V.","Soria, C.","Toral, A."],"abstract":"","keywords":["Language Resources","Language Technologies"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157457","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131590,"last_updated":"2013-09-03 
16:53:56","id_people":157460,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Short Report of The European Language Resources and Technologies Forum: Shaping the Future of the Multilingual Digital Europe","year":2009,"authors_people":"Calzolari N.; Bel N.; Budin G.; Choukri K.; Mariani J.; Odijk J.; Piperidis S.; Baroni P.; Goggi S.; Monachini M.; Quochi V.; Soria C.; Toral A.","authors_cnr":["Quochi, Valeria","Monachini, Monica","Soria, Claudia","Goggi, Sara","Baroni, Paola","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10172","11332","26123"],"authors_cnr_institute":["048"],"authors":["Calzolari, N.","Bel, N.","Budin, G.","Choukri, K.","Mariani, J.","Odijk, J.","Piperidis, S.","Baroni, P.","Goggi, S.","Monachini, M.","Quochi, V.","Soria, C.","Toral, A."],"abstract":"","keywords":["Language Resources","Language Technologies"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157460","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131182,"last_updated":"2013-06-26 16:13:14","id_people":84731,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Using LMF to Shape a Lexicon for the Biomedical Domain","year":2008,"authors_people":"Monachini M.; Quochi V.; Del Gratta R.; Calzolari N.","authors_cnr":["Quochi, Valeria","Del Gratta, Riccardo","Monachini, Monica","Zamorani, Nicoletta"],"authors_cnr_id":["8945","26123"],"authors_cnr_institute":["048"],"authors":["Monachini, M.","Quochi, V.","Del Gratta, R.","Calzolari, N."],"abstract":"This paper describes the design, implementation and population of the BioLexicon in the framework of BootStrep, an FP6 project. The BioLexicon (BL) is a lexical resource designed for text mining in the bio-domain. 
It has been conceived to meet both domain requirements and upcoming ISO standards for lexical representation. The data model and data categories are compliant to the ISO Lexical Markup Framework and the Data Category Registry. The BioLexicon integrates features of lexicons and terminologies: term entries (and variants) derived from existing resources are enriched with linguistic features, including sub-categorization and predicate-argument information, extracted from texts. Thus, it is an extendable resource. Furthermore, the lexical entries will be aligned to concepts in the BioOntology, the ontological resource of the project. The BL implementation is an extensible relational database with automatic population procedures. Population relies on a dedicated input data structure allowing to upload terms and their linguistic properties and \"pull-and-push\" them in the database. The BioLexicon teaches that the state-of-the-art is mature enough to aim at setting up a standard in this domain. Being conformant to lexical standards, the BioLexicon is interoperable and portable to other areas.","keywords":["Domain terminologies","Computational lexicons","Lexical standards","Lexical architectures"],"pages":"153-157","url":"https:\/\/publications.cnr.it\/doc\/84731","volume":"","doi":"","editors_people":"C. Delogu; M. 
Falcone (eds.)","editors":["Delogu, C.","Falcone, M."],"published":"","publisher":"","issn":"","isbn":"","conference_name":"LangTech 2008-Tecnologia applicata alla linguistica","conference_place":"Roma","conference_date":"28-29 February 2008"},{"id":131974,"last_updated":"2014-11-28 16:07:22","id_people":288714,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Learning properties of Noun Phrases: from data to functions","year":2008,"authors_people":"Quochi, Valeria; Calderone, Basilio","authors_cnr":["Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":["048"],"authors":["Quochi, V.","Calderone, B."],"abstract":"The paper presents two experiments of unsupervised classification of Italian noun phrases. The goal of the experiments is to identify the most prominent contextual properties that allow for a functional classification of noun phrases. For this purpose, we used a Self Organizing Map is trained with syntactically-annotated contexts containing noun phrases. The contexts are defined by means of a set of features representing morpho-syntactic properties of both nouns and their wider contexts. Two types of experiments have been run: one based on noun types and the other based on noun tokens. The results of the type simulation show that when frequency is the most prominent classification factor, the network isolates idiomatic or fixed phrases. The results of the token simulation experiment, instead, show that, of the 3 6 attributes represented in the original input matrix, only a few of them are prominent in the re-organization of the map. In particular, key features in the emergent macro-classification are the type of determiner and the grammatical number of the noun. An additional but not less interesting result is an organization into semantic\/pragmatic micro-classes. 
In conclusions, our result confirm the relative prominence of determiner type and grammatical number in the task of noun (phrase) categorization.","keywords":["cognitive linguistics","noun phrase"],"pages":"2596-2602","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2008\/summaries\/644.html","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"2-9517408-4-0","conference_name":"Sixth International Conference on Language Resources and Evaluation (LREC'08)","conference_place":"Marrakech, Morocco","conference_date":"28-30 Maggio"},{"id":131153,"last_updated":"2015-02-04 12:06:01","id_people":84700,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"A lexicon for biology and bioinformatics: the BOOTStrep experience","year":2008,"authors_people":"Quochi V.; Monachini M.; Del Gratta R.; Calzolari N.","authors_cnr":["Quochi, Valeria","Del Gratta, Riccardo","Monachini, Monica","Zamorani, Nicoletta"],"authors_cnr_id":["8945","26123"],"authors_cnr_institute":[""],"authors":["Quochi, V.","Monachini, M.","Del Gratta, R.","Calzolari, N."],"abstract":"","keywords":["Lexicon","Ontologies","Lexical database"],"pages":"2285-2292","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2008\/pdf\/576_paper.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"2-9517408-4-0","conference_name":"LREC 2008, Sixth International Conference on Language Resources and Evaluation","conference_place":"Marrakech, Marocco","conference_date":"26-05\/1-06-2008"},{"id":131166,"last_updated":"2013-06-07 18:01:12","id_people":84714,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Lexically-based Ontologies and Ontologically Based Lexicons","year":2008,"authors_people":"Toral Ruiz A.; Quochi V.; Del Gratta R.; Monachini M.; Soria C.; 
Calzolari N.","authors_cnr":["Quochi, Valeria","Del Gratta, Riccardo","Toral Ruiz, Antonio","Monachini, Monica","Soria, Claudia","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","26123"],"authors_cnr_institute":["048"],"authors":["Toral, R. A.","Quochi, V.","Del Gratta, R.","Monachini, M.","Soria, C.","Calzolari, N."],"abstract":"This paper deals with the relations between ontologies and lexicons. We study the role of these two components and their evolution during the last years in the field of Computational Linguistics. Subsequently, we survey the current lines of research at ILC-CNR which tackle this topic. They involve (I) the reuse of already existing Lexical Resources to derive formal ontologies, (II) the conversion and combination of terminologies into rich and formal Lexical Resources and (III) the use of formal ontologies as the backbone of multilingual Lexical Resources.","keywords":["Resource Infrastructure","UIMA","Clarin"],"pages":"49-59","url":"https:\/\/publications.cnr.it\/doc\/84714","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"AI*IA 2008-10th Congress of Italian Association for Artificial Intelligence","conference_place":"Cagliari","conference_date":"11-13 Settembre 2008"},{"id":131128,"last_updated":"2015-02-25 18:27:20","id_people":84670,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Inferring the semantics of temporal prepositions in Italian","year":2007,"authors_people":"Caselli T., Quochi V.","authors_cnr":["Quochi, Valeria","Caselli, Tommaso"],"authors_cnr_id":[""],"authors_cnr_institute":["048","048"],"authors":["Caselli, T.","Quochi, V."],"abstract":"","keywords":["italian","prepositions","computational linguistics"],"pages":"38-44","url":"http:\/\/www.aclweb.org\/anthology\/W07-1606","volume":"","doi":"","editors_people":"Fintan Costello, John Kelleher and Martin Volk","editors":["Costello, 
F.","Kelleher, J.","Volk, M."],"published":"Proceedings of the Fourth ACL-SIGSEM Workshop on Prepositions","publisher":"Association for Computational Linguistics (Stroudsburg, USA)","issn":"","isbn":"","conference_name":"Fourth ACL-SIGSEM Workshop on Prepositions","conference_place":"Prague, Czech Republic","conference_date":"28\/07\/2007"},{"id":131133,"last_updated":"2013-06-07 17:17:27","id_people":84676,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Lexical Relations and Domain Knowledge: The BioLexicon Meets the Qualia Structure","year":2007,"authors_people":"Monachini M., Quochi V., Ruimy N., Calzolari N.","authors_cnr":["Quochi, Valeria","Monachini, Monica","Ruimy, Nilda","Zamorani, Nicoletta"],"authors_cnr_id":["8945","18402","26123"],"authors_cnr_institute":["048"],"authors":["Monachini, M.","Quochi, V.","Ruimy, N.","Calzolari, N."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84676","volume":"","doi":"","editors_people":"P. Bouillon, L. Danlos, K. 
Kanzaki (eds.)","editors":["Bouillon, P.","Danlos, L.","Kanzaki, K."],"published":"","publisher":"","issn":"","isbn":"","conference_name":"GL2007: Fourth International Conference on Generative Approaches to the Lexicon","conference_place":"Parigi","conference_date":"10-11 Maggio 2007"},{"id":131186,"last_updated":"2013-06-25 17:38:57","id_people":84735,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Toward a Standard Lexical Resource in the Bio Domain","year":2007,"authors_people":"Quochi V.; Del Gratta R.; Sassolini E.; Monachini M.; Calzolari N.","authors_cnr":["Quochi, Valeria","Del Gratta, Riccardo","Monachini, Monica","Sassolini, Eva","Zamorani, Nicoletta"],"authors_cnr_id":["8945","11032","26123"],"authors_cnr_institute":["048"],"authors":["Quochi, V.","Del Gratta, R.","Sassolini, E.","Monachini, M.","Calzolari, N."],"abstract":"The present paper describes a large-scale lexical resource for the biology domain designed both for human and for machine use. This lexicon aims at semantic interoperability and extendability, through the adoption of ISO-LMF standard for lexical representation and through a granular and distributed encoding of relevant information. The first part of this contribution focuses on three aspects of the model that are of particular interest to the biology community: the treatment of term variants, the representation on bio events and the alignment with a domain ontology. The second part of the paper describes the physical implementation of the model: a relational database equipped with a set of automatic uploading procedures. Peculiarity of the BioLexicon is that it combines features of both terminologies and lexicons. 
A set verbs relevant for the domain is also represented with full details on their syntactic and semantic argument structure.","keywords":["Lexical representation model","Lexical Database","Computational Lexicography","Special Domains","Standards"],"pages":"295-299","url":"https:\/\/publications.cnr.it\/doc\/84735","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"Fundacja Uniwersytetu im A. Mickiewicza (Poznan, POL)","issn":"","isbn":"978-83-7177-413-3","conference_name":"LTC07-3rd Language and Technology Conference: Human Language Technology. Challenges of the Information Society","conference_place":"Poznan, Poland","conference_date":"5-7 Ottobre 2007"},{"id":131903,"last_updated":"2014-11-14 17:42:28","id_people":287126,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Emergent Cognitive Functions of the Noun Phrase","year":2007,"authors_people":"Basilio Calderone; Valeria Quochi","authors_cnr":["Quochi, Valeria"],"authors_cnr_id":["11893"],"authors_cnr_institute":["048"],"authors":["Calderone, B.","Quochi, V."],"abstract":"","keywords":["noun phrase","emergence of language"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/287126","volume":"","doi":"","editors_people":"","editors":[""],"published":"SLE 2007 Annual Meeting Book of Abstracts","publisher":"","issn":"","isbn":"","conference_name":"SLE 2007 Annual Meeting","conference_place":"Joensuu, Finlandia","conference_date":"28\/08\/2007-01\/09\/2007"},{"id":131574,"last_updated":"2009-06-16 00:00:00","id_people":157444,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"FLaReNet: Fostering Language Resources Network. 
Grant Agreement n\u00b0 617001, eContentPlus","year":2007,"authors_people":"Calzolari N., Monachini M., Quochi V., Soria C., Goggi S., Baroni P.","authors_cnr":["Quochi, Valeria","Baroni, Paola","Monachini, Monica","Soria, Claudia","Goggi, Sara","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10172","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Monachini, M.","Quochi, V.","Soria, C.","Goggi, S.","Baroni, P."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157444","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131572,"last_updated":"2009-06-16 00:00:00","id_people":157442,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"TimeML: An Ontological Mapping onto the UIMA Type Systems","year":2007,"authors_people":"Del Gratta R., Bartolini R., Caselli T., Enea A., Monachini M., Quochi V., Sassolini V.","authors_cnr":["Sassolini, Eva","Quochi, Valeria","Del Gratta, Riccardo","Caselli, Tommaso","Enea, Alessandro","Monachini, Monica","Bartolini, Roberto"],"authors_cnr_id":["8533","8945","10441"],"authors_cnr_institute":[""],"authors":["Del Gratta, R.","Bartolini, R.","Caselli, T.","Enea, A.","Monachini, M.","Quochi, V.","Sassolini, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157442","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131555,"last_updated":"2014-11-28 16:39:39","id_people":157425,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Bio-Lexicon DataBase: Architecture, Concepts and Loading Software","year":2007,"authors_people":"Del Gratta R., Monachini M., Quochi V., Sassolini E., Calzolari 
N.","authors_cnr":["Sassolini, Eva","Quochi, Valeria","Del Gratta, Riccardo","Monachini, Monica","Zamorani, Nicoletta"],"authors_cnr_id":["8945","26123"],"authors_cnr_institute":["048","048","048","048","048"],"authors":["Del Gratta, R.","Monachini, M.","Quochi, V.","Sassolini, E.","Calzolari, N."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157425","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131571,"last_updated":"2009-06-16 00:00:00","id_people":157441,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"LocalBioLex: A database framework for biolinguistic research on integrated databases","year":2007,"authors_people":"Del Gratta R., Toral A., Quochi V., Monachini. M.","authors_cnr":["Quochi, Valeria","Del Gratta, Riccardo","Toral Ruiz, Antonio","Monachini, Monica"],"authors_cnr_id":["8945"],"authors_cnr_institute":[""],"authors":["Del Gratta, R.","Toral, A.","Quochi, V.","Monachini, M."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157441","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131533,"last_updated":"2015-02-26 11:11:14","id_people":157403,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Bio-Lexicon Model and Preliminary ISO Conformant Data Categories","year":2006,"authors_people":"Quochi V., Monachini M., Calzolari N., Del Gratta R., Sassolini E.","authors_cnr":["Sassolini, Eva","Quochi, Valeria","Del Gratta, Riccardo","Monachini, Monica","Zamorani, Nicoletta"],"authors_cnr_id":["8945","26123"],"authors_cnr_institute":["048","048","048","048","048"],"authors":["Quochi, V.","Monachini, M.","Calzolari, N.","Del Gratta, R.","Sassolini, 
E."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157403","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131356,"last_updated":"2023-07-09 23:44:32","id_people":136443,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Issues on the acquisition of Italian complex nominals from text corpora: a computational approach combining syntactic and semantic information","year":2005,"authors_people":"Quochi, Valeria","authors_cnr":["Quochi, Valeria"],"authors_cnr_id":[""],"authors_cnr_institute":[""],"authors":["Quochi, V."],"abstract":"The paper addressed the issue of Italian Complex Nominals from an (automatic) acquisition and representational perspective. Just like English noun compounds, ICNs blur the distinction between the syntactic and the lexical component because they are (at least) partially non-transparent but, nevertheless, show regularities both at the syntactic and at the semantic level. This contribution reports on an experiment conducted to identify the highest possible number of productive syntactic-semantic patterns of ICN formation, and to make explicit the particular semantic relation that exists between the head of the phrase and its modifier(s). I rely on a non-traditional generative theory of the lexicon, namely the Generative Lexicon, as a model for the representation\/ interpretation of ICNs which provides us with a structured representation of the internal semantics of lexical items. 
The experiment explored the representational power of the qualia structure with respect to ICNs.","keywords":["complex nominals","multiword expressions","lexicon","lexical representation","generative lexicon"],"pages":"153-174","url":"https:\/\/publications.cnr.it\/doc\/136443","volume":"","doi":"","editors_people":"Marcella Bertuccelli","editors":["Bertuccelli, M."],"published":"Studies in the Semantics of Lexical Combinatory Patterns","publisher":"Edizioni Plus srl (Pisa, ITA)","issn":"","isbn":"9788884922366","conference_name":"","conference_place":"","conference_date":""},{"id":131078,"last_updated":"2016-01-11 17:46:42","id_people":84616,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Representing Italian Complex Nominals: A Pilot Study","year":2004,"authors_people":"Quochi V.","authors_cnr":["Quochi, Valeria"],"authors_cnr_id":[""],"authors_cnr_institute":["048"],"authors":["Quochi, V."],"abstract":"A corpus-based investigation of Italian Complex Nominals (CNs), of the form N+PP, which aims at clarifying their syntactic and semantic constitution, is presented. The main goal is to find out useful parameters for their representation in a computational lexicon. As a reference model we have taken an implementation of Pustejovsky's Generative Lexicon Theory (1995), the SIMPLE Italian Lexicon, and in particular the Extended Qualia Structure. Italian CN formation mainly exploits post-modification; of particular interest here are CNs of the kind N+PP since this syntactic pattern is highly productive in Italian and such CNs very often translate compound nouns of other languages. One of the major problems posed by CNs for interpretation is the retrieval or identification of the semantic relation linking their components, which is (at least partially) implicit on the surface. 
Studying a small sample, we observed some interesting facts that could be useful when setting up a larger experiment to identify semantic relations and\/or automatically learn the syntactic peculiarities of given semantic paradigms. Finally, a set of representational features exploiting the results from our corpus is proposed.","keywords":["Multiword expressions Complex Nominals","Italian language"],"pages":"1863-1866","url":"https:\/\/publications.cnr.it\/doc\/84616","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of the Fourth International Conference on Language Resources and Evaluation, LREC'04","publisher":"","issn":"","isbn":"2-9517408-1-6","conference_name":"LREC 2004: Fourth International Conference on Language Resources and Evaluation","conference_place":"Lisbona, Portogallo","conference_date":"26-28\/05\/2004"},{"id":131499,"last_updated":"2015-02-23 16:39:32","id_people":157368,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Final Resources Landscape","year":2004,"authors_people":"Baroni P., Calzolari N., Lenci A. 
, Quochi V., Ulivieri M.","authors_cnr":["Ulivieri, Marisa","Quochi, Valeria","Baroni, Paola","Zamorani, Nicoletta"],"authors_cnr_id":["26123"],"authors_cnr_institute":[""],"authors":["Baroni, P.","Calzolari, N.","Lenci, A.","Quochi, V.","Ulivieri, M."],"abstract":"ELSNET-4 Deliverable D6.4","keywords":["Language Resources","Landscapes"],"pages":"11","url":"https:\/\/publications.cnr.it\/doc\/157368","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131012,"last_updated":"2016-01-07 18:52:25","id_people":84547,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Towards Multiword and Multilingual Lexicons: Between Theory and Practice","year":2003,"authors_people":"Calzolari N., Lenci A., Quochi V.","authors_cnr":["Quochi, Valeria","Zamorani, Nicoletta"],"authors_cnr_id":["11893","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, N.","Lenci, A.","Quochi, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84547","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Linguistics and Phonetics 2002 Conference","conference_place":"Urayasu (Giappone)","conference_date":"2003"},{"id":131481,"last_updated":"2014-03-07 16:10:10","id_people":157349,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"\"Appendix F: Representing noun compounds and support verbs in MILE (PISA & XMELLT)\"","year":2003,"authors_people":"Quochi, Valeria and Jan Odjik","authors_cnr":["Quochi, Valeria"],"authors_cnr_id":[""],"authors_cnr_institute":["048"],"authors":["Quochi, V.","Odjik, 
J."],"abstract":"","keywords":[""],"pages":"","url":"http:\/\/www.ilc.cnr.it\/EAGLES96\/isle\/clwg_doc\/ISLE_D2.2-D3.2.zip","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""}]