[{"id":343148,"last_updated":"2022-10-21 15:19:30","id_people":472294,"institutes":["ILC","IGSG"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Making Italian Parliamentary Records Machine-Actionable: the Construction of the ParlaMint-IT corpus","year":2022,"authors_people":"Tommaso Agnoloni, Roberto Bartolini, Francesca Frontini, Simonetta Montemagni, Carlo Marchetti, Valeria Quochi, Manuela Ruisi, Giulia Venturi","authors_cnr":["Montemagni, Simonetta","Bartolini, Roberto","Agnoloni, Tommaso","Quochi, Valeria","Frontini, Francesca","Venturi, Giulia"],"authors_cnr_id":["5595","10441","11403","11893","15911","17692"],"authors_cnr_institute":[""],"authors":["Agnoloni, T.","Bartolini, R.","Frontini, F.","Montemagni, S.","Marchetti, C.","Quochi, V.","Ruisi, M.","Venturi, G."],"abstract":"This paper describes the process of acquisition, cleaning, interpretation, coding and linguistic annotation of a collection of parliamentary debates from the Senate of the Italian Republic covering the COVID-19 pandemic emergency period and a former period for reference and comparison according to the CLARIN ParlaMint prescriptions. The corpus contains 1199 sessions and 79,373 speeches for a total of about 31 million words, and was encoded according to the ParlaCLARIN TEI XML format. It includes extensive metadata about the speakers, sessions, political parties and parliamentary groups. As required by the ParlaMint initiative, the corpus was also linguistically annotated for sentences, tokens, POS tags, lemmas and dependency syntax according to the universal dependencies guidelines. Named entity annotation and classification is also included. All linguistic annotation was performed automatically using state-of-the-art NLP technology with no manual revision. The Italian dataset is freely available as part of the larger ParlaMint 2.1 corpus deposited and archived in CLARIN repository together with all other national corpora. 
It is also available for direct analysis and inspection via various CLARIN services and has already been used both for research and educational purposes.","keywords":["parliamentary debates","CLARIN ParlaMint","corpus creation","corpus annotation"],"pages":"117-124","url":"https:\/\/aclanthology.org\/2022.parlaclarin-1.17\/","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"","conference_name":"Workshop ParlaCLARIN III within the 13th Language Resources and Evaluation Conference","conference_place":"Marseille, France","conference_date":"20\/06\/2022"},{"id":132444,"last_updated":"2022-02-16 15:50:32","id_people":453502,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Relazione di fine progetto \"PIM-Piattaforma Integrata Monitoraggio\"","year":2020,"authors_people":"Roberto Bartolini, Valeria Quochi, Monica Monachini, Fabio Aff\u00e9","authors_cnr":["Monachini, Monica","Bartolini, Roberto","Quochi, Valeria"],"authors_cnr_id":["8945","10441","11893"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Quochi, V.","Monachini, M.","Aff\u00e9, F."],"abstract":"Il documento presenta l'attivit\u00e0 svolta dal CNR-ILC nel ruolo di subcontraente di COMDATA per la realizzazione di moduli di trattamento automatico del linguaggio e la consulenza per l'integrazione di metodi di clustering automatico di documenti nella Digital Library del progetto PIM.","keywords":["accesso intelligente al testo","digital library","natural language processing"],"pages":"156","url":"https:\/\/publications.cnr.it\/doc\/453502","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132344,"last_updated":"2019-12-13 
11:27:43","id_people":411599,"institutes":["ILC","ISTI"],"type":"journal_article","type_order":0,"type_people":"article","title":"Semantic Query Analysis from the Global Science Gateway","year":2019,"authors_people":"Goggi S.; Pardelli G.; Bartolini R.; Monachini M.; Biagioni S.; Carlesi C.","authors_cnr":["Biagioni, Stefania","Carlesi, Carlo","Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella"],"authors_cnr_id":["3483","8945","10172","10441","16333"],"authors_cnr_institute":["074","074","048","048","048","048"],"authors":["Goggi, S.","Pardelli, G.","Bartolini, R.","Monachini, M.","Biagioni, S.","Carlesi, C."],"abstract":"Nowadays web portals play an essential role in searching and retrieving information in the several fields of knowledge: they are ever more technologically advanced and designed for supporting the storage of a huge amount of information in natural language originating from the queries launched by users worldwide. Given this scenario, we focused on building a corpus constituted by the query logs registered by the GreyGuide: Repository and Portal to Good Practices and Resources in Grey Literature and received by the WorldWideScience.org (The Global Science Gateway) portal: the aim is to retrieve information related to social media which as of today represent a considerable source of data more and more widely used for research ends.","keywords":["Information Extraction","Query Log","WorldWideScience Alliance","Information gateways","Social Media"],"pages":"147-155","url":"https:\/\/publications.cnr.it\/doc\/411599","volume":"15","doi":"","editors_people":"","editors":[""],"published":"The Grey journal (Print)","publisher":"TextRelease (Amsterdam, Paesi Bassi)","issn":"1574-1796","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132327,"last_updated":"2020-06-01 
08:34:24","id_people":400343,"institutes":["ILC","ISTI"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Semantic query analysis from the global science gateway","year":2019,"authors_people":"Goggi S.; Pardelli G.; Bartolini R.; Monachini M.; Biagioni S.; Carlesi C.","authors_cnr":["Biagioni, Stefania","Carlesi, Carlo","Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella"],"authors_cnr_id":["2577","3483","8945","10172","10441","16333"],"authors_cnr_institute":["074","074","048","048","048","048"],"authors":["Goggi, S.","Pardelli, G.","Bartolini, R.","Monachini, M.","Biagioni, S.","Carlesi, C."],"abstract":"We focused on building a corpus constituted by the query logs registered by the GreyGuide: Repository and Portal to Good Practices and Resources in Grey Literature and received by the WorldWideScience.org (The Global Science Gateway) portal.","keywords":["Information Extraction","Terminology"],"pages":"105-113","url":"https:\/\/publications.cnr.it\/doc\/400343","volume":"20","doi":"","editors_people":"Dominic Farace, Jerry Frantzen","editors":["Farace, D.","Frantzen, J."],"published":"Research Data Fuels and Sustains Grey Literature","publisher":"","issn":"","isbn":"978-90-77484-33-3","conference_name":"GL20-Twentieth International Conference on Grey Literature: Research Data Fuels and Sustains Grey Literature","conference_place":"New Orleans, USA","conference_date":"3-4 December 2018"},{"id":131319,"last_updated":"2020-09-01 09:44:39","id_people":388612,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Providing Access to Grey Literature: The CLARIN Infrastructure","year":2018,"authors_people":"Goggi, Sara; Pardelli, Gabriella; Russo, Irene; Bartolini, Roberto; Monachini, Monica","authors_cnr":["Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella","Russo, 
Irene"],"authors_cnr_id":["8945","10172","10441","16333","17442"],"authors_cnr_institute":[""],"authors":["Goggi, S.","Pardelli, G.","Russo, I.","Bartolini, R.","Monachini, M."],"abstract":"\"In the electronic age, the World Wide Web has played a major role in making scientific information accessible to a wide audience more rapidly and efficiently. This democratic approach to information dissemination in science is changing the way science is perceived and implemented in our daily lives\" (Weintraub, 2000).","keywords":["CLARIN-IT","CLARIN-European Research Infrastructure for Language Resources and Technology","Grey Literature"],"pages":"87-93","url":"http:\/\/www.scopus.com\/record\/display.url?eid=2-s2.0-85048643343&origin=inward","volume":"14","doi":"","editors_people":"","editors":[""],"published":"The Grey journal (Print)","publisher":"TextRelease (Amsterdam, Paesi Bassi)","issn":"1574-1796","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132262,"last_updated":"2020-09-01 09:44:46","id_people":387159,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"The LREC Workshops Map","year":2018,"authors_people":"Roberto Bartolini, Sara Goggi, Monica Monachini, Gabriella Pardelli","authors_cnr":["Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella"],"authors_cnr_id":["8945","10172","10441","16333"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Goggi, S.","Monachini, M.","Pardelli, G."],"abstract":"The aim of this work is to present an overview of the research presented at the LREC workshops over the years 1998-2016 with the aim to shed light on the community represented by workshop participants in terms of country of origin, type of affiliation, gender. There has been also an effort towards the identification of the major topics dealt with as well as of the terminological variations noticed in this time span. 
Data has been retrieved from the portal of the European Language Resources Association (ELRA) which organizes the conference and the resulting corpus made up of workshops titles and of the related presentations has then been processed using a term extraction tool developed at ILC-CNR.","keywords":["corpus creation","terminology","LREC"],"pages":"557-562","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2018\/summaries\/639.html","volume":"","doi":"","editors_people":"Nicoletta Calzolari (Conference chair), Khalid Choukri, Christopher Cieri, Thierry Declerck, Sara Goggi, Koiti Hasida, Hitoshi Isahara, Bente Maegaard, Joseph Mariani, H\u00e9l\u00e8ne Mazo, Asuncion Moreno, Jan Odijk, Stelios Piperidis, Takenobu Tokunaga","editors":["Calzolari, N.","Choukri, K.","Cieri, C.","Declerck, T.","Goggi, S.","Hasida, K.","Isahara, H.","Maegaard, B.","Mariani, J.","Mazo, H.","Moreno, A.","Odijk, J.","Piperidis, S.","Tokunaga, T."],"published":"Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018)","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"979-10-95546-00-9","conference_name":"Eleventh International Conference on Language Resources and Evaluation (LREC 2018)","conference_place":"Miyazaki, Japan","conference_date":"7-12\/05\/2018"},{"id":132258,"last_updated":"2019-12-04 12:27:38","id_people":385571,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Providing Access to Grey Literature: The CLARIN Infrastructure","year":2018,"authors_people":"Sara Goggi, Gabriella Pardelli, Irene Russo, Roberto Bartolini, Monica Monachini","authors_cnr":["Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella","Russo, Irene"],"authors_cnr_id":["8945","10172","10441","16333","17442"],"authors_cnr_institute":[""],"authors":["Goggi, S.","Pardelli, G.","Russo, I.","Bartolini, R.","Monachini, M."],"abstract":"This work will 
provide a map of the documentation archived in the CLARIN infrastructure, whose purpose is to share language resources produced and managed in the various European countries but finally merged into the CLARIN data centers for allowing access, interoperability, reuse and preservation of scientific documentation as well as Grey Literature.","keywords":["CLARIN Infrastructure","Language Resources","Grey Literature"],"pages":"93-99","url":"http:\/\/greyguide.isti.cnr.it\/wp-content\/uploads\/2018\/03\/GL19_Conference_Proceedings.pdf","volume":"19","doi":"","editors_people":"Farace Dominic, Frantzen Jerry","editors":["Farace, D.","Frantzen, J."],"published":"Nineteenth International Conference on Grey Literature \"Public Awareness and Access to Grey Literature\"","publisher":"TextRelease (Amsterdam, NLD)","issn":"","isbn":"978-90-77484-31-9","conference_name":"Nineteenth International Conference on Grey Literature, GL19","conference_place":"Roma","conference_date":"October 23-24, 2017"},{"id":132310,"last_updated":"2019-01-04 18:36:13","id_people":395584,"institutes":["ILC","ISTI"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Semantic query analysis from the global science gateway","year":2018,"authors_people":"Goggi S.; Pardelli G.; Bartolini R.; Monachini M.; Biagioni S.; Carlesi C.","authors_cnr":["Biagioni, Stefania","Carlesi, Carlo","Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella"],"authors_cnr_id":["2577","3483","8945","10172","10441","16333"],"authors_cnr_institute":["074","074","048","048","048","048"],"authors":["Goggi, S.","Pardelli, G.","Bartolini, R.","Monachini, M.","Biagioni, S.","Carlesi, C."],"abstract":"We focused on building a corpus constituted by the query logs registered by the GreyGuide: Repository and Portal to Good Practices and Resources in Grey Literature and received by the WorldWideScience.org (The Global Science Gateway) portal: the aim is to retrieve information related to 
social media which as of today represent a considerable source of data more and more widely used for research ends. This project includes eight months of query logs registered between July 2017 and February 2018 for a total of 445,827 queries. The analysis mainly concentrates on the semantics of the queries received from the portal clients: it is a process of information retrieval from a rich digital catalogue whose language is dynamic, is evolving and follows - as well as reflects - the cultural changes of our modern society.","keywords":["Global Science Gateway","Semantic Query Analysis","Terminology"],"pages":"93-95","url":"http:\/\/greyguide.isti.cnr.it\/wp-content\/uploads\/2018\/12\/GL20_ProgramBook.pdf","volume":"20","doi":"","editors_people":"Farace Dominic, Frantzen Jerry","editors":["Farace, D.","Frantzen, J."],"published":"Research Data Fuels and Sustains Grey Literature","publisher":"","issn":"","isbn":"978-90-77484-34-0","conference_name":"Twentieth International Conference on Grey Literature \"Research Data Fuels and Sustains Grey Literature\"","conference_place":"New Orleans, USA (Loyola University)","conference_date":"December 3-4, 2018"},{"id":132187,"last_updated":"2018-03-28 13:37:13","id_people":369103,"institutes":["ILC","ISTI"],"type":"journal_article","type_order":0,"type_people":"article","title":"A terminological \"journey\" in the Grey Literature domain","year":2017,"authors_people":"Bartolini R.; Pardelli G.; Goggi S.; Giannini S.; Biagioni S.","authors_cnr":["Biagioni, Stefania","Giannini, Silvia","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella"],"authors_cnr_id":["2577","7455","10172","10441","16333"],"authors_cnr_institute":["074","074","048","048","048"],"authors":["Bartolini, R.","Pardelli, G.","Goggi, S.","Giannini, S.","Biagioni, S."],"abstract":"\"It is by means of terms that the expert usually transfer their knowledge and again through terms scientific communication reaches the highest effectiveness. 
Therefore we can assert that terminology - in the sense of a set of representative and domain-specific units - is necessary for representing and connecting specialized fields as well as any attempt to represent and\/or transfer scientific knowledge requires, more or less extensively, the use of terminology.\" (Cabr\u00e9, 2000). \"When we read the articles or papers of a particular domain, we can recognize some lexical items in the texts as technical terms. In a domain where new knowledge is generated, new terms are constantly created to fulfill the needs of the domain, while others become obsolete. In addition, existing terms may undergo changes of meaning...\" (Kageura K., 1998\/1999). Specialized lexicons are made up of the terms which are specific to each field of knowledge, \u00aba subset which is distinct but not separated from the common language\u00bb (Cassese, 1992): it is usually difficult to extract the relevant domain-specific terminology, meaning to discern terms which belong to a specialized glossary from those belonging to the common dictionary. The interest in the study of terminology and the \"truth\" contained in the above definitions has led us to make a \"journey\" in the Grey Literature (GL) domain in order to offer an overall vision on the terms used and the links between them. Within this scenario, the work analyzes a corpus constituted of the entire amount of full research papers published in the GL conference series over a time-span of more than one decade (2003-2014) with the aim of creating a terminological map of relevant words in the various GL research topics. \"... corpora used to extract terminological units can be further investigated to find semantic and conceptual information on terms or to represent conceptual relationships between terms.\" (Bourigault D. et al., 2001). Another interesting inquiry is the terminology used in the GL conferences for describing the types of documents which can be detected (Pej\u0161ov\u00e1 P. 
et al., 2012).","keywords":["Grey Literature","Information Extraction IE","Terminology"],"pages":"41-53","url":"http:\/\/www.greynet.org\/thegreyjournal\/currentissue.html","volume":"13","doi":"","editors_people":"","editors":[""],"published":"The Grey journal (Print)","publisher":"TextRelease (Amsterdam, Paesi Bassi)","issn":"1574-1796","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132183,"last_updated":"2021-04-27 16:34:59","id_people":368363,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Semantic Search Engine for Data Management and Sustainable Development: Marine Planning Service Platform","year":2017,"authors_people":"Giuseppe M. R. Manzella, Roberto Bartolini, Franco Bustaffa, Paolo D'Angelo, Maurizio De Mattei, Francesca Frontini, Maurizio Maltese, Daniele Medone, Monica Monachini, Antonio Novellino, Andrea Spada","authors_cnr":["Monachini, Monica","Bartolini, Roberto","Frontini, Francesca"],"authors_cnr_id":["8945","10441","15911"],"authors_cnr_institute":[""],"authors":["Manzella, G. M. R.","Bartolini, R.","Bustaffa, F.","D'Angelo, P.","De Mattei, M.","Frontini, F.","Maltese, M.","Medone, D.","Monachini, M.","Novellino, A.","Spada, A."],"abstract":"This chapter presents a computer platform supporting a Marine Information and Knowledge System based on a repository that gathers, classifies and structures marine scientific literature and data, guaranteeing their accessibility by means of standard protocols. This requires the access to quality controlled data and to information that is provided in grey literature and\/or in relevant scientific literature. There exist efforts to develop search engines to find author's contributions to scientific literature or publications. This implies the use of persistent identifiers. However very few efforts are dedicated to link publications to data that was used, or cited in them or that can be of importance for the published studies. 
Full-text technologies are often unsuccessful since they assume the presence of specific keywords in the text; to fix this problem, it is suggested to use different semantic technologies for retrieving the text and data and thus getting much more complying results.","keywords":["Marine Information and Knowledge System"],"pages":"127-154","url":"http:\/\/www.igi-global.com\/chapter\/semantic-search-engine-for-data-management-and-sustainable-development\/166839#","volume":"Volume 7","doi":"10.4018\/978-1-5225-0700-0.ch006","editors_people":"Paolo Diviacco, Adam Leadbetter & Helen Glaves","editors":["Diviacco, P.","Leadbetter, A.","Glaves, H."],"published":"Oceanographic and Marine Cross-Domain Data Management for Sustainable Development","publisher":"IGI Global (Hershey, USA)","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132184,"last_updated":"2017-10-30 09:14:16","id_people":368487,"institutes":["ILC","ISTI"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"A terminological \"journey\" in the Grey Literature domain","year":2017,"authors_people":"Bartolini R.; Pardelli G.; Goggi S.; Giannini S.; Biagioni S.","authors_cnr":["Biagioni, Stefania","Giannini, Silvia","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella"],"authors_cnr_id":["7455","10172","10441","16333"],"authors_cnr_institute":["074","074","048","048","048"],"authors":["Bartolini, R.","Pardelli, G.","Goggi, S.","Giannini, S.","Biagioni, S."],"abstract":"The work analyzes a corpus constituted of the entire amount of full research papers published in the GL conference series over a time-span of more than one decade (2003-2014) with the aim of creating a terminological map of relevant words in the various GL research topics. \"... corpora used to extract terminological units can be further investigated to find semantic and conceptual information on terms or to represent conceptual relationships between terms.\" (Bourigault D. 
et al., 2001). Another interesting inquiry is the terminology used in the GL conferences for describing the types of documents which can be detected (Pej\u0161ov\u00e1 P. et al., 2012).","keywords":["Grey Literature","Information Extraction IE","Terminology"],"pages":"117-130","url":"https:\/\/publications.cnr.it\/doc\/368487","volume":"18","doi":"","editors_people":"Dominic Farace, Jerry Frantzen","editors":["Farace, D.","Frantzen, J."],"published":"Proceedings of the Eighteenth International Conference on Grey Literature (GL18): Leveraging Diversity in Grey Literature","publisher":"TextRelease (Amsterdam, NLD)","issn":"","isbn":"978-90-77484-30-2","conference_name":"Eighteenth International Conference on Grey Literature (GL18): Leveraging Diversity in Grey Literature","conference_place":"New York, US","conference_date":"November 28-29, 2016"},{"id":132177,"last_updated":"2019-12-04 12:42:27","id_people":367782,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"A Geographical Visualization of GL Communities: A Snapshot","year":2017,"authors_people":"Pardelli G., Goggi S., Bartolini R., Russo I., Monachini M.","authors_cnr":["Russo, Irene","Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella"],"authors_cnr_id":["8945","10172","10441","16333"],"authors_cnr_institute":[""],"authors":["Pardelli, G.","Goggi, S.","Bartolini, R.","Russo, I.","Monachini, M."],"abstract":"This quotation stresses the important role of the several international organizations in producing and disseminating knowledge in the field of Grey Literature (GL): the paper aims to provide a first snapshot of the geographical distribution of GL organizations and their participation to the annual International Conference on Grey Literature over the time (in the period from 2003 to 2015. See List of Conferences on Table 2). 
Nowadays a visual representation of data is often associated with the traditional statistical graphs, in particular for representing complex phenomena by means of maps and diagrams, which allow a deeper and more focused analysis of the data. In our case the geographical representation of stakeholders in government, academics, business and industry aims at visualizing the GL community across the globe: it concerns 674 organizations which over the years have contributed to the development of a common vision on the most pressing issues of the field by using new paradigms such as Open Access and the social networks.","keywords":["Geographical Visualization","Grey Literature Communities"],"pages":"109-113","url":"http:\/\/greyguide.isti.cnr.it\/wp-content\/uploads\/2017\/04\/GL18_Conference_Proceedings.pdf","volume":"18","doi":"","editors_people":"D. Farace and J. Frantzen","editors":["Farace, D.","Frantzen, J."],"published":"GL18 Conference Proceedings Eighteenth International Conference on Grey Literature: Leveraging Diversity in Grey Literature","publisher":"TextRelease (Amsterdam, NLD)","issn":"","isbn":"978-90-77484-30-2","conference_name":"Eighteenth International Conference on Grey Literature: Leveraging Diversity in Grey Literature","conference_place":"Washington","conference_date":"November 28-29, 2016"},{"id":132198,"last_updated":"2018-01-18 16:18:59","id_people":377073,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Data Visualization of a Grey Literature Community: A Cooperative Project","year":2017,"authors_people":"Roberto Bartolini, Sara Goggi, Gabriella Pardelli, Irene Russo, Dominic Farace, Jerry Frantzen","authors_cnr":["Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella","Russo, Irene"],"authors_cnr_id":["10172","10441","16333","17442"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Goggi, S.","Pardelli, G.","Russo, I.","Farace, D.","Frantzen, J."],"abstract":"The expected outcome of 
this project will not only produce a revised and updated publication of International Directory of Organizations in Grey Literature, IDGL, but will also provide a visual overview of GreyNet as an international organization serving diverse communities with shared interests in grey literature. It would be a demonstration of GreyNet's commitment to research, publication, open access, education, and public awareness in this field of library and information science.","keywords":["International Directory of Organizations in Grey Literature","Data Visualization"],"pages":"63-63","url":"https:\/\/publications.cnr.it\/doc\/377073","volume":"19","doi":"","editors_people":"Farace Dominic, Frantzen Jerry","editors":["Farace, D.","Frantzen, J."],"published":"Nineteenth International Conference on Grey Literature Public Awareness and Access to Grey Literature. Program Book","publisher":"","issn":"","isbn":"978-90-77484-32-6","conference_name":"Nineteenth International Conference on Grey Literature, GL19","conference_place":"Rome, National Research Council, CNR","conference_date":"October 23-24, 2017"},{"id":132197,"last_updated":"2018-01-18 16:19:01","id_people":377070,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Providing Access to Grey Literature: The CLARIN Infrastructure","year":2017,"authors_people":"Sara Goggi, Gabriella Pardelli, Irene Russo, Roberto Bartolini, Monica Monachini","authors_cnr":["Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella","Russo, Irene"],"authors_cnr_id":["8945","10172","10441","16333","17442"],"authors_cnr_institute":[""],"authors":["Goggi, S.","Pardelli, G.","Russo, I.","Bartolini, R.","Monachini, M."],"abstract":"This work will provide a map of the documentation archived in the CLARIN infrastructure, whose purpose is to share language resources produced and managed in the various European countries but finally merged into the CLARIN data centers for allowing 
access, interoperability, reuse and preservation of scientific documentation as well as Grey Literature.","keywords":["CLARIN ERIC","Terminological Resources","Grey Literature"],"pages":"60-62","url":"https:\/\/publications.cnr.it\/doc\/377070","volume":"19","doi":"","editors_people":"Farace Dominic, Frantzen Jerry","editors":["Farace, D.","Frantzen, J."],"published":"Nineteenth International Conference on Grey Literature Public Awareness and Access to Grey Literature. Program Book","publisher":"","issn":"","isbn":"978-90-77484-32-6","conference_name":"Nineteenth International Conference on Grey Literature, GL19","conference_place":"Rome, National Research Council, CNR","conference_date":"October 23-24, 2017"},{"id":132133,"last_updated":"2017-06-22 08:54:11","id_people":359144,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"A semantic engine for grey literature retrieval in the oceanography domain","year":2016,"authors_people":"Sara Goggi, Gabriella Pardelli, Roberto Bartolini, Francesca Frontini, Monica Monachini, Giuseppe Manzella, Maurizio De Mattei and Franco Bustaffa","authors_cnr":["Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Frontini, Francesca","Pardelli, Gabriella"],"authors_cnr_id":["8945","10172","10441","15911","16333"],"authors_cnr_institute":[""],"authors":["Goggi, S.","Pardelli, G.","Bartolini, R.","Frontini, F.","Monachini, M.","Manzella, G.","De Mattei, M.","Bustaffa, F."],"abstract":"Here we present the final results of the MAPS (Marine Planning and Service Platform) project, an environment designed for gathering, classifying, managing and accessing marine scientific literature and data, making it available for search to Operative Oceanography researchers of various institutions by means of standard protocols. 
The system takes as input non-textual data (measurements) and text - both published papers and documentation - and it provides an advanced search facility thanks to the rich set of metadata and, above all, to the possibility of a refined and domain targeted key-word indexing of texts using Natural Language Processing (NLP) techniques. The paper describes the system in its details providing also evidence of evaluation.","keywords":["Information Extraction","Search Engine","Operative Oceanography"],"pages":"155-161","url":"http:\/\/www.greynet.org\/thegreyjournal\/currentissue.html","volume":"12","doi":"","editors_people":"","editors":[""],"published":"The Grey journal (Print)","publisher":"TextRelease (Amsterdam, Paesi Bassi)","issn":"1574-1796","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132113,"last_updated":"2017-03-17 09:44:40","id_people":355425,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"LREC as a Graph: People and Resources in a Network","year":2016,"authors_people":"Del Gratta R., Frontini F., Monachini M., Pardelli G., Russo I., Bartolini R., Khan F., Soria C., Calzolari N.","authors_cnr":["Khan, Anas Fahad","Monachini, Monica","Soria, Claudia","Bartolini, Roberto","Del Gratta, Riccardo","Frontini, Francesca","Pardelli, Gabriella","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10441","11933","15911","16333","26123"],"authors_cnr_institute":["048","048","048","048","048","048","048","048"],"authors":["Del Gratta, R.","Frontini, F.","Monachini, M.","Pardelli, G.","Russo, I.","Bartolini, R.","Khan, F.","Soria, C.","Calzolari, N."],"abstract":"This proposal describes a new way to visualise resources in the LREMap, a community-built repository of language resource descriptions and uses. The LREMap is represented as a force-directed graph, where resources, papers and authors are nodes. 
The analysis of the visual representation of the underlying graph is used to study how the community gathers around LRs and how LRs are used in research.","keywords":["Language Resources","Resources Documentation","Data Visualisation"],"pages":"2529-2532","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2016\/index.html","volume":"","doi":"","editors_people":"Nicoletta Calzolari (Conference Chair), Khalid Choukri, Thierry Declerck, Sara Goggi, Marko Grobelnik, Bente Maegaard, Joseph Mariani, H\u00e9l\u00e8ne Mazo, Asunci\u00f3n Moreno, Jan Odijk, Stelios Piperidis","editors":["Calzolari, N.","Choukri, K.","Declerck, T.","Goggi, S.","Grobelnik, M.","Maegaard, B.","Mariani, J.","Mazo, H.","Moreno, A.","Odijk, J.","Piperidis, S."],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"978-2-9517408-9-1","conference_name":"Tenth International Conference on Language Resources and Evaluation (LREC 2016)","conference_place":"Portoroz, Slovenia","conference_date":"23-28 May 2016"},{"id":132105,"last_updated":"2017-06-22 08:53:52","id_people":350374,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"A semantic engine for grey literature retrieval in the oceanography domain","year":2016,"authors_people":"Sara Goggi, Gabriella Pardelli, Roberto Bartolini, Francesca Frontini, Monica Monachini, Giuseppe Manzella, Maurizio De Mattei and Franco Bustaffa","authors_cnr":["Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Frontini, Francesca","Pardelli, Gabriella"],"authors_cnr_id":["8945","10172","10441","15911","16333"],"authors_cnr_institute":["048","048","048","048","048"],"authors":["Goggi, S.","Pardelli, G.","Bartolini, R.","Frontini, F.","Monachini, M.","Manzella, G.","De Mattei, M.","Bustaffa, F."],"abstract":"Here we present the final results of the MAPS (Marine Planning and Service Platform) project, an environment designed for gathering, classifying, managing and 
accessing marine scientific literature and data, making it available for search to Operative Oceanography researchers of various institutions by means of standard protocols. The system takes as input non-textual data (measurements) and text - both published papers and documentation - and it provides an advanced search facility thanks to the rich set of metadata and, above all, to the possibility of a refined and domain targeted key-word indexing of texts using Natural Language Processing (NLP) techniques. The paper describes the system in its details providing also evidence of evaluation.","keywords":["Information Extraction","Search Engine","Operative Oceanography"],"pages":"104-111","url":"https:\/\/publications.cnr.it\/doc\/350374","volume":"17","doi":"","editors_people":"Dominic Farace, Jerry Frantzen","editors":["Farace, D.","Frantzen, J."],"published":"","publisher":"","issn":"","isbn":"978-90-77484-27-2","conference_name":"Seventeenth International Conference on Grey Literature. A New Wave of Textual and Non-Textual Grey Literature","conference_place":"Amsterdam","conference_date":"December 1st-2nd 2015"},{"id":132143,"last_updated":"2022-01-26 14:13:22","id_people":362848,"institutes":["ILC","ISTI"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"A terminological \"journey\" in the Grey Literature domain","year":2016,"authors_people":"Bartolini R.; Pardelli G.; Goggi S.; Giannini S.; Biagioni S.","authors_cnr":["Biagioni, Stefania","Giannini, Silvia","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella"],"authors_cnr_id":["2577","7455","10172","10441","16333"],"authors_cnr_institute":["074","074","048","048","048"],"authors":["Bartolini, R.","Pardelli, G.","Goggi, S.","Giannini, S.","Biagioni, S."],"abstract":"\"When we read the articles or papers of a particular domain, we can recognize some lexical items in the texts as technical terms. 
In a domain where new knowledge is generated, new terms are constantly created to fulfil the needs of the domain, while others become obsolete. In addition, existing terms may undergo changes of meaning...\" (Kageura K.,1998\/1999). According to Kageura, our aim with this work is to make a \"journey\" in the Grey Literature (GL) domain in order to offer an overall vision on the terms used and the links between them. Moreover, by performing a terminological comparison over a given period of time it could be possible to trace the presence of obsolete words as well as of neologisms in the most recent research fields. Within this scenario, the work analyzes a corpus constituted of the entire amount of full research papers published in the GL conference series over a time span of more than one decade (2003-2014) with the aim of creating a terminological map of relevant words. \"... corpora used to extract terminological units can be further investigated to find semantic and conceptual information on terms or to represent conceptual relationships between terms.\" (Bourigault D. et al., 2001). Another interesting inquiry is the terminology used in the GL conferences for describing the types of documents (Pej\u0161ov\u00e1 P. et al., 2012). The work is split up in four sections: creation of the corpus by acquiring the digital papers of GL conference proceedings (GL5 - GL16)1; data cleaning; data processing; terminological analysis and comparison. The corpus - made up of 231 research papers (for a total amount of 785.042 tokens) - was processed using a Natural Language Processing (NLP) tool for term extraction developed at the Institute of Computational Linguistics \"Antonio Zampolli\" of CNR (Goggi et al. 2015; 2016). 
This tool is what is called a \"pipeline\" (that is, a sequence of different tools) which extracts lexical knowledge from texts: in short, this is a rule system tool for knowledge extraction and document indexing that combines NLP technologies for term extraction and techniques to measure the associative strength of multi-words. This tool extracts a list of single (monograms) and multi-word terms (bigrams and trigrams) ordered by frequency with respect to the context. The pipeline - used as semantic engine within the MAPS project - has been customized for the extraction of terms from our corpus. This survey on the results of the information extraction process performed by the described NLP tool has been a sort of linguistic path in the past and present of terminology used in GL proceedings. By means of samplings, it has been possible to obtain the terminological flow in GL domain and to determine if and how the lexicon was evolving over these twelve years and investigate on its dynamic nature.","keywords":["Grey Literature","Digital Repositories","Open Access"],"pages":"79-84","url":"https:\/\/publications.cnr.it\/doc\/362848","volume":"18","doi":"","editors_people":"Dominic Farace, Jerry Frantzen","editors":["Farace, D.","Frantzen, J."],"published":"Leveraging Diversity in Grey Literature","publisher":"","issn":"","isbn":"978-90-77484-29-6","conference_name":"GL18-Eighteenth International Conference on Grey Literature: Leveraging Diversity in Grey Literature","conference_place":"New York, US","conference_date":"28-29 November 2016"},{"id":132119,"last_updated":"2016-08-08 14:01:44","id_people":355476,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Marine Planning and Service Platform: Specific Ontology Based semantic Search Engine Serving Data Management and Sustainable Development","year":2016,"authors_people":"Manzella Giuseppe M.R. 
, Bartolini Roberto, Bustaffa Franco, D'Angelo Paolo, De Mattei Maurizio, Frontini Francesca , Maltese Maurizio, Medone Daniele, Monachini Monica, Novellino Antonio, Spada Andrea","authors_cnr":["Monachini, Monica","Bartolini, Roberto","Frontini, Francesca"],"authors_cnr_id":["8945","10441","15911"],"authors_cnr_institute":["048","048","048"],"authors":["Manzella, G. M. R.","Bartolini, R.","Bustaffa, F.","D'Angelo, P.","De Mattei, M.","Frontini, F.","Maltese, M.","Medone, D.","Monachini, M.","Novellino, A.","Spada, A."],"abstract":"The MAPS (Marine Planning and Service Platform) project is aiming at building a computer platform supporting a Marine Information and Knowledge System. One of the main objective of the project is to develop a repository that should gather, classify and structure marine scientific literature and data thus guaranteeing their accessibility to researchers and institutions by means of standard protocols. In oceanography the cost related to data collection is very high and the new paradigm is based on the concept to collect once and re-use many times (for re-analysis, marine environment assessment, studies on trends, etc). This concept requires the access to quality controlled data and to information that is provided in reports (grey literature) and\/or in relevant scientific literature. 
Hence, creation of new technology is needed by integrating several disciplines such as data management, information systems, knowledge management...","keywords":["Marine Information","Knowledge System"],"pages":"2","url":"http:\/\/meetingorganizer.copernicus.org\/EGU2016\/orals\/20144","volume":"18","doi":"","editors_people":"","editors":[""],"published":"Geophysical research abstracts (Online)","publisher":"Copernicus GmbH (Katlenburg-Lindau, Germania)","issn":"1607-7962","isbn":"","conference_name":"European Geosciences Union General Assembly (EGU 2016)","conference_place":"Vienna, Austria","conference_date":"17-22 aprile 2016"},{"id":132139,"last_updated":"2017-06-22 08:53:20","id_people":362073,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"A Geographical Visualization of GL Community: a Snapshot","year":2016,"authors_people":"Gabriella Pardelli, Sara Goggi, Monica Monachini, Roberto Bartolini, Irene Russo","authors_cnr":["Russo, Irene","Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella"],"authors_cnr_id":["8945","10172","10441","16333"],"authors_cnr_institute":[""],"authors":["Pardelli, G.","Goggi, S.","Monachini, M.","Bartolini, R.","Russo, I."],"abstract":"\"Today, in the spirit of science, grey literature communities are called to demonstrate their know-how and merit to wider audiences\" [Farace Dominic J., 2011]. This quotation stresses the important role of the several international organizations in producing and disseminating knowledge in the field of Grey Literature (GL): the paper aims to provide a first snapshot of the geographical distribution of GL organizations and their participation to the annual International Conference on Grey Literature over the time (in the period from 2003 to 2015). 
Nowadays a visual representation of data is often associated with the traditional statistical graphs, in particular for representing complex phenomena by means of maps and diagrams, which allow a deeper and more focused analysis of the data. In our case the geographical representation of stakeholders in government, academics, business and industry aims at visualizing the GL community across the globe: it concerns 675 organizations which over the years have contributed to the development of a common vision on the most pressing issues of the field by using new paradigms such as Open Access and the social networks.","keywords":["Geographical Visualization","Grey Literature"],"pages":"67-67","url":"https:\/\/publications.cnr.it\/doc\/362073","volume":"18","doi":"","editors_people":"D. Farace, J. Frantzen","editors":["Farace, D.","Frantzen, J."],"published":"GL18 Program Book","publisher":"","issn":"","isbn":"978-90-77484-29-6","conference_name":"Eighteenth International Conference on Grey Literature: Leveraging Diversity in Grey Literature","conference_place":"New York","conference_date":"November 28-29, 2016"},{"id":132081,"last_updated":"2015-12-10 13:34:18","id_people":334894,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Marine Planning and Service Platform (MAPS) An Advanced Research Engine for Grey Literature in Marine Science","year":2015,"authors_people":"Sara Goggi, Monica Monachini, Francesca Frontini, Roberto Bartolini, Gabriella Pardelli, Maurizio De Mattei, Franco Bustaffa, and Giuseppe Manzella","authors_cnr":["Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Frontini, Francesca","Pardelli, Gabriella"],"authors_cnr_id":["8945","10172","10441","15911","16333"],"authors_cnr_institute":["048","048","048","048","048"],"authors":["Goggi, S.","Monachini, M.","Frontini, F.","Bartolini, R.","Pardelli, G.","De Mattei, M.","Bustaffa, F.","Manzella, G."],"abstract":"The MAPS (Marine Planning and Service Platform) 
project is a development of the Marine project (Ricerca Industriale e Sviluppo Sperimentale Regione Liguria 2007-2013) aiming at building a computer platform for supporting a Marine Information and Knowledge System, as part of the data management activities. One of the main objective of the project is to develop a repository that should gather, classify and structure marine scientific literature and data thus guaranteeing their accessibility to researchers and institutions by means of standard protocols. We will present the scenario of the Operative Oceanography together with the technologies used to develop an advanced search engine which aims at providing rapid and efficient access to a Digital Library of oceanographic data. The case-study is also highlighting how the retrieval of grey literature from this specific marine community could be reproduced for similar communities as well, thus revealing the great impact that the processing, re-use as well as application of grey data have on societal needs\/problems and their answers.","keywords":["Marine Science Search Engine Source Data Oceanography"],"pages":"171-178","url":"https:\/\/publications.cnr.it\/doc\/334894","volume":"11","doi":"","editors_people":"","editors":[""],"published":"The Grey journal (Print)","publisher":"TextRelease (Amsterdam, Paesi Bassi)","issn":"1574-1796","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132093,"last_updated":"2021-04-08 08:30:49","id_people":342213,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Visualising Italian Language Resources: a Snapshot","year":2015,"authors_people":"Riccardo Del Gratta, Francesca Frontini, Monica Monachini, Gabriella Pardelli, Irene Russo, Roberto Bartolini, Sara Goggi, Fahad Khan, Valeria Quochi, Claudia Soria, Nicoletta Calzolari","authors_cnr":["Del Gratta, Riccardo","Russo, Irene","Khan, Anas Fahad","Monachini, Monica","Soria, Claudia","Goggi, 
Sara","Bartolini, Roberto","Quochi, Valeria","Frontini, Francesca","Pardelli, Gabriella","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10172","10441","11893","15911","16333","26123"],"authors_cnr_institute":[""],"authors":["Del Gratta, R.","Frontini, F.","Monachini, M.","Pardelli, G.","Russo, I.","Bartolini, R.","Goggi, S.","Khan, F.","Quochi, V.","Soria, C.","Calzolari, N."],"abstract":"This paper aims to provide a first snapshot of Italian Language Resources (LRs) and their uses by the community, as documented by the papers presented at two different conferences, LREC2014 and CLiC-it 2014. The data of the former were drawn from the LOD version of the LRE Map, while those of the latter come from manually analyzing the proceedings. The results are presented in the form of visual graphs and confirm the initial hypothesis that Italian LRs require concrete actions to enhance their visibility.","keywords":["Italian Language Resources"],"pages":"100-104","url":"https:\/\/books.openedition.org\/aaccademia\/1277?lang=it","volume":"","doi":"","editors_people":"Cristina Bosco, Sara Tonelli, Fabio Massimo Zanzotto","editors":["Bosco, C.","Tonelli, S.","Zanzotto, F. 
M."],"published":"Proceedings of the Second Italian Conference on Computational Linguistics CLiC-it 2015","publisher":"","issn":"","isbn":"978-88-99200-62-6","conference_name":"Second Italian Conference on Computational Linguistics CLiC-it 2015","conference_place":"Trento","conference_date":"3-4 December 2015"},{"id":132049,"last_updated":"2015-04-14 12:31:17","id_people":329370,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Marine Planning and Service Platform (MAPS): An Advanced Research Engine for Grey Literature in Marine Science","year":2015,"authors_people":"Sara Goggi, Monica Monachini, Francesca Frontini, Roberto Bartolini, Gabriella Pardelli, Maurizio De Mattei+, Franco Bustaffa+, Giuseppe Manzella\u00b0","authors_cnr":["Frontini, Francesca","Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella"],"authors_cnr_id":["8945","10172","10441","16333"],"authors_cnr_institute":["048","048","048","048","048"],"authors":["Goggi, S.","Monachini, M.","Frontini, F.","Bartolini, R.","Pardelli, G.","De Mattei, M.","Bustaffa, F.","Manzella, G."],"abstract":"The MAPS {Marine Planning and Service Platform} project is a development of the Marine project {Ricerca Industriale e Sviluppo Sperimentale Regione Liguria 2007-2013} aiming at building a computer platform for supporting a Marine Information and Knowledge System, as part of the data management activities. One of the main objective of the project is to develop a repository that should gather, classify and structure marine scientific literature and data thus guaranteeing their accessibility to researchers and institutions by means of standard protocols. We will present the scenario of the Operative Oceanography together with the technologies used to develop an advanced search engine which aims at providing rapid and efficient access to a Digital Library of oceanographic data. 
The case-study is also highlighting how the retrieval of grey literature from this specific marine community could be reproduced for similar communities as well, thus revealing the great impact that the processing, re-use as well as application of grey data have on societal needs\/problems and their answers.","keywords":["Marine Science Search Engine Source Data Oceanography"],"pages":"108-114","url":"http:\/\/www.textrelease.com\/gl16program.html","volume":"16","doi":"","editors_people":"D. Farace and J. Frantzen","editors":["Farace, D.","Frantzen, J."],"published":"Grey Literature Lobby: Engines and Requesters for Change","publisher":"TextRelease (Amsterdam, NLD)","issn":"","isbn":"978-90-77484-23-4","conference_name":"Sixteenth International Conference on Grey Literature Grey Literature Lobby: Engines and Requesters for Change","conference_place":"Library of Congress Washington D. C., USA","conference_date":"December 8-9 2014"},{"id":132094,"last_updated":"2015-12-14 15:36:38","id_people":342221,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"A semantic engine for grey literature retrieval in the oceanography domain","year":2015,"authors_people":"Sara Goggi, Gabriella Pardelli, Roberto Bartolini, Francesca Frontini, Monica Monachini, Giuseppe Manzella, Maurizio De Mattei, Franco Bustaffa","authors_cnr":["Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Frontini, Francesca","Pardelli, Gabriella"],"authors_cnr_id":["8945","10172","10441","15911","16333"],"authors_cnr_institute":["048","048","048","048","048"],"authors":["Goggi, S.","Pardelli, G.","Bartolini, R.","Frontini, F.","Monachini, M.","Manzella, G.","De Mattei, M.","Bustaffa, F."],"abstract":"Here we present the final results of MAPS (Marine Planning and Service Platform), an environment designed for gathering, classifying, managing and accessing marine scientific literature and data, making it available for search to Operative Oceanography 
researchers of various institutions by means of standard protocols. In previous publications the general architecture of the system as well as the set of metadata (Common Data Index) used to describe the documents were presented [3]; it was shown how individual oceanographic data-sets could be indexed within the MAPS library by types of measure, measurement tools, geographic areas, and also linked to specific textual documentation. Documentation is described using the current international standards: Title, Authors, Publisher, Language, Date of publication, Body\/Institution, Abstract, etc.; serial publications are described in terms of ISSN, while books are assigned ISBN; content of various types on electronic networks is described by means of doi and url. Each description is linked to the document. Thanks to this, the MAPS library already enables researchers to go from structured oceanographic data to documents describing it. But this was not enough: documents may contain important information that has not been encoded in the metadata. Thus an advanced Search Engine was put in place that uses semantic-conceptual technologies in order to extract key concepts from unstructured text such as technical documents (reports and grey literature) and scientific papers and to make them indexable and searchable by the end user in the same way as the structured data (such as oceanographic observations and metadata) is. More specifically once a document is uploaded in the MAPS library, key domain concepts in documents are extracted via a natural language processing pipeline and used as additional information for its indexing. The key term identification algorithm is based on marine concepts that were pre-defined in a domain ontology, but crucially it also allows for the discovery of new related concepts. 
So for instance starting from the domain term salinity, related terms such as sea salinity and average sea salinity will also be identified as key terms and used for indexing and searching documents. A hybrid search system is then put in place, where users can search the library by metadata or by free text queries. In the latter case, the NLP pipeline performs an analysis of the text of the query, and when key concepts are matched, the relevant documents are presented. The results may be later refined by using other structured information (e.g. date of publication, area, ...). Currently a running system has been put in place, with data from satellites, buoys and sea stations; such data is documented and searchable by its relevant metadata and documentation. Results of quantitative evaluation in terms of information retrieval measures will be presented in the poster; more specifically, given an evaluation set defined by domain experts and composed of pre-defined queries together with documents that answer such queries, it will be shown how the system is highly accurate in retrieving the correct documents from the library. Though this work focuses on oceanography, its results may be easily extended to other domains; more generally, the possibility of enhancing the visibility and accessibility of grey literature via its connection to the data it describes and to an advanced full text indexing are of great relevance for the topic of this conference.","keywords":["Information Extraction","Search Engine","Oceanography"],"pages":"76-77","url":"https:\/\/publications.cnr.it\/doc\/342221","volume":"17","doi":"","editors_people":"Dominic Farace, Jerry Frantzen","editors":["Farace, D.","Frantzen, J."],"published":"GL17 Program Book","publisher":"","issn":"","isbn":"978-90-77484-26-5","conference_name":"Seventeenth International Conference on Grey Literature. 
A New Wave of Textual and Non-Textual Grey Literature","conference_place":"Amsterdam","conference_date":"December 1-2"},{"id":131894,"last_updated":"2016-03-29 15:25:08","id_people":286944,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"From Synsets to Videos: Enriching ItalWordNet Multimodally","year":2014,"authors_people":"Bartolini R., Quochi V., De Felice, I., Russo I., Monachini M.","authors_cnr":["Quochi, Valeria","Russo, Irene","De Felice, Irene","Monachini, Monica","Bartolini, Roberto"],"authors_cnr_id":["8945","10441"],"authors_cnr_institute":["048","048","048","048","048"],"authors":["Bartolini, R.","Quochi, V.","De Felice, I.","Russo, I.","Monachini, M."],"abstract":"The paper describes the multimodal enrichment of ItalWordNet action verbs' entries by means of an automatic mapping with a conceptual ontology of action types instantiated by video scenes (ImagAct). The two resources present significative differences as well as interesting complementary features, such that a mapping of these two resources can lead to an enrichment of IWN, through the connection between synsets and videos apt to illustrate the meaning described by glosses. Here, we describe an approach inspired by ontology matching methods for the automatic mapping of ImagAct video scenes onto ItalWordNet. The experiments described in the paper are conducted on Italian, but the same methodology can be extended to other languages for which WordNets have been created, since ImagAct is available also for English, Chinese and Spanish. This source of multimodal information can be exploited to design second language learning tools, as well as for language grounding in action recognition in video sources and potentially for robotics.","keywords":["Action ontology","Multimodality","WordNet"],"pages":"3110-3117","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2014\/index.html","volume":"","doi":"","editors_people":"N. Calzolari, K. 
Choukri, T. Declerck, H. Loftsson, B. Maegaard, J. Mariani, A. Moreno, J. Odijk, S. Piperidis","editors":["Calzolari, N.","Choukri, K.","Declerck, T.","Loftsson, H.","Maegaard, B.","Mariani, J.","Moreno, A.","Odijk, J.","Piperidis, S."],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"978-2-9517408-8-4","conference_name":"LREC 2014. European Language Resources Association ELRA: Paris (Francia)","conference_place":"Reykjavik, Iceland","conference_date":"26-31 may"},{"id":131983,"last_updated":"2016-03-29 15:24:09","id_people":291282,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Evaluating ImagAct-WordNet mapping for English and Italian through videos","year":2014,"authors_people":"De Felice I., Bartolini R., Russo I., Quochi V., Monachini M.","authors_cnr":["Quochi, Valeria","Russo, Irene","De Felice, Irene","Monachini, Monica","Bartolini, Roberto"],"authors_cnr_id":["8945","10441"],"authors_cnr_institute":["048","048","","048","048"],"authors":["De Felice, I.","Bartolini, R.","Russo, I.","Quochi, V.","Monachini, M."],"abstract":"In this paper we present the results of the evaluation of an automatic mapping between two lexical resources, WordNet\/ItalWordNet and ImagAct, a conceptual ontology of action types instantiated by video scenes. Results are compared with those obtained from a previous experiment performed only on Italian data. 
Differences between the two evaluation strategies, as well as between the quality of the mappings for the two languages considered in this paper, are discussed.","keywords":["Language Resources (LRs)"],"pages":"128-131","url":"http:\/\/clic.humnet.unipi.it\/proceedings\/Proceedings-CLICit-2014.pdf","volume":"","doi":"10.12871\/CLICIT2014126","editors_people":"Roberto Basili, Alessandro Lenci, Bernardo Magnini","editors":["Basili, R.","Lenci, A.","Magnini, B."],"published":"","publisher":"Pisa University Press srl (Pisa, ITA)","issn":"","isbn":"978-88-67-41472-7","conference_name":"Proceedings of the First Italian Conference on Computational Linguistics CLiC-it 2014 & the Fourth International Workshop EVALITA 2014. Pisa University Press srl: Pisa (Italia)","conference_place":"Pisa","conference_date":"9-11 December 2014, Pisa"},{"id":131987,"last_updated":"2014-12-16 16:51:56","id_people":291816,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Marine Planning and Service Platform (MAPS): An Advanced Research Engine for Grey Literature in Marine Science","year":2014,"authors_people":"Goggi S., Monachini M., Frontini F., Bartolini R., Pardelli G., De Mattei M., Bustaffa F., Manzella G.","authors_cnr":["Frontini, Francesca","Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella"],"authors_cnr_id":["8945","10172","10441","16333"],"authors_cnr_institute":["048","048","048","048","048"],"authors":["Goggi, S.","Monachini, M.","Frontini, F.","Bartolini, R.","Pardelli, G.","De Mattei, M.","Bustaffa, F.","Manzella, G."],"abstract":"The MAPS (Marine Planning and Service Platform) project is a development of the Marine project (Ricerca Industriale e Sviluppo Sperimentale Regione Liguria 2007-2013) aiming at building a computer platform for supporting Operative Oceanography in its activities. 
One of the main objective of the project is to develop a repository that should gather, classify and structure marine scientific literature and data thus guaranteeing their accessibility to researchers and institutions by means of standard protocols. Community and Requirements. Operative Oceanography is the branch of marine research which deals with the development of integrated systems for examining and modeling the ocean monitoring and forecast. Experts need access to real-time data on the state of the sea such as forecasts on temperatures, streams, tides and the relevant scientific literature. This finds application in many areas, ranging from civilian and military safety to protection of off-shore and coastal infrastructures. The metadata. The set of metadata associated with marine data is defined in the CDI (Common Data Index) documented standard. They encode: the types of sizes which have been measured; the measurement tools the platform which has been employed; the geographic area where measures have been taken; the environmental matrix; the descriptive documentation. As concerns the scientific documentation, at the current stage of the CDI standard, a document is shaped around the following metadata: Title, Authors, Version, ISBN\/DOI, Topic, Date of publication, Body\/Institution, Abstract. The search engine. The query system (which is actually under development) has been designed for operating with structured data - the metadata - and raw data - the associated technical and scientific documentation. Full-text technologies are often unsuccessful when applied to this type of queries since they assume the presence of specific keywords in the text; in order to fix this problem, the MAPS project suggests to use different semantic technologies for retrieving the text and data and thus getting much more complying results. 
In the Poster we will present the scenario of the Operative Oceanography together with the technologies used to develop an advanced search engine which aims at providing rapid and efficient access to a Digital Library of oceanographic data. The case-study is also highlighting how the retrieval of grey literature from this specific marine community could be reproduced for similar communities as well, thus revealing the great impact that the processing, re-use as well as application of grey data have on societal needs\/problems and their answers.","keywords":["Marine Science Search Engine Source Data Oceanography"],"pages":"93-94","url":"http:\/\/greyguide.isti.cnr.it\/dfdownloadnew.php?ident=GLConference\/GL16\/2014-G01-015&langver=en&scelta=Metadata","volume":"","doi":"","editors_people":"compiled by D. Farace and J. Frantzen","editors":["Farace, C. B. D.","Frantzen, J."],"published":"","publisher":"","issn":"","isbn":"978-90-77484-24-1","conference_name":"Sixteenth International Conference on Grey Literature Grey Literature Lobby: Engines and Requesters for Change","conference_place":"Library of Congress Washington D. C., USA","conference_date":"December 8-9, 2014"},{"id":132082,"last_updated":"2015-11-18 09:44:01","id_people":335399,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"MAPS: Architettura del Sistema","year":2014,"authors_people":"M. De Mattei; D. Medone; P. D'Angelo; M. Monachini; R. Bartolini; F. 
Frontini","authors_cnr":["Monachini, Monica","Bartolini, Roberto","Frontini, Francesca"],"authors_cnr_id":["8945","10441","15911"],"authors_cnr_institute":["048","048","048"],"authors":["De Mattei, M.","Medone, D.","D'Angelo, P.","Monachini, M.","Bartolini, R.","Frontini, F."],"abstract":"PROGRAMMA OPERATIVO REGIONALE POR-FESR (2007-2013) Asse 1 Innovazione e Competitivit\u00e0 Bando DLTM Azione 1.2.2 \"Ricerca industriale e sviluppo sperimentale a favore delle imprese del Distretto Ligure per le Tecnologie Marine (DLTM) anno 2012. Il presente documento \u00e8 il deliverable \"D3.1 - Architettura del Sistema\" del progetto MAPS (Marine Planning and Service Platform). Il progetto MAPS \u00e8 un'evoluzione del progetto precedente Marine. Tale evoluzione si articola su tre aspetti diversi: - Un meccanismo di federazione dei dati, che consenta di rendere disponibili ai propri utenti non soltanto i dati prodotti internamente da sistema Marine ma anche quelli resi disponibili da altri sistemi similari, soddisfacendo cos\u00ec un pi\u00f9 ampio ambito di esigenze informative. Il deliverable D2.2, Modello della Soluzione specifica in dettaglio queste nuove funzionalit\u00e0. - Un Catalogo dei Documenti che, conservando la documentazione tecnica e scientifica dei prodotti offerti, possa documentare in modo accurato le modalit\u00e0 di misurazione, elaborazione e controllo dei prodotti forniti e quindi i relativi ambiti di applicabilit\u00e0. - Un sistema di ricerca capace di selezionare i dati necessari ad uno scopo determinato non soltanto sulla base della loro tipologia, della loro dislocazione territoriale o di altre informazioni simili contenute nei metadati associati come avviene oggi nella maggior parte dei sistemi esistenti, ma anche sulla base delle informazioni contenute nella documentazione tecnica e scientifica. 
Tali funzionalit\u00e0 sono specificate nel deliverable D1.3 - Modello della Soluzione.","keywords":["Marine Science Search Engine Source Data Oceanography"],"pages":"1-35","url":"https:\/\/publications.cnr.it\/doc\/335399","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132085,"last_updated":"2015-11-18 09:44:09","id_people":335403,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"META: Report di progettazione degli algoritmi individuati","year":2014,"authors_people":"Maurizio De Mattei; Daniele Medone; Maurizio Maltese; Francesca Frontini; Roberto Bartolini; Monica Monachini;","authors_cnr":["Monachini, Monica","Bartolini, Roberto","Frontini, Francesca"],"authors_cnr_id":["8945","10441","15911"],"authors_cnr_institute":["048","048","048"],"authors":["De Mattei, M.","Medone, D.","Maltese, M.","Frontini, F.","Bartolini, R.","Monachini, M."],"abstract":"PROGRAMMA OPERATIVO REGIONALE POR-FESR (2007-2013) Asse 1 Innovazione e Competitivit\u00e0 Bando DLTM Azione 1.2.2 \"Ricerca industriale e sviluppo sperimentale a favore delle imprese del Distretto Ligure per le Tecnologie Marine (DLTM) anno 2012. Il deliverable definisce l'architettura del Sistema di Estrazione Eventi Meteo realizzato dagli autori nell'ambito del progetto META. 
Il sistema estrae da contenuti online informazione su eventi meteo critici verificatesi in Liguria e nel nord della Toscana.","keywords":["Ontology","Information Extraction","Taxonomy"],"pages":"1-19","url":"https:\/\/publications.cnr.it\/doc\/335403","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132083,"last_updated":"2015-11-18 09:44:22","id_people":335400,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"MAPS: Stato dell'Arte","year":2014,"authors_people":"Francesca Frontini; Roberto Bartolini;Monica Monachini","authors_cnr":["Monachini, Monica","Bartolini, Roberto","Frontini, Francesca"],"authors_cnr_id":["8945","10441","15911"],"authors_cnr_institute":["048","048","048"],"authors":["Frontini, F.","Bartolini, R.","Monachini, M."],"abstract":"PROGRAMMA OPERATIVO REGIONALE POR-FESR (2007-2013) Asse 1 Innovazione e Competitivit\u00e0 Bando DLTM Azione 1.2.2 \"Ricerca industriale e sviluppo sperimentale a favore delle imprese del Distretto Ligure per le Tecnologie Marine (DLTM) anno 2012 Il documento descrive lo stato dell'arte delle tecnologie linguistiche applicate ai sistemi di ricerca semantica.","keywords":["Marine Science Search Engine Source Data Oceanography"],"pages":"1-21","url":"https:\/\/publications.cnr.it\/doc\/335400","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132084,"last_updated":"2015-11-18 09:44:12","id_people":335402,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"META:-Report sui modelli e tecniche linguistiche","year":2014,"authors_people":"Francesca Frontini; Roberto Bartolini; Monica Monachini","authors_cnr":["Monachini, Monica","Bartolini, Roberto","Frontini, 
Francesca"],"authors_cnr_id":["8945","10441","15911"],"authors_cnr_institute":["048","048","048"],"authors":["Frontini, F.","Bartolini, R.","Monachini, M."],"abstract":"PROGRAMMA OPERATIVO REGIONALE POR-FESR (2007-2013) Asse 1 Innovazione e Competitivit\u00e0 Bando DLTM Azione 1.2.2 \"Ricerca industriale e sviluppo sperimentale a favore delle imprese del Distretto Ligure per le Tecnologie Marine (DLTM) anno 2012. Il deliverable riassume lo stato dell'arte delle tecnologie semantiche che possono essere impiegate nella realizzazione del progetto META. Il progetto META \u00e8 un progetto di ricerca e sviluppo tecnologico finanziato dalla Regione Liguria con i fondi POR-FESR 2007-2013 della Comunit\u00e0 Europea che mira alla realizzazione di un sistema per l'allerta di eventi meteo critici in Liguria e nel nord della Toscana. Nell'ambito del progetto META le tecnologie semantiche sono utilizzate per estrarre eventi meteo di interesse da articoli pubblicati in rete o sui social network.","keywords":["Ontology","Information Extraction","Semantic Web","Search Engine"],"pages":"1-20","url":"https:\/\/publications.cnr.it\/doc\/335402","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131900,"last_updated":"2014-11-14 11:46:04","id_people":287039,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Stato dell'arte dei motori semantici. 
Progetto MAPS, programma operativo regionale POR-FESR (2007-2013)","year":2014,"authors_people":"Francesca Frontini, Roberto Bartolini, Monica Monachini, Gabriella Pardelli, Sara Goggi","authors_cnr":["Frontini, Francesca","Monachini, Monica","Goggi, Sara","Bartolini, Roberto","Pardelli, Gabriella"],"authors_cnr_id":["8945","10172","10441","16333"],"authors_cnr_institute":["048","048","","048","048"],"authors":["Frontini, F.","Bartolini, R.","Monachini, M.","Pardelli, G.","Goggi, S."],"abstract":"Il presente documento \u00e8 il deliverable \"D1.1 - Stato dell'Arte dei motori semantici\" del progetto MAPS (Marine Planning and Service Platform). Il progetto MAPS \u00e8 una evoluzione del progetto precedente Marine. Tramite il progetto Marine (Bando Ricerca Industriale e Sviluppo Sperimentale Regione Liguria 2007-2013 - pos n.1) \u00e8 stata realizzata una piattaforma informatica di supporto all'Oceanografia Operativa capace di raccogliere dati marini per renderli poi disponibili ai ricercatori e alle organizzazioni interessate tramite protocolli standard. Lo scopo del progetto MAPS \u00e8 quello di realizzare un Catalogo di Documenti contenente informazioni per la piattaforma Marine. 
Caratteristica di MAPS \u00e8 di fornire accesso ai dati oceanografici sia attraverso la ricerca per metadati, sia attraverso la ricerca semantica contenuta nella manualistica tecnico scientifica di riferimento.","keywords":[""],"pages":"1-22","url":"https:\/\/publications.cnr.it\/doc\/287039","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":128655,"last_updated":"2016-04-01 13:36:10","id_people":278677,"institutes":["IIT","ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"GLOSS, an infrastructure for the semantic annotation and mining of documents in the public security domain","year":2012,"authors_people":"Frontini Francesca, Aliprandi Carlo, Bacciu Clara, Bartolini Roberto, Marchetti Andrea, Parenti Enrico, Piccinonno Fulvio, Soru T.","authors_cnr":["Bacciu, Clara","Frontini, Francesca","Marchetti, Andrea","Bartolini, Roberto"],"authors_cnr_id":["1738","10441"],"authors_cnr_institute":[""],"authors":["Frontini, F.","Aliprandi, C.","Bacciu, C.","Bartolini, R.","Marchetti, A.","Parenti, E.","Piccinonno, F.","Soru, T."],"abstract":"Efficient access to information is crucial in the work of organizations that require decision taking in emergency situations. This paper gives an outline of GLOSS, an integrated system for the analysis and retrieval of data in the environmental and public security domain. 
We shall briefly present the GLOSS infrastructure and its use, and how semantic information of various kinds is integrated, annotated and made available to the final users.","keywords":["semantic annotation","text mining","geographic data"],"pages":"21-25","url":"https:\/\/publications.cnr.it\/doc\/278677","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"European language resources association (ELRA) (Paris, FRA)","issn":"","isbn":"978-2-9517408-7-7","conference_name":"Eight International Conference on Language Resources and Evaluation. LREC'12. European Language Resources Association: France","conference_place":"Istanbul","conference_date":"21-27\/05\/2012"},{"id":128383,"last_updated":"2013-06-03 13:58:00","id_people":221743,"institutes":["IIT","ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Specifiche architetturali e funzionali","year":2012,"authors_people":"Aliprandi, Carlo [1]; Bacciu, Clara [2]; Bartolini, Roberto [3]; Frontini, Francesca [3]; Lapolla, Noemi [2]; Marchetti, Andrea [2]; Piccinonno, Fulvio; Soru, Tiziana [1]","authors_cnr":["Bacciu, Clara","Frontini, Francesca","Marchetti, Andrea","Bartolini, Roberto"],"authors_cnr_id":["1738","10441"],"authors_cnr_institute":["044","048","044","048"],"authors":["Aliprandi, C.","Bacciu, C.","Bartolini, R.","Frontini, F.","Lapolla, N.","Marchetti, A.","Piccinonno, F.","Soru, T."],"abstract":"Questo documento contiene le specifiche funzionali ed architetturali del sistema GLOSS elaborate come risultato dell'obiettivo operativo 1. Tali specifiche debbono essere di riferimento per tutte le fasi di sviluppo dei vari componenti del sistema stesso e della loro integrazione in un prototipo dimostrativo. Ad una breve introduzione che richiama gli obiettivi generali del progetto, seguono: 1. La descrizione delle funzionalit\u00e0 suddivisa nelle varie fasi che compongono il flusso operativo di GLOSS. 2. 
La descrizione dell'architettura del sistema da realizzare nella quale si fornisce lo schema dell'integrazione dei vari componenti, il protocollo di comunicazione e memorizzazione dei dati che viene trattato pi\u00f9 nel dettaglio nel documento D1.2 GAF - Gloss Annotation Format, e la descrizione di ciascun componente del sistema. Per sua natura, questo documento sar\u00e0 soggetto a revisione durante tutto il periodo di sviluppo del sistema. Questa prima versione deve intendersi come guida per l'implementazione ed ha lo scopo di fornire a chi partecipa a questo progetto una visione generale delle funzionalit\u00e0 di GLOSS e come queste dovranno essere integrate nel prototipo dimostratore.","keywords":["GLOSS specifiche funzionali"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/221743","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131787,"last_updated":"2020-09-12 01:47:14","id_people":221616,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"D7. 4 Third evaluation report. Evaluation of PANACEA v3 and produced resources","year":2012,"authors_people":"Quochi, Valeria; Frontini, Francesca; Bartolini, Roberto; Hamon, Olivier; Poch Riera, Marc; Padro, Muntsa; Bel, Nuria; Thurmair, Gregor; Toral, Antonio; Kamran, Amir","authors_cnr":["Frontini, Francesca","Bartolini, Roberto","Quochi, Valeria"],"authors_cnr_id":["10441","11893"],"authors_cnr_institute":[""],"authors":["Quochi, V.","Frontini, F.","Bartolini, R.","Hamon, O.","Poch Riera, M.","Padro, M.","Bel, N.","Thurmair, G.","Toral, A.","Kamran, A."],"abstract":"D7.4 reports on the evaluation of the different components integrated in the PANACEA third cycle of development as well as the final validation of the platform itself. All validation and evaluation experiments follow the evaluation criteria already described in D7.1. 
The main goal of WP7 tasks was to test the (technical) functionalities and capabilities of the middleware that allows the integration of the various resource-creation components into an interoperable distributed environment (WP3) and to evaluate the quality of the components developed in WP5 and WP6. The content of this deliverable is thus complementary to D8.2 and D8.3 that tackle advantages and usability in industrial scenarios. It has to be noted that the PANACEA third cycle of development addressed many components that are still under research. The main goal for this evaluation cycle thus is to assess the methods experimented with and their potentials for becoming actual production tools to be exploited outside research labs. For most of the technologies, an attempt was made to re-interpret standard evaluation measures, usually in terms of accuracy, precision and recall, as measures related to a reduction of costs (time and human resources) in the current practices based on the manual production of resources. In order to do so, the different tools had to be tuned and adapted to maximize precision and for some tools the possibility to offer confidence measures that could allow a separation of the resources that still needed manual revision has been attempted. Furthermore, the extension to other languages in addition to English, also a PANACEA objective, has been evaluated. The main facts about the evaluation results are now summarized.","keywords":["PANACEA","evaluation","machine translation"],"pages":"","url":"http:\/\/hdl.handle.net\/10230\/22533","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131698,"last_updated":"2015-03-18 10:56:31","id_people":206269,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"D3. 
3 Second version (v2) of the integrated platform and documentation","year":2011,"authors_people":"Roberto Bartolini, Marc Poch, Olivier Hamon, Antonio Toral, Prokopis Prokopidis, Francesco Rubino, Gregor Thurmair,Vassilis Papavassiliou,Nuria Bel","authors_cnr":["Toral Ruiz, Antonio","Rubino, Francesco","Bartolini, Roberto"],"authors_cnr_id":["10441"],"authors_cnr_institute":["048","048","048"],"authors":["Bartolini, R.","Poch, M.","Hamon, O.","Toral, A.","Prokopidis, P.","Rubino, F.","Thurmair, G.","Papavassiliou, V.","Bel, N."],"abstract":"the integrated platform and documentation of panacea","keywords":["platform"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/206269","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131705,"last_updated":"2015-02-26 12:33:01","id_people":206329,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"KyotoCore: integrated system for knowledge mining from text","year":2011,"authors_people":"Piek Vossen, Wauter Bosma, German Rigau, Eneko Agirre, Aitor Soroa, Carlo Aliprandi, Joost de Jonge, Feikje Hielkema, Monica Monachini, Roberto Bartolini, Francesca Frontini","authors_cnr":["Frontini, Francesca","Monachini, Monica","Bartolini, Roberto"],"authors_cnr_id":["8945","10441"],"authors_cnr_institute":["048","048","048"],"authors":["Vossen, P.","Bosma, W.","Rigau, G.","Agirre, E.","Soroa, A.","Aliprandi, C.","De Jonge, J.","Hielkema, F.","Monachini, M.","Bartolini, R.","Frontini, F."],"abstract":"In this deliverable, we describe KyotoCore, an integrated system for applying text mining. We describe the software architecture of KyotoCore, the single modules and the process flows. 
Finally, we describe a use case where we apply the complete process to an English database on estuaries.","keywords":["Knowledge and text mining software"],"pages":"56","url":"https:\/\/publications.cnr.it\/doc\/206329","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131225,"last_updated":"2012-06-08 12:07:42","id_people":84782,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"A Web-based Architecture for Interoperability of Lexical Resources","year":2010,"authors_people":"Del Gratta R.; D'Onofrio L.; Bartolini R.; Caselli T.; Enea A.; Monachini M.; Quochi V.; Soria C.; Toral A.; Calzolari N.","authors_cnr":["Caselli, Tommaso","Enea, Alessandro","Monachini, Monica","Soria, Claudia","Bartolini, Roberto","Quochi, Valeria","Del Gratta, Riccardo","Zamorani, Nicoletta"],"authors_cnr_id":["8533","8945","9887","10441","11893","11933","26123"],"authors_cnr_institute":["048","048","048","048","048","048","048"],"authors":["Del Gratta, R.","D'Onofrio, L.","Bartolini, R.","Caselli, T.","Enea, A.","Monachini, M.","Quochi, V.","Soria, C.","Toral, A.","Calzolari, N."],"abstract":"In this paper we present a Web Service Architecture for managing high level interoperability of Language Resources (LRs) by means of a Service Oriented Architecture (SOA) and the use of ISO standards, such as ISO LMF. We propose a layered architecture which separates the management of legacy resources (data collection) from data aggregation (workflow) and data access (user requests). 
We provide a case study to demonstrate how the proposed architecture is capable of managing data exchange among different lexical services in a coherent way and show how the use of a lexical standard becomes of primary importance when a protocol of interoperability is defined.","keywords":["Interoperability","Web services","Lexical resources"],"pages":"53-62","url":"http:\/\/weblab.iit.cnr.it\/kyoto\/www2.let.vu.nl\/twiki\/pub\/Kyoto\/Publications\/icgl2010_DOnofrioetal.pdf","volume":"","doi":"","editors_people":"A. Chengyu Fang; N. Ide; J. Webster","editors":["Fang, A. C.","Ide, N.","Webster, J."],"published":"2nd International Conference on Global Interoperability for Language Resources, ICGL 2010","publisher":"City university of Hong Kong press (Hong Kong, CHN)","issn":"","isbn":"978-962-442-323-5","conference_name":"2nd International Conference on Global Interoperability for Language Resources","conference_place":"Hong Kong","conference_date":"18-20 January 2010"},{"id":131648,"last_updated":"2012-06-05 17:55:04","id_people":184375,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"KYOTO: an Open Platform for Mining Facts","year":2010,"authors_people":"Vossen P.; G. Rigau; E. Agirre; A. Soroa; M. Monachini; R. Bartolini","authors_cnr":["Monachini, Monica","Bartolini, Roberto"],"authors_cnr_id":["8945","10441"],"authors_cnr_institute":["048","048"],"authors":["Vossen, P.","Rigau, G.","Agirre, E.","Soroa, A.","Monachini, M.","Bartolini, R."],"abstract":"This paper describes an open text-mining system that was developed for the Asian-European project KYOTO. The KYOTO system uses an open text representation format and a central ontology to enable extraction of knowledge and facts from large volumes of text in many different languages. We implemented a semantic tagging approach that performs off-line reasoning. 
Mining of facts and knowledge is achieved through a flexible pattern matching module that can work in much the same way for different languages, can handle efficiently large volumes of documents and is not restricted to a specific domain. We applied the system to an English database on estuaries","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/184375","volume":"","doi":"","editors_people":"","editors":[""],"published":"ONTOLEX-COLING 2010","publisher":"","issn":"","isbn":"978-7-900268-00-6","conference_name":"OntoLex 2010","conference_place":"Beijing","conference_date":"2010"},{"id":130900,"last_updated":"2012-06-28 13:49:59","id_people":30876,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"A Standard Lexical-Terminological Resource for the Bio Domain","year":2009,"authors_people":"Quochi V.; Del Gratta R.; Sassolini E.; Bartolini R.; Monachini M.; Calzolari N.","authors_cnr":["Quochi, Valeria","Del Gratta, Riccardo","Monachini, Monica","Bartolini, Roberto","Sassolini, Eva","Zamorani, Nicoletta"],"authors_cnr_id":["8945","10441","11032","26123"],"authors_cnr_institute":[""],"authors":["Quochi, V.","Del Gratta, R.","Sassolini, E.","Bartolini, R.","Monachini, M.","Calzolari, N."],"abstract":"The present paper describes a large-scale lexical resource for the biology domain designed both for human and for machine use. This lexicon aims at semantic interoperability and extendability, through the adoption of ISO-LMF standard for lexical representation and through a granular and distributed encoding of relevant information. The first part of this contribution focuses on three aspects of the model that are of particular interest to the biology community: the treatment of term variants, the representation on bio events and the alignment with a domain ontology. 
The second part of the paper describes the physical implementation of the model: a relational database equipped with a set of automatic uploading procedures. Peculiarity of the BioLexicon is that it combines features of both terminologies and lexicons. A set of verbs relevant for the domain is also represented with full details on their syntactic and semantic argument structure.","keywords":["Lexical representation model","Lexical Database","Computational Lexicography","Special Domains","Standards"],"pages":"325-335","url":"https:\/\/publications.cnr.it\/doc\/30876","volume":"5603","doi":"10.1007\/978-3-642-04235-5_28","editors_people":"","editors":[""],"published":"Lecture notes in computer science","publisher":"Springer (Berlin, Germania)","issn":"0302-9743","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131152,"last_updated":"2012-05-31 17:40:06","id_people":84699,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"A Bilingual Corpus of Inter-linked Events","year":2008,"authors_people":"Caselli T.; Ide N.; Bartolini R.","authors_cnr":["Caselli, Tommaso","Bartolini, Roberto"],"authors_cnr_id":["10441"],"authors_cnr_institute":["048","048"],"authors":["Caselli, T.","Ide, N.","Bartolini, R."],"abstract":"This paper describes the creation of a bilingual corpus of inter-linked events for Italian and English. Linkage is accomplished through the Inter-Lingual Index (ILI) that links ItalWordNet with WordNet. The availability of this resource, on the one hand, enables contrastive analysis of the linguistic phenomena surrounding events in both languages, and on the other hand, can be used to perform multilingual temporal analysis of texts. 
In addition to describing the methodology for construction of the inter-linked corpus and the analysis of the data collected, we demonstrate that the ILI could potentially be used to bootstrap the creation of comparable corpora by exporting layers of annotation for words that have the same sense.","keywords":["Corpus (creation","annotation","etc.)","Semantics","Validation of LRs"],"pages":"2424-2429","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2008\/pdf\/610_paper.pdf","volume":"","doi":"","editors_people":"Nicoletta Calzolari (Conference Chair); Khalid Choukri; Bente Maegaard; Joseph Mariani; Jan Odjik; Stelios Piperidis; Daniel Tapias","editors":["Calzolari, N.","Choukri, K.","Maegaard, B.","Mariani, J.","Odjik, J.","Piperidis, S.","Tapias, D."],"published":"LREC 2008, Sixth International Conference on Language Resources and Evaluation","publisher":"European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)","issn":"","isbn":"2-9517408-4-0","conference_name":"LREC 2008, Sixth International Conference on Language Resources and Evaluation","conference_place":"Marrakech, Marocco","conference_date":"26 May-1 June 2008"},{"id":131180,"last_updated":"2015-02-04 12:25:18","id_people":84729,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"UFRA: a UIMA-based Approach to Federated Language Resource Architecture","year":2008,"authors_people":"Del Gratta R.; Bartolini R.; Caselli T.; Monachini M.; Soria C.; Calzolari N.","authors_cnr":["Del Gratta, Riccardo","Caselli, Tommaso","Monachini, Monica","Soria, Claudia","Bartolini, Roberto","Zamorani, Nicoletta"],"authors_cnr_id":["8945","9887","10441","26123"],"authors_cnr_institute":[""],"authors":["Del Gratta, R.","Bartolini, R.","Caselli, T.","Monachini, M.","Soria, C.","Calzolari, N."],"abstract":"In this paper we address the issue of developing an interoperable infrastructure for language resources 
and technologies. In our approach, called UFRA, we extend the Federate Database Architecture System adding typical functionalities coming from UIMA. In this way, we capitalize the advantages of a federated architecture, such as autonomy, heterogeneity and distribution of components, monitored by a central authority responsible for checking both the integration of components and user rights on performing different tasks. We use the UIMA approach to manage and define one common front-end, enabling users and clients to query, retrieve and use language resources and technologies. The purpose of this paper is to show how UIMA leads from a Federated Database Architecture to a Federated Resource Architecture, adding to a registry of available components both static resources such as lexicons and corpora and dynamic ones such as tools and general purpose language technologies. At the end of the paper, we present a case-study that adopts this framework to integrate the SIMPLE lexicon and TIMEML annotation guidelines to tag natural language texts.","keywords":["LR Infrastructures and Architectures","LR web services","Lexicon","Lexical database"],"pages":"2634-2639","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2008\/pdf\/656_paper.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"2-9517408-4-0","conference_name":"LREC 2008, Sixth International Conference on Language Resources and Evaluation","conference_place":"Marrakech, Marocco","conference_date":"26 May-1 June 2008"},{"id":131177,"last_updated":"2012-06-07 20:38:43","id_people":84726,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Ontology Learning and Semantic Annotation: a Necessary Symbiosis","year":2008,"authors_people":"Giovannetti E.; Marchi S.; Montemagni S.; Bartolini R.","authors_cnr":["Giovannetti, Emiliano","Montemagni, 
Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["5595","10441","10442"],"authors_cnr_institute":["048","048","048","048"],"authors":["Giovannetti, E.","Marchi, S.","Montemagni, S.","Bartolini, R."],"abstract":"Semantic annotation of text requires the dynamic merging of linguistically structured information and a \"world model\", usually represented as a domain-specific ontology. On the other hand, the process of engineering a domain-ontology through semi-automatic ontology learning system requires the availability of a considerable amount of semantically annotated documents. Facing this bootstrapping paradox requires an incremental process of annotation-acquisition-annotation, whereby domain-specific knowledge is acquired from linguistically-annotated texts and then projected back onto texts for extra linguistic information to be annotated and further knowledge layers to be extracted. The presented methodology is a first step in the direction of a full \"virtuous\" circle where the semantic annotation platform and the evolving ontology interact in symbiosis. As a case study we have chosen the semantic annotation of product catalogues. We propose a hybrid approach, combining pattern matching techniques to exploit the regular structure of product descriptions in catalogues, and Natural Language Processing techniques which are resorted to analyze natural language descriptions. 
The semantic annotation involves the access to the ontology, semi-automatically bootstrapped with an ontology learning tool from annotated collections of catalogues.","keywords":["Information Extraction","Information Retrieval","Ontologies","Tools","Systems"],"pages":"2079-2085","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2008\/","volume":"","doi":"","editors_people":"Nicoletta Calzolari (Conference Chair); Khalid Choukri; Bente Maegaard; Joseph Mariani; Jan Odjik; Stelios Piperidis; Daniel Tapias","editors":["Calzolari, N.","Choukri, K.","Maegaard, B.","Mariani, J.","Odjik, J.","Piperidis, S.","Tapias, D."],"published":"LREC 2008, Sixth International Conference on Language Resources and Evaluation","publisher":"European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)","issn":"","isbn":"2-9517408-4-0","conference_name":"LREC 2008, Sixth International Conference on Language Resources and Evaluation","conference_place":"Marrakech, Marocco","conference_date":"2008"},{"id":131145,"last_updated":"2014-07-28 11:46:33","id_people":84690,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Ontology-based Semantic Annotation of Product Catalogues","year":2007,"authors_people":"Giovannetti E, Marchi S, Montemagni S., Bartolini R.","authors_cnr":["Giovannetti, Emiliano","Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["5595","10441","10442"],"authors_cnr_institute":["048","048","048","048"],"authors":["Giovannetti, E.","Marchi, S.","Montemagni, S.","Bartolini, R."],"abstract":"This paper describes a methodology for the semantic annotation of product catalogues. We propose a hybrid approach, combining pattern matching techniques to exploit the regular structure of product descriptions in catalogues, and Natural Language Processing techniques which are resorted to analyze natural language descriptions. 
It also includes the access to an application ontology, semi-automatically bootstrapped from collections of catalogues with an ontology learning tool, which is used to drive the semantic annotation process.","keywords":["Semantic Annotation of texts","Ontology Learning","Information Extraction for e-commerce"],"pages":"235-239","url":"https:\/\/publications.cnr.it\/doc\/84690","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of the International Conference \"Recent Advances in Natural Language Processing\"","publisher":"","issn":"","isbn":"","conference_name":"Recent Advances in Natural Language Processing (RANLP-2007)","conference_place":"Borovets","conference_date":"27-29 settembre 2007"},{"id":131137,"last_updated":"2009-06-16 00:00:00","id_people":84682,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Automatic Extraction of Semantics in Law Documents","year":2007,"authors_people":"Soria C., Bartolini R., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Soria, Claudia","Bartolini, Roberto"],"authors_cnr_id":["326","5595","9887","10441"],"authors_cnr_institute":[""],"authors":["Soria, C.","Bartolini, R.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84682","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"V Legislative XML Workshop","conference_place":"Firenze","conference_date":"2007"},{"id":131572,"last_updated":"2009-06-16 00:00:00","id_people":157442,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"TimeML: An Ontological Mapping onto the UIMA Type Systems","year":2007,"authors_people":"Del Gratta R., Bartolini R., Caselli T., Enea A., Monachini M., Quochi V., Sassolini V.","authors_cnr":["Sassolini, Eva","Quochi, Valeria","Del 
Gratta, Riccardo","Caselli, Tommaso","Enea, Alessandro","Monachini, Monica","Bartolini, Roberto"],"authors_cnr_id":["8533","8945","10441"],"authors_cnr_institute":[""],"authors":["Del Gratta, R.","Bartolini, R.","Caselli, T.","Enea, A.","Monachini, M.","Quochi, V.","Sassolini, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157442","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131570,"last_updated":"2016-07-20 15:08:53","id_people":157440,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Report on Ontology learning tool and testing","year":2007,"authors_people":"Montemagni S., Marchi S., Venturi G., Bartolini R., Bertagna F., Ruffolo P., Peters W., Tiscornia D.","authors_cnr":["Bertagna, Francesca","Ruffolo, Paolo","Venturi, Giulia","Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["5595","10441","10442"],"authors_cnr_institute":[""],"authors":["Montemagni, S.","Marchi, S.","Venturi, G.","Bartolini, R.","Bertagna, F.","Ruffolo, P.","Peters, W.","Tiscornia, D."],"abstract":"This deliverable documents the work done within the DALOS EU project for what concerns the definition and implementation of methodologies and techniques to bootstrap terminological and ontological knowledge from domain corpora. 
Starting from a corpus of legacy legislative texts in different languages, linguistic technologies combined with statistical techniques have been used to extract significant terms as well as to structure them in conceptual structures for the different languages dealt with within the project, namely Italian, English, Spanish and Dutch.","keywords":["Ontology Learning","Term Extraction","Natural Language Processing","Conceptual Indexing"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157440","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131070,"last_updated":"2009-06-16 00:00:00","id_people":84608,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Creation and Use of Lexicons and Ontologies for NL Interfaces to Databases","year":2006,"authors_people":"Bartolini R., Caracciolo C., Giovannetti E., Lenci A., Marchi S., Pirrelli V., Renso C., Spinsanti L.","authors_cnr":["Giovannetti, Emiliano","Pirrelli, Vito","Bartolini, Roberto"],"authors_cnr_id":["326","10441"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Caracciolo, C.","Giovannetti, E.","Lenci, A.","Marchi, S.","Pirrelli, V.","Renso, C.","Spinsanti, L."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84608","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"LREC 2006: 5th International Conference on Language Resources and Evaluation (LREC)","conference_place":"Genova","conference_date":"2006"},{"id":286671,"last_updated":"2023-08-23 14:08:08","id_people":91313,"institutes":["ILC","ISTI"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Creation and use of lexicons and ontologies for natural language interface to databases","year":2006,"authors_people":"Bartolini R., 
Caracciolo C., Giovannetti E., Lenci A., Marchi S., Pirrelli V., Renso C., Spinsanti L.","authors_cnr":["Pirrelli, Vito","Renso, Chiara","Bartolini, Roberto","Giovannetti, Emiliano"],"authors_cnr_id":["326","7670","10441","11969"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Caracciolo, C.","Giovannetti, E.","Lenci, A.","Marchi, S.","Pirrelli, V.","Renso, C.","Spinsanti, L."],"abstract":"In this paper we present an original approach to natural language query interpretation which has been implemented within the FuLL (Fuzzy Logic and Language) Italian project of BC S.r.l. In particular, we discuss here the creation of linguistic and ontological resources, together with the exploitation of existing ones, for natural language-driven database access and retrieval. Both the database and the queries we experiment with are Italian, but the methodology we broach naturally extends to other languages.","keywords":["Natural language processing","ontologies","gis","databases"],"pages":"6","url":"https:\/\/publications.cnr.it\/doc\/91313","volume":"","doi":"","editors_people":"","editors":[""],"published":"LREC 2006","publisher":"","issn":"","isbn":"","conference_name":"LREC Conference","conference_place":"Genova","conference_date":"24-26\/05\/2006"},{"id":131124,"last_updated":"2023-07-10 09:15:54","id_people":84664,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Multimedia Information Extraction in Ontology-based Semantic Annotation of Product Catalogues","year":2006,"authors_people":"Bartolini R., Giovannetti E., Marchi S., Montemagni S., Andreatta C., Brunelli R., Stecher R. 
and Bouquet P.","authors_cnr":["Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone","Giovannetti, Emiliano"],"authors_cnr_id":["5595","10441","10442","11969"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Giovannetti, E.","Marchi, S.","Montemagni, S.","Andreatta, C.","Brunelli, R.","Stecher, R.","Bouquet, P."],"abstract":"The demand for efficient methods for extracting knowledge from multimedia content has led to a growing research community investigating the convergence of multimedia and knowledge technologies. In this paper we describe a methodology for extracting multimedia information from product catalogues empowered by the synergetic use and extension of a domain ontology. The methodology was implemented in the Trade Fair Advanced Semantic Annotation Pipeline of the VIKE-framework.","keywords":["Semantic Web Technologies","ontology creation","ontology extraction","ontology evolution","semantic annotation of multimedia content"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84664","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"SWAP 2006","conference_place":"Pisa","conference_date":"18-20 December 2006"},{"id":131123,"last_updated":"2014-07-28 11:57:41","id_people":84663,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Ontology Learning in Multimedia Information Extraction from Product Catalogues","year":2006,"authors_people":"Bartolini R., Giovannetti E., Marchi S., Montemagni S., Andreatta C., Brunelli R., Stecher R., Nieder\u00e9e C., Bouquet P. 
and Bortoli S.","authors_cnr":["Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone","Giovannetti, Emiliano"],"authors_cnr_id":["5595","10441","10442","11969"],"authors_cnr_institute":["048"],"authors":["Bartolini, R.","Giovannetti, E.","Marchi, S.","Montemagni, S.","Andreatta, C.","Brunelli, R.","Stecher, R.","Nieder\u00e9e, C.","Bouquet, P.","Bortoli, S."],"abstract":"We propose a methodology for extracting multimedia information from product catalogues empowered by the synergetic use and extension of a domain ontology. The use of domain ontologies in this context additionally opens up innovative ways of catalogue use. The method is characterized by incrementally feeding and exploiting the ontology during an information extraction process, implemented by the semantic annotation of the analysed document, and by providing support for detecting existing similar ontologies to enable reuse of (parts of) them.","keywords":["knowledge-drive multimedia analysis","ontology learning","semi-automatic content annotation tools"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84663","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"BOEMIE 2006","conference_place":"Podebrady, Czech Republic","conference_date":"6 ottobre 2006"},{"id":131437,"last_updated":"2023-11-06 19:34:25","id_people":151563,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Text-to-Knowledge (T2K) Versione 2","year":2006,"authors_people":"Bartolini R., Dell'Orletta F., Lenci A., Marchi S., Montemagni S., Pirrelli V.","authors_cnr":["Dell'Orletta, Felice","Pirrelli, Vito","Montemagni, Simonetta","Marchi, Simone"],"authors_cnr_id":["326","5595","10442"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Dell'Orletta, F.","Lenci, A.","Marchi, S.","Montemagni, S.","Pirrelli, V."],"abstract":"Versione 2. 
Text-to-Knowledge (T2K) \u00e8 una piattaforma software di supporto avanzato alla gestione documentale per la creazione dinamica di repertori terminologici e ontologie di dominio a partire da testi e per l'indicizzazione concettuale di documenti. Il sistema T2K si propone di offrire una batteria integrata di strumenti avanzati di analisi linguistica del testo, analisi statistica e apprendimento automatico del linguaggio, destinati a offrire una rappresentazione accurata del contenuto di una base documentale non strutturata, per scopi di indicizzazione avanzata e navigazione intelligente. I risultati di questo processo di acquisizione sono annotati in forma di metadati XML, offrendo in tal modo la prospettiva di una sempre crescente e diretta interoperabilit\u00e0 con sistemi automatici per la produzione di contenuti digitali selezionati e strutturati dinamicamente su misura, per diversi profili di utenza. Versioni prototipali di T2K sono gi\u00e0 operative su alcuni portali della pubblica amministrazione e sono state applicate per l'indicizzazione di contenuti didattici multimediali. 
E' in corso l'integrazione della tecnologia T2K nel sistema di gestione informatica di documentazione scientifica del CNR.","keywords":["text to knowledge","nlp","estrazione terminologica","ontology learning","indicizzazione terminologica"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151563","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131039,"last_updated":"2015-02-23 14:55:26","id_people":84576,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Automatic Incremental Term Acquisition from Domain Corpora","year":2005,"authors_people":"Bartolini R., Giorgetti D., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Bartolini, Roberto"],"authors_cnr_id":["326","5595","10441"],"authors_cnr_institute":["048"],"authors":["Bartolini, R.","Giorgetti, D.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"We describe a technique for the acquisition of terms from Italian domain text corpora, which relies both on sophisticated linguistic analysis and on statistical measures applied to linguistically processed text rather than to raw text as it is usually the case. The main advantage of this technique is that minimal a priori knowledge of term structure is required, thus allowing to explore and discover terms in a given domain without imposing a strict pattern matching structure on them, and also to easily extend it to different domains. The approach we present in this paper is incremental as it may be iterated to discover terms of increasing complexity built on top of terms discovered in the previous iteration. 
The reason why it is convenient to adopt such an incremental approach is that it allows to \"clean\" data from noise in the first step, elicitating the constituent terms, and then to refine term acquisition on \"skimmed\" term data.","keywords":[""],"pages":"293-300","url":"https:\/\/publications.cnr.it\/doc\/84576","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of TKE 2005-7th International Conference on Terminology and Knowledge Engineering","publisher":"","issn":"","isbn":"","conference_name":"7th International conference on Terminology and Knowledge Engineering (TKE2005)","conference_place":"Copenhagen","conference_date":"2005"},{"id":131496,"last_updated":"2020-11-27 14:35:54","id_people":157365,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Motore semantico. Documento di progettazione e sviluppo","year":2005,"authors_people":"Bartolini R., Caracciolo C., Lenci A., Marchi S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["326","10441","10442"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Caracciolo, C.","Lenci, A.","Marchi, S.","Pirrelli, V."],"abstract":"Il presente documento descrive architettura, funzionalit\u00e0 e algoritmo di un componente software dedicato, designato come \"Motore Semantico\", che ha lo scopo di produrre rappresentazioni logico-concettuali, ontologicamente interpretate, di interrogazioni in linguaggio naturale su una base di dati di tipo anche GIS.","keywords":["NLP"],"pages":"1-42","url":"https:\/\/publications.cnr.it\/doc\/157365","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131497,"last_updated":"2020-11-27 14:35:04","id_people":157366,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ILC-CNR Contribution to 
Deliverable 4. 1","year":2005,"authors_people":"Bartolini R., Giorgetti D., Marchi S., Montemagni S.","authors_cnr":["Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["5595","10441","10442"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Giorgetti, D.","Marchi, S.","Montemagni, S."],"abstract":"The goal of the semantic annotation is the annotation of entities and relations starting from input documents conformant with the harmonisation output schema as defined within WP3. This harmonisation schema will focus on the structural and logical organisation of the documents, while WP4 will concentrate on the annotation of textual entities and image elements. The results of semantic annotation are intended to populate the domain ontology.","keywords":["NLP"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157366","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131498,"last_updated":"2020-11-27 14:35:36","id_people":157367,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Personalizzazione degli Italian NLP tools","year":2005,"authors_people":"Bartolini R., Lenci A., Marchi S., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["326","5595","10441","10442"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Lenci, A.","Marchi, S.","Montemagni, S.","Pirrelli, V."],"abstract":"Il presente documento intende offrire criteri e risultati della fase di personalizzazione dei moduli per l'analisi automatica del testo (Italian NLP tools o \"AnITA\") all'interno dell'architettura prevista nell'ambito del progetto 
FuLL.","keywords":["NLP"],"pages":"13","url":"https:\/\/publications.cnr.it\/doc\/157367","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131500,"last_updated":"2009-06-16 00:00:00","id_people":157369,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Modellazione del motore sintattico e delle strutture dati di supporto","year":2005,"authors_people":"Bartolini R., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157369","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131501,"last_updated":"2023-07-11 15:16:12","id_people":157370,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Text-2-Knowledge: Acquisizione semi-automatica di ontologie per l'indicizzazione semantica di documenti","year":2005,"authors_people":"Bartolini R., Lenci L., Marchi S., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["326","5595","10441","10442"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Lenci, L.","Marchi, S.","Montemagni, S.","Pirrelli, V."],"abstract":"Text-2-Knowledge, Acquisizione semi-automatica di ontologie per l'indicizzazione semantica di documenti","keywords":["nlp","terminology 
extraction"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157370","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131425,"last_updated":"2023-11-06 19:34:27","id_people":151548,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Text-to-Knowledge (T2K)","year":2005,"authors_people":"Bartolini R., Dell'Orletta F., Giorgetti D., Marchi S., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Dell'Orletta, Felice","Pirrelli, Vito","Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["326","5595","10441","10442"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Dell'Orletta, F.","Giorgetti, D.","Marchi, S.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"Piattaforma di estrazione e indicizzazione terminologica.","keywords":["NLP","estrazione terminologica"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151548","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131426,"last_updated":"2009-06-18 00:00:00","id_people":151550,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"NLPtools","year":2005,"authors_people":"Bartolini R., Marchi S., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Marchi, S.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151550","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":130892,"last_updated":"2023-06-27 
11:50:18","id_people":30867,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Automatic Classification and Analysis of Provisions in Italian Legal Texts: A Case Study","year":2004,"authors_people":"Bartolini R.; Lenci A.; Montemagni S.; Pirrelli V.; Soria C.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Soria, Claudia","Bartolini, Roberto"],"authors_cnr_id":["326","5595","9887","10441"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Lenci, A.","Montemagni, S.","Pirrelli, V.","Soria, C."],"abstract":"In this paper we address the problem of automatically enriching legal texts with semantic annotation, an essential pre\u2013requisite to effective indexing and retrieval of legal documents. This is done through illustration of SALEM (Semantic Annotation for LEgal Management), a computational system developed for automated semantic annotation of (Italian) law texts. SALEM is an incremental system using Natural Language Processing techniques to perform two tasks: i) classify law paragraphs according to their regulatory content, and ii) extract relevant text fragments corresponding to specific semantic roles that are relevant for the different types of regulatory content. The paper sketches the overall architecture of SALEM and reports results of a preliminary case study on a sample of Italian law texts.","keywords":["Annotazione semantica","Classificazione automatica"],"pages":"593-604","url":"https:\/\/rdcu.be\/dftjm","volume":"3292","doi":"10.1007\/978-3-540-30470-8_72","editors_people":"Meersman, R., Tari, Z., Corsaro, A.","editors":["Meersman, R.","Tari, Z.","Corsaro, A."],"published":"On the Move to Meaningful Internet Systems 2004: OTM 2004 Workshops. 
OTM 2004","publisher":"Springer (Berlin, DEU)","issn":"","isbn":"978-3-540-23664-1","conference_name":"","conference_place":"","conference_date":""},{"id":131034,"last_updated":"2009-06-16 00:00:00","id_people":84570,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Hybrid Constraints for Robust Parsing: First Experiments and Evaluation","year":2004,"authors_people":"Bartolini R., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84570","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"LREC 2004: Fourth International Conference on Language Resources and Evaluation","conference_place":"Lisbon, Portugal","conference_date":"2004"},{"id":131035,"last_updated":"2012-05-04 11:58:28","id_people":84571,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Semantic Mark-up of Italian Legal Texts Through NLP-based Techniques","year":2004,"authors_people":"Bartolini R.; Lenci A.; Montemagni S.; Pirrelli V.; Soria C.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Soria, Claudia","Bartolini, Roberto"],"authors_cnr_id":["326","5595","9887","10441"],"authors_cnr_institute":["048","048","048","048"],"authors":["Bartolini, R.","Lenci, A.","Montemagni, S.","Pirrelli, V.","Soria, C."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84571","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"2-9517408-1-6","conference_name":"LREC 2004: Fourth International Conference on Language Resources and Evaluation","conference_place":"Lisbon, 
Portugal","conference_date":"2004"}]