% Journal article: revisits the LRE Map after nine years, using data from 21 conferences.
@ARTICLE{DELGRATTA_2021_ARTICLE_DGPC_451726,
  AUTHOR = {Del Gratta, R. and Goggi, S. and Pardelli, G. and Calzolari, N.},
  TITLE = {The {LRE} {Map}: what does it tell us about the last decade of our field?},
  YEAR = {2021},
  ABSTRACT = {The LRE Map of Language Resources was introduced at LREC 2010. Its intended purpose was: "to shed light on the vast amount of resources that represent the background of the research presented at LREC" (Calzolari et al. in: Calzolari et al. (eds) Proceedings of the seventh international conference on language resources and evaluation (LREC'10). European Language Resources Association (ELRA), Valletta, 2010). It also aimed at a change of culture in the field, actively engaging each researcher both in the documentation task about resources and in sharing resources. When we started to use it regularly also in other conferences, it became clear that it was an innovative instrument able to provide a picture of the field and its evolution as reflected by the creation and use of Language Resources. After 9 years we revisit the Map, considerably extending the data analysed in an LREC 2018 paper. The LRE Map data analysed here have been provided by the authors of 21 conferences during the phase of submission of papers, and contain information about 9405 resources. 
We analyse the LRE Map data from many different viewpoints and the paper reports on the global picture, along the many Map dimensions, on different trends emerging from a diachronic perspective and finally on some comparisons between five editions of the two major conferences present in the Map: LREC and COLING.},
  KEYWORDS = {LR infrastructure, metadata, LR documentation},
  PAGES = {259--283},
  URL = {https://link.springer.com/article/10.1007/s10579-020-09520-6},
  VOLUME = {55},
  DOI = {10.1007/s10579-020-09520-6},
  PUBLISHER = {Springer},
  ADDRESS = {Dordrecht, Netherlands},
  ISSN = {1574-020X},
  JOURNAL = {Language Resources and Evaluation},
}

% Journal article (The Grey Journal): corpus of WorldWideScience.org query logs.
@ARTICLE{GOGGI_2019_ARTICLE_GPBMBC_411599,
  AUTHOR = {Goggi, S. and Pardelli, G. and Bartolini, R. and Monachini, M. and Biagioni, S. and Carlesi, C.},
  TITLE = {Semantic Query Analysis from the {Global} {Science} {Gateway}},
  YEAR = {2019},
  ABSTRACT = {Nowadays web portals play an essential role in searching and retrieving information in the several fields of knowledge: they are ever more technologically advanced and designed for supporting the storage of a huge amount of information in natural language originating from the queries launched by users worldwide. 
Given this scenario, we focused on building a corpus constituted by the query logs registered by the GreyGuide: Repository and Portal to Good Practices and Resources in Grey Literature and received by the WorldWideScience.org (The Global Science Gateway) portal: the aim is to retrieve information related to social media which as of today represent a considerable source of data more and more widely used for research ends.},
  KEYWORDS = {Information Extraction, Query Log, WorldWideScience Alliance, Information gateways, Social Media},
  PAGES = {147--155},
  URL = {https://publications.cnr.it/doc/411599},
  VOLUME = {15},
  PUBLISHER = {TextRelease},
  ADDRESS = {Amsterdam, Netherlands},
  ISSN = {1574-1796},
  JOURNAL = {The Grey Journal},
}

% Journal article: comparative study of the AIUCD and CLiC-it conferences, 2014-2017.
@ARTICLE{SPRUGNOLI_2019_ARTICLE_SPBD_403257,
  AUTHOR = {Sprugnoli, R. and Pardelli, G. and Boschetti, F. and Del Gratta, R.},
  TITLE = {Un'Analisi Multidimensionale della Ricerca Italiana nel Campo delle {Digital} {Humanities} e della Linguistica Computazionale},
  YEAR = {2019},
  ABSTRACT = {This article proposes the first comparative study of four years of Italian conferences in the fields of Digital Humanities and Computational Linguistics. More specifically, we created a corpus consisting of the contributions presented in the AIUCD and CLiC-it conferences between 2014 and 2017 to which we applied a multidimensional analysis taking into consideration: (i) the study of collaborations between authors using social networks analysis techniques, (ii) the automatic extraction of terminology and information and (iii) the examination of citational practices. 
By combining both qualitative and quantitative methods of investigation, this paper aims to shed light on convergences and discrepancies between two research areas that historically have common origins.},
  KEYWORDS = {Digital Humanities, Computational Linguistics, Comparative study},
  PAGES = {59--89},
  URL = {https://umanisticadigitale.unibo.it/article/view/8581},
  VOLUME = {5},
  DOI = {10.6092/issn.2532-8816/8581},
  ISSN = {2532-8816},
  JOURNAL = {Umanistica Digitale},
}

% CLiC-it 2019 paper: diachronic study of research interests in the TEI community.
@INPROCEEDINGS{BOSCHETTI_2019_INPROCEEDINGS_BPV_409872,
  AUTHOR = {Boschetti, F. and Pardelli, G. and Venturi, G.},
  TITLE = {Nove Anni di {jTEI}: What's New?},
  YEAR = {2019},
  ABSTRACT = {Questo contributo illustra metodi e strumenti per studiare il cambiamento diacronico degli interessi di ricerca della comunità TEI grazie all'uso di metodi di estrazione automatica della terminologia da corpora di dominio.},
  KEYWORDS = {Natural Language Processing, Digital Humanities},
  PAGES = {1--6},
  URL = {http://ceur-ws.org/Vol-2481},
  SERIES = {CEUR Workshop Proceedings},
  VOLUME = {2481},
  URN = {urn:nbn:de:0074-2481-7},
  PUBLISHER = {CEUR-WS.org},
  ADDRESS = {Aachen, Germany},
  CONFERENCE_NAME = {CLiC-it 2019-Sesta Conferenza Italiana di Linguistica Computazionale},
  CONFERENCE_PLACE = {Bari},
  CONFERENCE_DATE = {13-15/11/2019},
  BOOKTITLE = {CLiC-it 2019 Italian Conference on Computational Linguistics},
  EDITOR = {Bernardi, R. and Navigli, R. and Semeraro, G.},
}

% GL20 conference paper: corpus of query logs received by WorldWideScience.org.
@INPROCEEDINGS{GOGGI_2019_INPROCEEDINGS_GPBMBC_400343,
  AUTHOR = {Goggi, S. and Pardelli, G. and Bartolini, R. and Monachini, M. and Biagioni, S. 
and Carlesi, C.},
  TITLE = {Semantic query analysis from the global science gateway},
  YEAR = {2019},
  ABSTRACT = {We focused on building a corpus constituted by the query logs registered by the GreyGuide: Repository and Portal to Good Practices and Resources in Grey Literature and received by the WorldWideScience.org (The Global Science Gateway) portal.},
  KEYWORDS = {Information Extraction, Terminology},
  PAGES = {105--113},
  URL = {https://publications.cnr.it/doc/400343},
  VOLUME = {20},
  ISBN = {978-90-77484-33-3},
  CONFERENCE_NAME = {GL20-Twentieth International Conference on Grey Literature: Research Data Fuels and Sustains Grey Literature},
  CONFERENCE_PLACE = {New Orleans, USA},
  CONFERENCE_DATE = {3-4 December 2018},
  BOOKTITLE = {Research Data Fuels and Sustains Grey Literature},
  EDITOR = {Farace, D. and Frantzen, J.},
}

% AIUCD 2019 contribution: early history shared by Computational Linguistics and Digital Humanities.
@INPROCEEDINGS{PARDELLI_2019_INPROCEEDINGS_PGB_398956,
  AUTHOR = {Pardelli, G. and Goggi, S. and Boschetti, F.},
  TITLE = {Strolling around the dawn of {Digital} {Humanities}},
  YEAR = {2019},
  ABSTRACT = {Nelle ricerche umanistiche l'impiego dell'elaboratore elettronico prende il via nella seconda metà del ventesimo secolo favorendo l'uso di metodi statistici sia nello studio di opere letterarie che nello studio delle lingue, promuovendo un sodalizio interdisciplinare che è arrivato ai giorni nostri senza interruzione. In questo contributo tentiamo di fissare alcuni momenti salienti del processo che ha visto la nascita comune della Linguistica Computazionale e delle Digital Humanities nonché i loro alterni allontanamenti e ricongiungimenti.},
  KEYWORDS = {Digital Humanities (DH), Computational Linguistics (CL), History},
  PAGES = {261--264},
  URL = {http://aiucd2019.uniud.it/book-of-abstracts/},
  CONFERENCE_NAME = {8th Annual Conference AIUCD 2019. 
Teaching and research in Digital Humanities' era},
  CONFERENCE_PLACE = {Udine, Dipartimento Di Studi Umanistici e Patrimonio Culturale, Università di Udine},
  CONFERENCE_DATE = {23-25 gennaio 2019},
}

% Journal article (The Grey Journal): grey literature access through the CLARIN infrastructure.
@ARTICLE{GOGGI_2018_ARTICLE_GPRBM_388612,
  AUTHOR = {Goggi, S. and Pardelli, G. and Russo, I. and Bartolini, R. and Monachini, M.},
  TITLE = {Providing Access to Grey Literature: The {CLARIN} Infrastructure},
  YEAR = {2018},
  ABSTRACT = {"In the electronic age, the World Wide Web has played a major role in making scientific information accessible to a wide audience more rapidly and efficiently. This democratic approach to information dissemination in science is changing the way science is perceived and implemented in our daily lives" (Weintraub, 2000).},
  KEYWORDS = {CLARIN-IT, CLARIN-European Research Infrastructure for Language Resources and Technology, Grey Literature},
  PAGES = {87--93},
  URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85048643343\&origin=inward},
  VOLUME = {14},
  PUBLISHER = {TextRelease},
  ADDRESS = {Amsterdam, Netherlands},
  ISSN = {1574-1796},
  JOURNAL = {The Grey Journal},
}

% LREC 2018 paper: overview of the LREC workshops, 1998-2016.
@INPROCEEDINGS{BARTOLINI_2018_INPROCEEDINGS_BGMP_387159,
  AUTHOR = {Bartolini, R. and Goggi, S. and Monachini, M. and Pardelli, G.},
  TITLE = {The {LREC} Workshops Map},
  YEAR = {2018},
  ABSTRACT = {The aim of this work is to present an overview of the research presented at the LREC workshops over the years 1998-2016 with the aim to shed light on the community represented by workshop participants in terms of country of origin, type of affiliation, gender. There has been also an effort towards the identification of the major topics dealt with as well as of the terminological variations noticed in this time span. 
Data has been retrieved from the portal of the European Language Resources Association (ELRA) which organizes the conference and the resulting corpus made up of workshops titles and of the related presentations has then been processed using a term extraction tool developed at ILC-CNR.},
  KEYWORDS = {corpus creation, terminology, LREC},
  PAGES = {557--562},
  URL = {http://www.lrec-conf.org/proceedings/lrec2018/summaries/639.html},
  PUBLISHER = {European Language Resources Association (ELRA)},
  ADDRESS = {Paris, France},
  ISBN = {979-10-95546-00-9},
  CONFERENCE_NAME = {Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
  CONFERENCE_PLACE = {Miyazaki, Japan},
  CONFERENCE_DATE = {7-12/05/2018},
  BOOKTITLE = {Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
  EDITOR = {Calzolari, N. and Choukri, K. and Cieri, C. and Declerck, T. and Goggi, S. and Hasida, K. and Isahara, H. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S. and Tokunaga, T.},
}

% LREC 2018 paper: the LRE Map revisited after eight years.
@INPROCEEDINGS{DELGRATTA_2018_INPROCEEDINGS_DGPC_387155,
  AUTHOR = {Del Gratta, R. and Goggi, S. and Pardelli, G. and Calzolari, N.},
  TITLE = {{LREMap}, a Song of Resources and Evaluation},
  YEAR = {2018},
  ABSTRACT = {After 8 years we revisit the LRE Map of Language Resources, introduced at LREC 2010, to try to get a picture of the field and its evolution as reflected by the creation and use of Language Resources. The purpose of the Map was in fact "to shed light on the vast amount of resources that represent the background of the research presented at LREC". It also aimed at a "change of culture in the field, actively engaging each researcher in the documentation task about resources". The data analysed here have been provided by the authors of several conferences during the phase of submission of papers, and contain information about ca. 7500 resources. 
We analysed the LRE Map data from many different viewpoints and the paper reports on the global picture, on different trends emerging from the diachronic perspective and finally on some comparisons between the 2 major conferences present in the Map: LREC and COLING.},
  KEYWORDS = {LR Infrastructure, Metadata, LR Documentation},
  PAGES = {1275--1281},
  URL = {http://www.lrec-conf.org/proceedings/lrec2018/summaries/300.html},
  PUBLISHER = {European Language Resources Association (ELRA)},
  ADDRESS = {Paris, France},
  ISBN = {979-10-95546-00-9},
  CONFERENCE_NAME = {Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
  CONFERENCE_PLACE = {Miyazaki, Japan},
  CONFERENCE_DATE = {7-12/05/2018},
  BOOKTITLE = {Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
  EDITOR = {Calzolari, N. and Choukri, K. and Cieri, C. and Declerck, T. and Goggi, S. and Hasida, K. and Isahara, H. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S. and Tokunaga, T.},
}

% GL19 proceedings paper: map of the documentation archived in the CLARIN infrastructure.
@INPROCEEDINGS{GOGGI_2018_INPROCEEDINGS_GPRBM_385571,
  AUTHOR = {Goggi, S. and Pardelli, G. and Russo, I. and Bartolini, R. 
and Monachini, M.},
  TITLE = {Providing Access to Grey Literature: The {CLARIN} Infrastructure},
  YEAR = {2018},
  ABSTRACT = {This work will provide a map of the documentation archived in the CLARIN infrastructure, whose purpose is to share language resources produced and managed in the various European countries but finally merged into the CLARIN data centers for allowing access, interoperability, reuse and preservation of scientific documentation as well as Grey Literature.},
  KEYWORDS = {CLARIN Infrastructure, Language Resources, Grey Literature},
  PAGES = {93--99},
  URL = {http://greyguide.isti.cnr.it/wp-content/uploads/2018/03/GL19_Conference_Proceedings.pdf},
  VOLUME = {19},
  PUBLISHER = {TextRelease},
  ADDRESS = {Amsterdam, Netherlands},
  ISBN = {978-90-77484-31-9},
  CONFERENCE_NAME = {Nineteenth International Conference on Grey Literature, GL19},
  CONFERENCE_PLACE = {Roma},
  CONFERENCE_DATE = {October 23-24, 2017},
  BOOKTITLE = {Nineteenth International Conference on Grey Literature ``Public Awareness and Access to Grey Literature''},
  EDITOR = {Farace, D. and Frantzen, J.},
}

% GL20 contribution: semantic analysis of WorldWideScience.org query logs.
@INPROCEEDINGS{GOGGI_2018_INPROCEEDINGS_GPBMBC_395584,
  AUTHOR = {Goggi, S. and Pardelli, G. and Bartolini, R. and Monachini, M. and Biagioni, S. and Carlesi, C.},
  TITLE = {Semantic query analysis from the global science gateway},
  YEAR = {2018},
  ABSTRACT = {We focused on building a corpus constituted by the query logs registered by the GreyGuide: Repository and Portal to Good Practices and Resources in Grey Literature and received by the WorldWideScience.org (The Global Science Gateway) portal: the aim is to retrieve information related to social media which as of today represent a considerable source of data more and more widely used for research ends. This project includes eight months of query logs registered between July 2017 and February 2018 for a total of 445,827 queries. 
The analysis mainly concentrates on the semantics of the queries received from the portal clients: it is a process of information retrieval from a rich digital catalogue whose language is dynamic, is evolving and follows - as well as reflects - the cultural changes of our modern society.},
  KEYWORDS = {Global Science Gateway, Semantic Query Analysis, Terminology},
  PAGES = {93--95},
  URL = {http://greyguide.isti.cnr.it/wp-content/uploads/2018/12/GL20_ProgramBook.pdf},
  VOLUME = {20},
  ISBN = {978-90-77484-34-0},
  CONFERENCE_NAME = {Twentieth International Conference on Grey Literature "Research Data Fuels and Sustains Grey Literature"},
  CONFERENCE_PLACE = {New Orleans, USA (Loyola University)},
  CONFERENCE_DATE = {December 3-4, 2018},
  BOOKTITLE = {Research Data Fuels and Sustains Grey Literature},
  EDITOR = {Farace, D. and Frantzen, J.},
}

% Journal article (The Grey Journal): terminological map of the GL conference papers, 2003-2014.
@ARTICLE{BARTOLINI_2017_ARTICLE_BPGGB_369103,
  AUTHOR = {Bartolini, R. and Pardelli, G. and Goggi, S. and Giannini, S. and Biagioni, S.},
  TITLE = {A terminological ``journey'' in the Grey Literature domain},
  YEAR = {2017},
  ABSTRACT = {"It is by means of terms that the expert usually transfer their knowledge and again through terms scientific communication reaches the highest effectiveness. Therefore we can assert that terminology - in the sense of a set of representative and domain-specific units - is necessary for representing and connecting specialized fields as well as any attempt to represent and/or transfer scientific knowledge requires, more or less extensively, the use of terminology." (Cabré, 2000). "When we read the articles or papers of a particular domain, we can recognize some lexical items in the texts as technical terms. In a domain where new knowledge is generated, new terms are constantly created to fulfill the needs of the domain, while others become obsolete. In addition, existing terms may undergo changes of meaning..." (Kageura K., 1998/1999). 
Specialized lexicons are made up of the terms which are specific to each field of knowledge, «a subset which is distinct but not separated from the common language» (Cassese, 1992): it is usually difficult to extract the relevant domain-specific terminology, meaning to discern terms which belong to a specialized glossary from those belonging to the common dictionary. The interest in the study of terminology and the "truth" contained in the above definitions has led us to make a "journey" in the Grey Literature (GL) domain in order to offer an overall vision on the terms used and the links between them. Within this scenario, the work analyzes a corpus constituted of the entire amount of full research papers published in the GL conference series over a time-span of more than one decade (2003-2014) with the aim of creating a terminological map of relevant words in the various GL research topics. "... corpora used to extract terminological units can be further investigated to find semantic and conceptual information on terms or to represent conceptual relationships between terms. (Bourigault D. et al., 2001). Another interesting inquiry is the terminology used in the GL conferences for describing the types of documents which can be detected (Pejšová P. et al., 2012).},
  KEYWORDS = {Grey Literature, Information Extraction IE, Terminology},
  PAGES = {41--53},
  URL = {http://www.greynet.org/thegreyjournal/currentissue.html},
  VOLUME = {13},
  PUBLISHER = {TextRelease},
  ADDRESS = {Amsterdam, Netherlands},
  ISSN = {1574-1796},
  JOURNAL = {The Grey Journal},
}

% Journal article (The Grey Journal): grey literature citations, 2012-2014.
@ARTICLE{GIANNINI_2017_ARTICLE_GBGP_369104,
  AUTHOR = {Giannini, S. and Biagioni, S. and Goggi, S. 
and Pardelli, G.},
  TITLE = {Grey Literature Citations in the age of Digital Repositories and Open Access},
  YEAR = {2017},
  ABSTRACT = {The work measures grey citations in the years 2012, 2013 and 2014 and then describes the features of GL documents cited in different areas of knowledge: Computational Linguistics, Computer Science and Engineering. With the aim of surveying a wide and varied range of resources, we selected a sample data based on the bibliographical references of articles contained in four journals - all indexed by Scopus Citation Database and ISI Web of Science, with an Impact Factor (IF) over the last three years - and two proceedings of international conferences held in 2012 and 2014.},
  KEYWORDS = {Grey Literature, Citations},
  PAGES = {23--31},
  URL = {http://www.greynet.org/thegreyjournal/currentissue.html},
  VOLUME = {13},
  PUBLISHER = {TextRelease},
  ADDRESS = {Amsterdam, Netherlands},
  ISSN = {1574-1796},
  JOURNAL = {The Grey Journal},
}

% GL18 proceedings paper: terminological map of the GL conference papers, 2003-2014.
@INPROCEEDINGS{BARTOLINI_2017_INPROCEEDINGS_BPGGB_368487,
  AUTHOR = {Bartolini, R. and Pardelli, G. and Goggi, S. and Giannini, S. and Biagioni, S.},
  TITLE = {A terminological ``journey'' in the Grey Literature domain},
  YEAR = {2017},
  ABSTRACT = {The work analyzes a corpus constituted of the entire amount of full research papers published in the GL conference series over a time-span of more than one decade (2003-2014) with the aim of creating a terminological map of relevant words in the various GL research topics. "... corpora used to extract terminological units can be further investigated to find semantic and conceptual information on terms or to represent conceptual relationships between terms. (Bourigault D. et al., 2001). Another interesting inquiry is the terminology used in the GL conferences for describing the types of documents which can be detected (Pejšová P. 
et al., 2012).},
  KEYWORDS = {Grey Literature, Information Extraction IE, Terminology},
  PAGES = {117--130},
  URL = {https://publications.cnr.it/doc/368487},
  VOLUME = {18},
  PUBLISHER = {TextRelease},
  ADDRESS = {Amsterdam, Netherlands},
  ISBN = {978-90-77484-30-2},
  CONFERENCE_NAME = {Eighteenth International Conference on Grey Literature (GL18): Leveraging Diversity in Grey Literature},
  CONFERENCE_PLACE = {New York, US},
  CONFERENCE_DATE = {November 28-29, 2016},
  BOOKTITLE = {Proceedings of the Eighteenth International Conference on Grey Literature (GL18): Leveraging Diversity in Grey Literature},
  EDITOR = {Farace, D. and Frantzen, J.},
}

% GL18 proceedings paper: geographical distribution of grey literature organizations.
@INPROCEEDINGS{PARDELLI_2017_INPROCEEDINGS_PGBRM_367782,
  AUTHOR = {Pardelli, G. and Goggi, S. and Bartolini, R. and Russo, I. and Monachini, M.},
  TITLE = {A Geographical Visualization of {GL} Communities: A Snapshot},
  YEAR = {2017},
  ABSTRACT = {This quotation stresses the important role of the several international organizations in producing and disseminating knowledge in the field of Grey Literature (GL): the paper aims to provide a first snapshot of the geographical distribution of GL organizations and their participation to the annual International Conference on Grey Literature over the time (in the period from 2003 to 2015. See List of Conferences on Table 2 ). Nowadays a visual representation of data is often associated with the traditional statistical graphs, in particular for representing complex phenomena by means of maps and diagrams, which allow a deeper and more focused analysis of the data. 
In our case the geographical representation of stakeholders in government, academics, business and industry aims at visualizing the GL community across the globe: it concerns 674 organizations which over the years have contributed to the development of a common vision on the most pressing issues of the field by using new paradigms such as Open Access and the social networks.},
  KEYWORDS = {Geographical Visualization, Grey Literature Communities},
  PAGES = {109--113},
  URL = {http://greyguide.isti.cnr.it/wp-content/uploads/2017/04/GL18_Conference_Proceedings.pdf},
  VOLUME = {18},
  PUBLISHER = {TextRelease},
  ADDRESS = {Amsterdam, Netherlands},
  ISBN = {978-90-77484-30-2},
  CONFERENCE_NAME = {Eighteenth International Conference on Grey Literature: Leveraging Diversity in Grey Literature},
  CONFERENCE_PLACE = {New York, US},
  CONFERENCE_DATE = {November 28-29, 2016},
  BOOKTITLE = {GL18 Conference Proceedings Eighteenth International Conference on Grey Literature: Leveraging Diversity in Grey Literature},
  EDITOR = {Farace, D. and Frantzen, J.},
}

% GL19 contribution: visual overview of the GreyNet community.
@INPROCEEDINGS{BARTOLINI_2017_INPROCEEDINGS_BGPRFF_377073,
  AUTHOR = {Bartolini, R. and Goggi, S. and Pardelli, G. and Russo, I. and Farace, D. and Frantzen, J.},
  TITLE = {Data Visualization of a Grey Literature Community: A Cooperative Project},
  YEAR = {2017},
  ABSTRACT = {The expected outcome of this project will not only produce a revised and updated publication of International Directory of Organizations in Grey Literature, IDGL, but will also provide a visual overview of GreyNet as an international organization serving diverse communities with shared interests in grey literature. 
It would be a demonstration of GreyNet's commitment to research, publication, open access, education, and public awareness in this field of library and information science.},
  KEYWORDS = {International Directory of Organizations in Grey Literature, Data Visualization},
  PAGES = {63},
  URL = {https://publications.cnr.it/doc/377073},
  VOLUME = {19},
  ISBN = {978-90-77484-32-6},
  CONFERENCE_NAME = {Nineteenth International Conference on Grey Literature, GL19},
  CONFERENCE_PLACE = {Rome, National Research Council, CNR},
  CONFERENCE_DATE = {October 23-24, 2017},
  BOOKTITLE = {Nineteenth International Conference on Grey Literature Public Awareness and Access to Grey Literature. Program Book},
  EDITOR = {Farace, D. and Frantzen, J.},
}

% GL19 contribution: CLARIN infrastructure as an access point to grey literature.
@INPROCEEDINGS{GOGGI_2017_INPROCEEDINGS_GPRBM_377070,
  AUTHOR = {Goggi, S. and Pardelli, G. and Russo, I. and Bartolini, R. and Monachini, M.},
  TITLE = {Providing Access to Grey Literature: The {CLARIN} Infrastructure},
  YEAR = {2017},
  ABSTRACT = {This work will provide a map of the documentation archived in the CLARIN infrastructure, whose purpose is to share language resources produced and managed in the various European countries but finally merged into the CLARIN data centers for allowing access, interoperability, reuse and preservation of scientific documentation as well as Grey Literature.},
  KEYWORDS = {CLARIN ERIC, Terminological Resources, Grey Literature},
  PAGES = {60--62},
  URL = {https://publications.cnr.it/doc/377070},
  VOLUME = {19},
  ISBN = {978-90-77484-32-6},
  CONFERENCE_NAME = {Nineteenth International Conference on Grey Literature, GL19},
  CONFERENCE_PLACE = {Rome, National Research Council, CNR},
  CONFERENCE_DATE = {October 23-24, 2017},
  BOOKTITLE = {Nineteenth International Conference on Grey Literature Public Awareness and Access to Grey Literature. Program Book},
  EDITOR = {Farace, D. and Frantzen, J.},
}

% AIUCD 2017 paper: bibliographic references of AIUCD and CLiC-it compared.
@INPROCEEDINGS{PARDELLI_2017_INPROCEEDINGS_PGBD_366597,
  AUTHOR = {Pardelli, G. and Giannini, S. and Boschetti, F. 
and Del Gratta, R.},
  TITLE = {{AIUCD} e {CLiC-it}: citazioni bibliografiche a confronto},
  YEAR = {2017},
  ABSTRACT = {Il lavoro propone l'analisi e il confronto dei riferimenti bibliografici delle cinque edizioni annuali della Conferenza dell'Associazione per l'Informatica Umanistica e la Cultura Digitale (AIUCD) e del primo biennio (2014-2015) della Conferenza Italiana di Linguistica Computazionale (CLiC-it) per misurare la direzione in cui si muove il trend citazionale. L'analisi muove dal principio di rilevanza della citazione nella trasmissione della conoscenza in un periodo di grandi cambiamenti socioculturali e di importanti evoluzioni nelle modalità di produzione e diffusione dei risultati della ricerca scientifica. Lo scopo dello studio è quello di misurare la gamma delle risorse citate in questa area del sapere mediante l'uso di indicatori volti a comprendere la loro ampiezza, l'estensione temporale, la varietà, le relazioni con il mondo editoriale e i modelli di riferimento. L'osservazione dei risultati consente di classificare i documenti citati, di descriverne le caratteristiche e di valutare eventuali trasformazioni rispetto alle modalità di citazione tradizionali. -------------------------------------------------------------------------------------------------------------------------------------------------------------------------- The paper suggests the analysis of the bibliographic references - enclosed in the proceedings of the Italian Conference on Computational Linguistics - CLICit in 2014-2015 biennium and of five AIUCD Conference editions 2012-2016. The analysis moves from the principle of relevance of citation in the transmission of knowledge in a period of great socio-cultural changes and important developments in the production and dissemination of the results in the scientific research. 
The purpose of the study is to measure the range of resources cited in this area of knowledge by the use of indicators aimed in understanding their wideness, the time extension, the variety, the relations with the publishing world and the reference models. The observation of the results allows to classify the cited document, to describe its characteristics and to assess any changes compared to the traditional citation mode.},
  KEYWORDS = {Corpus bibliografico, Analisi di metadati},
  PAGES = {38--50},
  URL = {http://aiucd2017.aiucd.it/wp-content/uploads/2017/01/book-of-abstract-AIUCD-2017.pdf},
  CONFERENCE_NAME = {AIUCD 2017 Conference \& 3rd EADH Day},
  CONFERENCE_PLACE = {Roma, Università "Sapienza"},
  CONFERENCE_DATE = {24-28 January 2017},
  BOOKTITLE = {AIUCD 2017 Conference},
}

% Journal article (The Grey Journal): final results of the MAPS project.
@ARTICLE{GOGGI_2016_ARTICLE_GPBFMMDB_359144,
  AUTHOR = {Goggi, S. and Pardelli, G. and Bartolini, R. and Frontini, F. and Monachini, M. and Manzella, G. and De Mattei, M. and Bustaffa, F.},
  TITLE = {A semantic engine for grey literature retrieval in the oceanography domain},
  YEAR = {2016},
  ABSTRACT = {Here we present the final results of the MAPS (Marine Planning and Service Platform) project, an environment designed for gathering, classifying, managing and accessing marine scientific literature and data, making it available for search to Operative Oceanography researchers of various institutions by means of standard protocols. The system takes as input non-textual data (measurements) and text - both published papers and documentation - and it provides an advanced search facility thanks to the rich set of metadata and, above all, to the possibility of a refined and domain targeted key-word indexing of texts using Natural Language Processing (NLP) techniques. 
The paper describes the system in its details providing also evidence of evaluation.},
  KEYWORDS = {Information Extraction, Search Engine, Operative Oceanography},
  PAGES = {155--161},
  URL = {http://www.greynet.org/thegreyjournal/currentissue.html},
  VOLUME = {12},
  PUBLISHER = {TextRelease},
  ADDRESS = {Amsterdam, Netherlands},
  ISSN = {1574-1796},
  JOURNAL = {The Grey Journal},
}

% LREC 2016 paper: the LREMap rendered as a force-directed graph.
@INPROCEEDINGS{DELGRATTA_2016_INPROCEEDINGS_DFMPRBKSC_355425,
  AUTHOR = {Del Gratta, R. and Frontini, F. and Monachini, M. and Pardelli, G. and Russo, I. and Bartolini, R. and Khan, F. and Soria, C. and Calzolari, N.},
  TITLE = {{LREC} as a Graph: People and Resources in a Network},
  YEAR = {2016},
  ABSTRACT = {This proposal describes a new way to visualise resources in the LREMap, a community-built repository of language resource descriptions and uses. The LREMap is represented as a force-directed graph, where resources, papers and authors are nodes. The analysis of the visual representation of the underlying graph is used to study how the community gathers around LRs and how LRs are used in research.},
  KEYWORDS = {Language Resources, Resources Documentation, Data Visualisation},
  PAGES = {2529--2532},
  URL = {http://www.lrec-conf.org/proceedings/lrec2016/index.html},
  PUBLISHER = {European Language Resources Association (ELRA)},
  ADDRESS = {Paris, France},
  ISBN = {978-2-9517408-9-1},
  CONFERENCE_NAME = {Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
  CONFERENCE_PLACE = {Portoroz, Slovenia},
  CONFERENCE_DATE = {23-28 May 2016},
  BOOKTITLE = {Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
  EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Goggi, S. and Grobelnik, M. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S.},
}

% GL17 conference paper: grey literature citations, 2012-2014.
@INPROCEEDINGS{GIANNINI_2016_INPROCEEDINGS_GBGP_348024,
  AUTHOR = {Giannini, S. and Biagioni, S. and Goggi, S. 
and Pardelli, G.},
  TITLE = {Grey Literature citations in the age of Digital Repositories and Open Access},
  YEAR = {2016},
  ABSTRACT = {The work measures grey citations in the years 2012, 2013 and 2014 and then describes the features of GL documents cited in different areas of knowledge: Computational Linguistics, Computer Science and Engineering. With the aim of surveying a wide and varied range of resources, we selected a sample data based on the bibliographical references of articles contained in four journals - all indexed by Scopus Citation Database and ISI Web of Science, with an Impact Factor (IF) over the last three years - and two proceedings of international conferences held in 2012 and 2014.},
  KEYWORDS = {Grey Literature Citations},
  PAGES = {137--145},
  URL = {https://publications.cnr.it/doc/348024},
  VOLUME = {17},
  ISBN = {978-90-77484-27-2},
  CONFERENCE_NAME = {Seventeenth International Conference on Grey Literature: A New Wave of Textual and Non-Textual Grey literature},
  CONFERENCE_PLACE = {Amsterdam, NL},
  CONFERENCE_DATE = {1-2 December 2015},
  BOOKTITLE = {A New Wave of Textual and Non-Textual Grey literature},
}

% GL17 conference paper: final results of the MAPS project.
@INPROCEEDINGS{GOGGI_2016_INPROCEEDINGS_GPBFMMDB_350374,
  AUTHOR = {Goggi, S. and Pardelli, G. and Bartolini, R. and Frontini, F. and Monachini, M. and Manzella, G. and De Mattei, M. and Bustaffa, F.},
  TITLE = {A semantic engine for grey literature retrieval in the oceanography domain},
  YEAR = {2016},
  ABSTRACT = {Here we present the final results of the MAPS (Marine Planning and Service Platform) project, an environment designed for gathering, classifying, managing and accessing marine scientific literature and data, making it available for search to Operative Oceanography researchers of various institutions by means of standard protocols. 
The system takes as input non-textual data (measurements) and text - both published papers and documentation - and it provides an advanced search facility thanks to the rich set of metadata and, above all, to the possibility of a refined and domain targeted key-word indexing of texts using Natural Language Processing (NLP) techniques. The paper describes the system in its details providing also evidence of evaluation.},
  KEYWORDS = {Information Extraction, Search Engine, Operative Oceanography},
  PAGES = {104--111},
  URL = {https://publications.cnr.it/doc/350374},
  VOLUME = {17},
  ISBN = {978-90-77484-27-2},
  CONFERENCE_NAME = {Seventeenth International Conference on Grey Literature. A New Wave of Textual and Non-Textual Grey Literature},
  CONFERENCE_PLACE = {Amsterdam},
  CONFERENCE_DATE = {December 1st-2nd 2015},
  BOOKTITLE = {A New Wave of Textual and Non-Textual Grey Literature},
  EDITOR = {Farace, D. and Frantzen, J.},
}

% LREC 2016 paper: terminology in European Framework Programme project titles, 1994-2012.
@INPROCEEDINGS{PARDELLI_2016_INPROCEEDINGS_PGGB_355458,
  AUTHOR = {Pardelli, G. and Goggi, S. and Giannini, S. and Biagioni, S.},
  TITLE = {Two decades of terminology: {European} framework programmes titles},
  YEAR = {2016},
  ABSTRACT = {This work analyses a corpus made of the titles of research projects belonging to the last four European Commission Framework Programmes (FP4, FP5, FP6, FP7) during a time span of nearly two decades (1994-2012). The starting point is the idea of creating a corpus of titles which would constitute a terminological niche, a sort of "cluster map" offering an overall vision on the terms used and the links between them. Moreover, by performing a terminological comparison over a period of time it is possible to trace the presence of obsolete words in outdated research areas as well as of neologisms in the most recent fields. 
Within this scenario, the minimal purpose is to build a corpus of titles of European projects belonging to the several Framework Programmes in order to obtain a terminological mapping of relevant words in the various research areas: particularly significant would be those terms spread across different domains or those extremely tied to a specific domain. A term could actually be found in many fields and being able to acknowledge and retrieve this cross-presence means being able to linking those different domains by means of a process of terminological mapping.}, KEYWORDS = {Terminology Extraction, Natural Language Processing, Terminological Comparison}, PAGES = {373--378}, URL = {http://www.lrec-conf.org/proceedings/lrec2016/index.html}, PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)}, ISBN = {978-2-9517408-9-1}, CONFERENCE_NAME = {LREC 2016-Tenth International Conference on Language Resources and Evaluation}, CONFERENCE_PLACE = {Portoroz, Slovenia}, CONFERENCE_DATE = {23-28 May 2016}, EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Goggi, S. and Grobelnik, M. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S.}, } @INPROCEEDINGS{BARTOLINI_2016_INPROCEEDINGS_BPGGB_362848, AUTHOR = {Bartolini, R. and Pardelli, G. and Goggi, S. and Giannini, S. and Biagioni, S.}, TITLE = {A terminological "journey" in the Grey Literature domain}, YEAR = {2016}, ABSTRACT = {"When we read the articles or papers of a particular domain, we can recognize some lexical items in the texts as technical terms. In a domain where new knowledge is generated, new terms are constantly created to fulfil the needs of the domain, while others become obsolete. In addition, existing terms may undergo changes of meaning..." (Kageura K.,1998/1999). According to Kageura, our aim with this work is to make a "journey" in the Grey Literature (GL) domain in order to offer an overall vision on the terms used and the links between them. 
Moreover, by performing a terminological comparison over a given period of time it could be possible to trace the presence of obsolete words as well as of neologisms in the most recent research fields. Within this scenario, the work analyzes a corpus constituted of the entire amount of full research papers published in the GL conference series over a time span of more than one decade (2003-2014) with the aim of creating a terminological map of relevant words. "... corpora used to extract terminological units can be further investigated to find semantic and conceptual information on terms or to represent conceptual relationships between terms." (Bourigault D. et al., 2001). Another interesting inquiry is the terminology used in the GL conferences for describing the types of documents (Pejšová P. et al., 2012). The work is split up in four sections: creation of the corpus by acquiring the digital papers of GL conference proceedings (GL5 - GL16); data cleaning; data processing; terminological analysis and comparison. The corpus - made up of 231 research papers (for a total amount of 785.042 tokens) - was processed using a Natural Language Processing (NLP) tool for term extraction developed at the Institute of Computational Linguistics "Antonio Zampolli" of CNR (Goggi et al. 2015; 2016). This tool is what is called a "pipeline" (that is, a sequence of different tools) which extracts lexical knowledge from texts: in short, this is a rule system tool for knowledge extraction and document indexing that combines NLP technologies for term extraction and techniques to measure the associative strength of multi-words. This tool extracts a list of single (monograms) and multi-word terms (bigrams and trigrams) ordered by frequency with respect to the context. The pipeline - used as semantic engine within the MAPS project - has been customized for the extraction of terms from our corpus. 
This survey on the results of the information extraction process performed by the described NLP tool has been a sort of linguistic path in the past and present of terminology used in GL proceedings. By means of samplings, it has been possible to obtain the terminological flow in GL domain and to determine if and how the lexicon was evolving over these twelve years and investigate on its dynamic nature.}, KEYWORDS = {Grey Literature, Digital Repositories, Open Access}, PAGES = {79--84}, URL = {https://publications.cnr.it/doc/362848}, VOLUME = {18}, ISBN = {978-90-77484-29-6}, CONFERENCE_NAME = {GL18-Eighteenth International Conference on Grey Literature: Leveraging Diversity in Grey Literature}, CONFERENCE_PLACE = {New York, US}, CONFERENCE_DATE = {28-29 November 2016}, BOOKTITLE = {Leveraging Diversity in Grey Literature}, EDITOR = {Farace, D. and Frantzen, J.}, } @INPROCEEDINGS{PARDELLI_2016_INPROCEEDINGS_PGMBR_362073, AUTHOR = {Pardelli, G. and Goggi, S. and Monachini, M. and Bartolini, R. and Russo, I.}, TITLE = {A Geographical Visualization of GL Community: a Snapshot}, YEAR = {2016}, ABSTRACT = {"Today, in the spirit of science, grey literature communities are called to demonstrate their know-how and merit to wider audiences" [Farace Dominic J., 2011]. This quotation stresses the important role of the several international organizations in producing and disseminating knowledge in the field of Grey Literature (GL): the paper aims to provide a first snapshot of the geographical distribution of GL organizations and their participation to the annual International Conference on Grey Literature over the time (in the period from 2003 to 2015). Nowadays a visual representation of data is often associated with the traditional statistical graphs, in particular for representing complex phenomena by means of maps and diagrams, which allow a deeper and more focused analysis of the data. 
In our case the geographical representation of stakeholders in government, academics, business and industry aims at visualizing the GL community across the globe: it concerns 675 organizations which over the years have contributed to the development of a common vision on the most pressing issues of the field by using new paradigms such as Open Access and the social networks.}, KEYWORDS = {Geographical Visualization, Grey Literature}, PAGES = {67}, URL = {https://publications.cnr.it/doc/362073}, VOLUME = {18}, ISBN = {978-90-77484-29-6}, CONFERENCE_NAME = {Eighteenth International Conference on Grey Literature: Leveraging Diversity in Grey Literature}, CONFERENCE_PLACE = {New York}, CONFERENCE_DATE = {November 28-29, 2016}, BOOKTITLE = {GL18 Program Book}, EDITOR = {Farace, D. and Frantzen, J.}, } @ARTICLE{GIANNINI_2015_ARTICLE_GBGP_329507, AUTHOR = {Giannini, S. and Biagioni, S. and Goggi, S. and Pardelli, G.}, TITLE = {Mapping Italian grey communities: what is there beyond the Academy?}, YEAR = {2015}, ABSTRACT = {This research aims at verifying whether - and eventually how much - the grey literature available on the web is actually structured, accessible or even managed by systems dealing with its organization and aiming at its retrieval and storing. The utmost goal is to build up a map of non-academic communities and their mechanisms for managing, presenting and disseminating this type of material. It is a sort of journey among the streams of the Web, which channel meeting minutes, manifests, fliers, pictures, newspapers articles, journalistic services and audio/video material on various topics. These "grey" products - by conveying basic information about social and popular culture - store, represent and spread knowledge.}, KEYWORDS = {Italian Grey Literature, A. 
1 INTRODUCTORY AND SURVEY}, PAGES = {17--28}, URL = {http://www.greynet.org/thegreyjournal.html}, VOLUME = {11}, PUBLISHER = {TextRelease (Amsterdam, Paesi Bassi)}, ISSN = {1574-1796}, JOURNAL = {The Grey journal (Print)}, } @ARTICLE{GOGGI_2015_ARTICLE_GMFBPDBM_334894, AUTHOR = {Goggi, S. and Monachini, M. and Frontini, F. and Bartolini, R. and Pardelli, G. and De Mattei, M. and Bustaffa, F. and Manzella, G.}, TITLE = {Marine Planning and Service Platform (MAPS): An Advanced Research Engine for Grey Literature in Marine Science}, YEAR = {2015}, ABSTRACT = {The MAPS (Marine Planning and Service Platform) project is a development of the Marine project (Ricerca Industriale e Sviluppo Sperimentale Regione Liguria 2007-2013) aiming at building a computer platform for supporting a Marine Information and Knowledge System, as part of the data management activities. One of the main objective of the project is to develop a repository that should gather, classify and structure marine scientific literature and data thus guaranteeing their accessibility to researchers and institutions by means of standard protocols. We will present the scenario of the Operative Oceanography together with the technologies used to develop an advanced search engine which aims at providing rapid and efficient access to a Digital Library of oceanographic data. The case-study is also highlighting how the retrieval of grey literature from this specific marine community could be reproduced for similar communities as well, thus revealing the great impact that the processing, re-use as well as application of grey data have on societal needs/problems and their answers.}, KEYWORDS = {Marine Science Search Engine Source Data Oceanography}, PAGES = {171--178}, URL = {https://publications.cnr.it/doc/334894}, VOLUME = {11}, PUBLISHER = {TextRelease (Amsterdam, Paesi Bassi)}, ISSN = {1574-1796}, JOURNAL = {The Grey journal (Print)}, } @ARTICLE{GOGGI_2015_ARTICLE_GPGBB_329873, AUTHOR = {Goggi, S. and Pardelli, G. 
and Giannini, S. and Biagioni, S. and Battisti, M.}, TITLE = {La littérature grise des projets de recherche européens}, YEAR = {2015}, ABSTRACT = {Les projets scientifiques financés par la Commission européenne produisent de la littérature grise. Une étude menée en 2013 sur 226 projets CNR du 7e programme-cadre (2007-2013) a analysé la typologie, le format et la disponibilité des documents signalés sur le serveur Cordis (rapports de recherche et articles scientifiques) et les sites projets (contenant listes de partenaires, brochures, communiqués,...}, KEYWORDS = {Grey Literature, European Commission Projects}, PAGES = {34}, URL = {http://www.cairn.info/revue-i2d-information-donnees-et-documents-2015-1-p-34.htm}, VOLUME = {52}, DOI = {10.3917/i2d.151.0034}, PUBLISHER = {A. D. B. S (Paris, Francia)}, ISSN = {0012-4508}, JOURNAL = {I2D-Information, données \& documents. Pratiques \& recherches}, } @INPROCEEDINGS{DELGRATTA_2015_INPROCEEDINGS_DFMPRBGKQSC_342213, AUTHOR = {Del Gratta, R. and Frontini, F. and Monachini, M. and Pardelli, G. and Russo, I. and Bartolini, R. and Goggi, S. and Khan, F. and Quochi, V. and Soria, C. and Calzolari, N.}, TITLE = {Visualising Italian Language Resources: a Snapshot}, YEAR = {2015}, ABSTRACT = {This paper aims to provide a first snapshot of Italian Language Resources (LRs) and their uses by the community, as documented by the papers presented at two different conferences, LREC2014 and CLiC-it 2014. The data of the former were drawn from the LOD version of the LRE Map, while those of the latter come from manually analyzing the proceedings. 
The results are presented in the form of visual graphs and confirm the initial hypothesis that Italian LRs require concrete actions to enhance their visibility.}, KEYWORDS = {Italian Language Resources}, PAGES = {100--104}, URL = {https://books.openedition.org/aaccademia/1277?lang=it}, ISBN = {978-88-99200-62-6}, CONFERENCE_NAME = {Second Italian Conference on Computational Linguistics CLiC-it 2015}, CONFERENCE_PLACE = {Trento}, CONFERENCE_DATE = {3-4 December 2015}, BOOKTITLE = {Proceedings of the Second Italian Conference on Computational Linguistics CLiC-it 2015}, EDITOR = {Bosco, C. and Tonelli, S. and Zanzotto, F. M.}, } @INPROCEEDINGS{GIANNINI_2015_INPROCEEDINGS_GBGP_329374, AUTHOR = {Giannini, S. and Biagioni, S. and Goggi, S. and Pardelli, G.}, TITLE = {Mapping Italian grey communities: what is there beyond the Academy?}, YEAR = {2015}, ABSTRACT = {This research aims at verifying whether - and eventually how much - the grey literature available on the web is actually structured, accessible or even managed by systems dealing with its organization and aiming at its retrieval and storing. The utmost goal is to build up a map of non-academic communities and their mechanisms for managing, presenting and disseminating this type of material. It is a sort of journey among the streams of the Web, which channel meeting minutes, manifests, fliers, pictures, newspapers articles, journalistic services and audio/video material on various topics. These "grey" products - by conveying basic information about social and popular culture - store, represent and spread knowledge.}, KEYWORDS = {Italian Grey Literature, A. 
1 INTRODUCTORY AND SURVEY}, PAGES = {17--29}, URL = {http://www.textrelease.com/publications/proceedings.html}, VOLUME = {16}, PUBLISHER = {TextRelease (Amsterdam, NLD)}, ISBN = {978-90-77484-23-4}, CONFERENCE_NAME = {GL16-Sixteenth International Conference on Grey Literature Grey Literature Lobby: Engines and Requesters for Change}, CONFERENCE_PLACE = {Washington DC, USA (Library of Congress)}, CONFERENCE_DATE = {8-9 December 2014}, BOOKTITLE = {Grey Literature Lobby: Engines and Requesters for Change}, EDITOR = {Farace, D. and Frantzen, J.}, } @INPROCEEDINGS{GOGGI_2015_INPROCEEDINGS_GMFBPDBM_329370, AUTHOR = {Goggi, S. and Monachini, M. and Frontini, F. and Bartolini, R. and Pardelli, G. and De Mattei, M. and Bustaffa, F. and Manzella, G.}, TITLE = {Marine Planning and Service Platform (MAPS): An Advanced Research Engine for Grey Literature in Marine Science}, YEAR = {2015}, ABSTRACT = {The MAPS (Marine Planning and Service Platform) project is a development of the Marine project (Ricerca Industriale e Sviluppo Sperimentale Regione Liguria 2007-2013) aiming at building a computer platform for supporting a Marine Information and Knowledge System, as part of the data management activities. One of the main objective of the project is to develop a repository that should gather, classify and structure marine scientific literature and data thus guaranteeing their accessibility to researchers and institutions by means of standard protocols. We will present the scenario of the Operative Oceanography together with the technologies used to develop an advanced search engine which aims at providing rapid and efficient access to a Digital Library of oceanographic data. 
The case-study is also highlighting how the retrieval of grey literature from this specific marine community could be reproduced for similar communities as well, thus revealing the great impact that the processing, re-use as well as application of grey data have on societal needs/problems and their answers.}, KEYWORDS = {Marine Science Search Engine Source Data Oceanography}, PAGES = {108--114}, URL = {http://www.textrelease.com/gl16program.html}, VOLUME = {16}, PUBLISHER = {TextRelease (Amsterdam, NLD)}, ISBN = {978-90-77484-23-4}, CONFERENCE_NAME = {Sixteenth International Conference on Grey Literature Grey Literature Lobby: Engines and Requesters for Change}, CONFERENCE_PLACE = {Library of Congress Washington D. C., USA}, CONFERENCE_DATE = {December 8-9 2014}, BOOKTITLE = {Grey Literature Lobby: Engines and Requesters for Change}, EDITOR = {Farace, D. and Frantzen, J.}, } @INPROCEEDINGS{GOGGI_2015_INPROCEEDINGS_GPSGB_318501, AUTHOR = {Goggi, S. and Pardelli, G. and Sassi, M. and Giannini, S. and Biagioni, S.}, TITLE = {A terminological survey on the titles of the Seventh Framework Programme (FP7)}, YEAR = {2015}, ABSTRACT = {This paper focuses on the automatic extraction of domain-specific knowledge from the European Commission projects of the 7th Framework Programme, hereinafter referred as FP7. The study is divided in three parts: the first part introduces the work starting from the building up of a corpus containing the titles of European Projects of the whole FP7 in order to obtain a relevant terminological sample for the different domains; the second describes software and methods while the third part focuses on the evaluation of results. Finally, we conclude by suggesting possible directions for further development of a comparison between terminological extraction from FP7 and FP5/FP6.}, KEYWORDS = {7th Framework Programme (FP7), Natural Language Processing, Terminology, Knowledge extraction, Grey Literature, I. 2. 7 Natural Language Processing. 
Text analysis, I. 2. 1 Applications and Expert Systems. Natural language interfaces}, PAGES = {223--227}, URL = {https://publications.cnr.it/doc/318501}, ISBN = {978-959-7174-28-8}, CONFERENCE_NAME = {Fourteenth International Symposium on Comunicación Social: retos y perspectivas}, CONFERENCE_PLACE = {Santiago de Cuba}, CONFERENCE_DATE = {19-23 de enero 2015}, EDITOR = {Ruiz Miyares, L. and Álvarez Silva, M. R. and Muñoz Alvarado, A.}, } @INPROCEEDINGS{GIANNINI_2015_INPROCEEDINGS_GBGP_342303, AUTHOR = {Giannini, S. and Biagioni, S. and Goggi, S. and Pardelli, G.}, TITLE = {Grey Literature citations in the age of Digital Repositories and Open Access}, YEAR = {2015}, ABSTRACT = {The work measures grey citations in the years 2012, 2013 and 2014 and then describes the features of GL documents cited in different areas of knowledge: Computational Linguistics, Computer Science and Engineering. With the aim to survey a wide and varied range of resources, we selected a sample data based on the bibliographic references of articles contained in 4 journals - all indexed by the ISI Web of Science and with an Impact Factor over the last three years - and two proceedings of international conferences held in 2012 and 2014.}, KEYWORDS = {Grey Literature, Digital Repositories, Open Access}, PAGES = {109--110}, URL = {http://greyguide.isti.cnr.it/attachments/category/27/GL17_Program_Book.pdf}, VOLUME = {17}, ISBN = {978-90-77484-26-5}, CONFERENCE_NAME = {Seventeenth International Conference on Grey Literature. A New Wave of Textual and Non-Textual Grey Literature}, CONFERENCE_PLACE = {Amsterdam, NL}, CONFERENCE_DATE = {December 1-2, 2015}, BOOKTITLE = {GL17 Program Book}, EDITOR = {Farace, D. and Frantzen, J.}, } @INPROCEEDINGS{GOGGI_2015_INPROCEEDINGS_GPBFMMDB_342221, AUTHOR = {Goggi, S. and Pardelli, G. and Bartolini, R. and Frontini, F. and Monachini, M. and Manzella, G. and De Mattei, M. 
and Bustaffa, F.}, TITLE = {A semantic engine for grey literature retrieval in the oceanography domain}, YEAR = {2015}, ABSTRACT = {Here we present the final results of MAPS (Marine Planning and Service Platform), an environment designed for gathering, classifying, managing and accessing marine scientific literature and data, making it available for search to Operative Oceanography researchers of various institutions by means of standard protocols. In previous publications the general architecture of the system as well as the set of metadata (Common Data Index) used to describe the documents were presented [3]; it was shown how individual oceanographic data-sets could be indexed within the MAPS library by types of measure, measurement tools, geographic areas, and also linked to specific textual documentation. Documentation is described using the current international standards: Title, Authors, Publisher, Language, Date of publication, Body/Institution, Abstract, etc.; serial publications are described in terms of ISSN, while books are assigned ISBN; content of various types on electronic networks is described by means of doi and url. Each description is linked to the document. Thanks to this, the MAPS library already enables researchers to go from structured oceanographic data to documents describing it. But this was not enough: documents may contain important information that has not been encoded in the metadata. Thus an advanced Search Engine was put in place that uses semantic-conceptual technologies in order to extract key concepts from unstructured text such as technical documents (reports and grey literature) and scientific papers and to make them indexable and searchable by the end user in the same way as the structured data (such as oceanographic observations and metadata) is. 
More specifically once a document is uploaded in the MAPS library, key domain concepts in documents are extracted via a natural language processing pipeline and used as additional information for its indexing. The key term identification algorithm is based on marine concepts that were pre-defined in a domain ontology, but crucially it also allows for the discovery of new related concepts. So for instance starting from the domain term salinity, related terms such as sea salinity and average sea salinity will also be identified as key terms and used for indexing and searching documents. A hybrid search system is then put in place, where users can search the library by metadata or by free text queries. In the latter case, the NLP pipeline performs an analysis of the text of the query, and when key concepts are matched, the relevant documents are presented. The results may be later refined by using other structured information (e.g. date of publication, area, ...). Currently a running system has been put in place, with data from satellites, buoys and sea stations; such data is documented and searchable by its relevant metadata and documentation. Results of quantitative evaluation in terms of information retrieval measures will be presented in the poster; more specifically, given an evaluation set defined by domain experts and composed of pre-defined queries together with documents that answer such queries, it will be shown how the system is highly accurate in retrieving the correct documents from the library. 
Though this work focuses on oceanography, its results may be easily extended to other domains; more generally, the possibility of enhancing the visibility and accessibility of grey literature via its connection to the data it describes and to an advanced full text indexing are of great relevance for the topic of this conference.}, KEYWORDS = {Information Extraction, Search Engine, Oceanography}, PAGES = {76--77}, URL = {https://publications.cnr.it/doc/342221}, VOLUME = {17}, ISBN = {978-90-77484-26-5}, CONFERENCE_NAME = {Seventeenth International Conference on Grey Literature. A New Wave of Textual and Non-Textual Grey Literature}, CONFERENCE_PLACE = {Amsterdam}, CONFERENCE_DATE = {December 1-2, 2015}, BOOKTITLE = {GL17 Program Book}, EDITOR = {Farace, D. and Frantzen, J.}, } @ARTICLE{GOGGI_2014_ARTICLE_GPGB_284602, AUTHOR = {Goggi, S. and Pardelli, G. and Giannini, S. and Biagioni, S.}, TITLE = {Grey Literature in European Commission Projects}, YEAR = {2014}, ABSTRACT = {The survey is focused on the documentation produced by the European Commission (EC) projects involved in the Framework Programme for Research and Technological Development (hereafter FP7) and managed by the Italian National Research Council (hereafter CNR). In particular, the Grey Literature (GL) available on CORDIS and European Projects websites was analysed. In order to verify how it is managed and whether it is compliant with EC recommendations, some categories were introduced to identify, measure and evaluate the usability and availability of projects production. Data was obtained from a sample of European projects websites.}, KEYWORDS = {Grey Literature, European Commission Projects}, PAGES = {133--144}, URL = {http://www.greynet.org/thegreyjournal/previousissues.html}, VOLUME = {10}, PUBLISHER = {TextRelease (Amsterdam, Paesi Bassi)}, ISSN = {1574-1796}, JOURNAL = {The Grey journal (Print)}, } @ARTICLE{SASSI_2014_ARTICLE_SBP_280559, AUTHOR = {Sassi, M. and Biagioni, S. 
and Pardelli, G.}, TITLE = {A Linguistic and Gender Approach to 1841 Tuscany Population Census}, YEAR = {2014}, ABSTRACT = {The Census of 1841 in Tuscany was the first official data registry which tried to describe Tuscan population as a whole on the basis of the Granducato's territory. With the use of special ad-hoc created forms, all demographic and socioeconomic characteristics of families and single persons in "Granducato di Toscana" were described. Work is developed in five points: (1) informatics retrieval of linguistic information from Tuscany of 1800 focused by the arts and craftsmanship more in use in families of that time; (2) gender division of works and craftsmanship; (3) observation of lexical disparity in the four communities and terminological curiosities of that historical period; (4) actually no longer existing craftsmanship; and (5) diachronic analysis of communities, where possible. In this scenario, the authors will introduce the methodology they used for data analysis. Tables and figures will be used to better focus different moments and results of the work. A Glossary in Appendix will contain the English translation of the Italian terms extracted from the Corpus.}, KEYWORDS = {Tuscany Population Census, sociological analysis, gender analysis, the 19th work terminology, linguistic statistics}, PAGES = {318--329}, URL = {http://www.davidpublishing.com/show.html?16049}, VOLUME = {12}, PUBLISHER = {USA-China Business Review (Journal), Inc (New York, NY, Stati Uniti d'America)}, ISSN = {1539-8080}, JOURNAL = {US-China foreign language}, } @INPROCEEDINGS{DELGRATTA_2014_INPROCEEDINGS_DPS_281039, AUTHOR = {Del Gratta, R. and Pardelli, G. and Goggi, S.}, TITLE = {The LRE Map disclosed}, YEAR = {2014}, ABSTRACT = {This paper describes a serialization of the LRE Map database according to the RDF model. Due to the peculiar nature of the LRE Map, many ontologies are necessary to model the map in RDF, including newly created and reused ontologies. 
The importance of having the LRE Map in RDF and its connections to other open resources is also addressed.}, KEYWORDS = {Language Resource, LOD, Metadata}, PAGES = {3534--3541}, URL = {http://www.lrec-conf.org/proceedings/lrec2014/index.html}, PUBLISHER = {EUROPEAN LANGUAGE RESOURCES ASSOC-ELRA FRANCE (Parigi, FRA)}, ISBN = {978-2-9517408-8-4}, CONFERENCE_NAME = {Ninth International Conference on Language Resources and Evaluation (LREC'14)}, CONFERENCE_PLACE = {Reykjavik, Iceland}, CONFERENCE_DATE = {26-31 May 2014}, BOOKTITLE = {Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC'14)}, EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Loftsson, H. and Maegaard, B. and Mariani, J. and Moreno, A. and Odijk, J. and Piperidis, S.}, } @INPROCEEDINGS{GOGGI_2014_INPROCEEDINGS_GPGB_280394, AUTHOR = {Goggi, S. and Pardelli, G. and Giannini, S. and Biagioni, S.}, TITLE = {Grey Literature in European Commission Projects}, YEAR = {2014}, ABSTRACT = {The survey is focused on the documentation produced by the European Commission (EC) projects involved in the Framework Programme for Research and Technological Development (hereafter FP7) and managed by the Italian National Research Council (hereafter CNR). In particular, the Grey Literature (GL) available on CORDIS and European Projects websites was analysed. In order to verify how it is managed and whether it is compliant with EC recommendations, some categories were introduced to identify, measure and evaluate the usability and availability of projects production. Data was obtained from a sample of European projects websites.}, KEYWORDS = {Grey Literature, European Commission Projects, A. 1 INTRODUCTORY AND SURVEY}, PAGES = {98--109}, URL = {https://publications.cnr.it/doc/280394}, VOLUME = {15}, ISBN = {978-90-77484-22-7}, CONFERENCE_NAME = {GL15-Fifteenth International Conference on Grey Literature. 
The Grey Audit: a Field Assessment in Grey Literature}, CONFERENCE_PLACE = {Bratislava, Slovakia}, CONFERENCE_DATE = {2-3 December 2013}, BOOKTITLE = {The Grey Audit: a Field Assessment in Grey Literature}, EDITOR = {Farace, D. J. and Frantzen, J. and Service, G. I. L. N.}, } @INPROCEEDINGS{BIAGIONI_2014_INPROCEEDINGS_BDGP_280391, AUTHOR = {Biagioni, S. and Deluca, R. and Giannini, S. and Pardelli, G.}, TITLE = {I sistemi informativi della Biblioteca dell'Area della Ricerca di Pisa}, YEAR = {2014}, ABSTRACT = {Description of the CNR Library, (Pisa, Italy) and its services.}, KEYWORDS = {Sistemi informativi per biblioteche, Servizi bibliotecari}, URL = {https://publications.cnr.it/doc/280391}, CONFERENCE_NAME = {Seminario rivolto agli alunni dell'Istituto Tecnico Economico "F. Carrara" di Lucca, organizzato dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR di Pisa}, CONFERENCE_PLACE = {Pisa, Area della Ricerca CNR}, CONFERENCE_DATE = {31 marzo 2014}, } @INPROCEEDINGS{GIANNINI_2014_INPROCEEDINGS_GBGP_291438, AUTHOR = {Giannini, S. and Biagioni, S. and Goggi, S. and Pardelli, G.}, TITLE = {Mapping Italian Grey Communities: What is There Beyond the Academy?}, YEAR = {2014}, ABSTRACT = {The following title was published on an influential Italian newspaper, La Stampa, on November 7, 2013. "Tra i tesori della 'Letteratura Grigia' un'Eneide in napoletano del '600". The article is about the presentation of the "Fondo De Mauro" on the Italian Network of Popular Culture: this fund originates from a private collection built up in several decades and donated to the Network by Tullio De Mauro and his wife Silvana Ferreri in 2011; it is made up of thousands of books, brochures, pamphlets relating to Italian dialects and minority languages. In the field of healthcare, while browsing on the web, we found the title of a PhD thesis of last year: "Letteratura Grigia nelle meta-analisi delle prove ripartite con scelta casuale degli interventi di sanità". 
In the legal environment, the title of a Seminar at the University of Siena emerges from the web: "La "centralità" della legge e la letteratura grigia. Profili di politica del diritto in Italia tra Otto e Novecento". From these findings, the idea of a survey on the wide variety of grey material available on Italian web portals arises. A first analysis shows that this material is available in different forms and dissemination is carried out through various means such as thematic bibliographies, newspapers articles, various types of documents published in pdf format or simple descriptions on web sites. The following are a few examples excerpted from some home pages belonging to our corpus: • Collection of grey literature. The Historical Archive of Women candidates for becoming the repository where the memories about these themes will be stored... • Grey literature ... Master copies · Reprints · Unreleased copies · Grey Literature. Archives for the history of Education... • Grey literature. The high quality brand of parks... • ... International grey literature; national and international legislative data on the topic of drug addiction and related themes; documentary archive ... • Besides literature in German, there is literature in other languages and grey literature as well - in particular catalogues of museums and exhibitions... • It is about a few thousand of books, brochures and documents of grey literature concerning two topics, Italian dialects and minority languages... Given this scenario, the research aims at verifying whether - and eventually how much - the grey literature available on the web is actually structured, accessible or even managed by systems dealing with its organization and aiming at its retrieval and storing. 
The utmost goal is to build up a map of non-academic communities and their mechanisms for managing, presenting and disseminating this type of material: a sort of journey among the streams of the web which channel meeting minutes, invites, manifests, fliers, pictures, newspapers articles, journalistic services and audio/video material on various topics. These "grey" products - by conveying basic information about social and popular culture - store, represent and spread knowledge. Significant examples could be identified in the web sites presenting the following matters: history of women's culture and of their movement in some specific Italian regions; projects dealing with the sustainability of urban environment with respect to childhood and adolescence; parks and other natural protected environments; archaeological documentation such as draft reports, diaries from the site, letters and miscellaneous documentation; nursing and health-related disciplines which produce guidelines, diagnostic and therapeutic courses, informative material for patients and their families. Also the theatrical culture is nourished by "grey products" as video archives, collections of music LPs and CDs, brochures, scripts, autograph manuscripts (i.e. letters, correspondences, fliers, musical scores). In substance, a heterogeneous set of material which could reveal especially interesting to both researchers, scientists, professionals and simple fans and lovers of the various subjects if ever made available and usable. Focus Analysis of the documentation and production of taxonomies finalized at the creation of a map of non-academic communities and stakeholders involved in the management of grey material. 
Material and methods The survey examines the several disciplines, the typology, the institutional nature and the fields to which these grey communities belong, noticing as well the variety of documentation provided, the structure of information and the presentation and access modalities through the following steps: 1) Selection of the web portals as resulted from the query "letteratura grigia" OR "letteratura non convenzionale" OR "documentazione grigia" OR "materiale grigio". 2) Creation of a corpus made up of 28,000 occurrences. 3) Analysis of the various communities and of the grey material retrieved. 4) Statistical elaboration of the data. Conclusions: reflections on the communities and stakeholders involved in the management of grey literature and on the various ways of presenting the documentation provided by the web sites selected for this survey.}, KEYWORDS = {Italian Grey Literature}, PAGES = {21-25}, URL = {http://greyguide.isti.cnr.it/linkdoc.php?idcode=2014-G01-019\&authority=GLConference\&collection=GL16\&langver=en}, VOLUME = {16}, ISBN = {978-90-77484-24-1}, CONFERENCE_NAME = {Sixteenth International Conference on Grey Literature Grey Literature Lobby: Engines and Requesters for Change}, CONFERENCE_PLACE = {Library of Congress Washington D. C., USA}, CONFERENCE_DATE = {December 8-9, 2014}, EDITOR = {Farace, D. and Frantzen, J.}, } @INPROCEEDINGS{GOGGI_2014_INPROCEEDINGS_GMFBPDBM_291816, AUTHOR = {Goggi, S. and Monachini, M. and Frontini, F. and Bartolini, R. and Pardelli, G. and De Mattei, M. and Bustaffa, F. and Manzella, G.}, TITLE = {Marine Planning and Service Platform (MAPS): An Advanced Research Engine for Grey Literature in Marine Science}, YEAR = {2014}, ABSTRACT = {The MAPS (Marine Planning and Service Platform) project is a development of the Marine project (Ricerca Industriale e Sviluppo Sperimentale Regione Liguria 2007-2013) aiming at building a computer platform for supporting Operative Oceanography in its activities. 
One of the main objectives of the project is to develop a repository that should gather, classify and structure marine scientific literature and data thus guaranteeing their accessibility to researchers and institutions by means of standard protocols. Community and Requirements. Operative Oceanography is the branch of marine research which deals with the development of integrated systems for examining and modeling the ocean monitoring and forecast. Experts need access to real-time data on the state of the sea such as forecasts on temperatures, streams, tides and the relevant scientific literature. This finds application in many areas, ranging from civilian and military safety to protection of off-shore and coastal infrastructures. The metadata. The set of metadata associated with marine data is defined in the CDI (Common Data Index) documented standard. They encode: the types of sizes which have been measured; the measurement tools; the platform which has been employed; the geographic area where measures have been taken; the environmental matrix; the descriptive documentation. As concerns the scientific documentation, at the current stage of the CDI standard, a document is shaped around the following metadata: Title, Authors, Version, ISBN/DOI, Topic, Date of publication, Body/Institution, Abstract. The search engine. The query system (which is actually under development) has been designed for operating with structured data - the metadata - and raw data - the associated technical and scientific documentation. Full-text technologies are often unsuccessful when applied to this type of queries since they assume the presence of specific keywords in the text; in order to fix this problem, the MAPS project suggests to use different semantic technologies for retrieving the text and data and thus getting much more complying results. 
In the Poster we will present the scenario of the Operative Oceanography together with the technologies used to develop an advanced search engine which aims at providing rapid and efficient access to a Digital Library of oceanographic data. The case-study is also highlighting how the retrieval of grey literature from this specific marine community could be reproduced for similar communities as well, thus revealing the great impact that the processing, re-use as well as application of grey data have on societal needs/problems and their answers.}, KEYWORDS = {Marine Science Search Engine Source Data Oceanography}, PAGES = {93-94}, URL = {http://greyguide.isti.cnr.it/dfdownloadnew.php?ident=GLConference/GL16/2014-G01-015\&langver=en\&scelta=Metadata}, ISBN = {978-90-77484-24-1}, CONFERENCE_NAME = {Sixteenth International Conference on Grey Literature Grey Literature Lobby: Engines and Requesters for Change}, CONFERENCE_PLACE = {Library of Congress Washington D. C., USA}, CONFERENCE_DATE = {December 8-9, 2014}, EDITOR = {Farace, C. B. D. and Frantzen, J.}, } @TECHREPORT{FRONTINI_2014_TECHREPORT_FBMPG_287039, AUTHOR = {Frontini, F. and Bartolini, R. and Monachini, M. and Pardelli, G. and Goggi, S.}, TITLE = {Stato dell'arte dei motori semantici. Progetto MAPS, programma operativo regionale POR-FESR (2007-2013)}, YEAR = {2014}, ABSTRACT = {Il presente documento è il deliverable "D1.1 - Stato dell'Arte dei motori semantici" del progetto MAPS (Marine Planning and Service Platform). Il progetto MAPS è una evoluzione del progetto precedente Marine. Tramite il progetto Marine (Bando Ricerca Industriale e Sviluppo Sperimentale Regione Liguria 2007-2013 - pos n.1) è stata realizzata una piattaforma informatica di supporto all'Oceanografia Operativa capace di raccogliere dati marini per renderli poi disponibili ai ricercatori e alle organizzazioni interessate tramite protocolli standard. 
Lo scopo del progetto MAPS è quello di realizzare un Catalogo di Documenti contenente informazioni per la piattaforma Marine. Caratteristica di MAPS è di fornire accesso ai dati oceanografici sia attraverso la ricerca per metadati, sia attraverso la ricerca semantica contenuta nella manualistica tecnico scientifica di riferimento.}, PAGES = {1-22}, URL = {https://publications.cnr.it/doc/287039}, } @ARTICLE{PARDELLI_2013_ARTICLE_PB_242950, AUTHOR = {Pardelli, G. and Biagioni, S.}, TITLE = {Quando la linguistica incontra l'informatica: una riflessione terminologica}, YEAR = {2013}, ABSTRACT = {This paper presents a case study on the use of words in the field of Natural Language Processing. This electronic processing of linguistic data leads to the diffusion of clear and concise words for describing a complex concept that would need a circumlocution to be described instead. The aim of this article is to reflect on these new lexical forms over time. We present a tabular representation summarizing terms extracted from the titles of papers presented at international conferences COLING, International Conference on Computational Linguistics in the period (1965-2010). The system used for the data processing is available at the Istituto di Linguistica Computazionale "A. Zampolli" - CNR, Pisa, Italy.}, KEYWORDS = {Computational Linguistics, Computer Science, Terminology, Information extraction, Content Analysis and Indexing}, PAGES = {67-78}, URL = {http://caspur-ciberpublishing.it}, VOLUME = {3}, DOI = {10.2423/i22394303v3n1p67}, PUBLISHER = {Caspur-Ciber Publishing (Roma, Italia)}, ISSN = {2239-4303}, JOURNAL = {SCIRES-IT (Roma)}, } @INPROCEEDINGS{PARDELLI_2013_INPROCEEDINGS_PGS_254484, AUTHOR = {Pardelli, G. and Goggi, S. 
and Sassi, M.}, TITLE = {Open Grey for Language Technology: a ride on the network}, YEAR = {2013}, ABSTRACT = {The aim of this paper is to introduce the Open Access movement for Natural Language Processing (NLP) by means of a wide range of open access Grey Literature documentation available on the web. In 2008 Robert Dale, in the last issue of volume 35 of Computational Linguistics said: "There are a number of definitions of the term 'open access' in circulation, but almost all share the key principle that scientific literature should be freely available for all to read, download, copy, distribute, and use (with appropriate attribution) without restriction". At first glance it might seem that the Open Access movement has gradually become more influential in the field of language technology by building repositories accessible through the network. Today's digital archives are niches of intellectual production spread by means of a wide range of documents (such as journal articles and proceedings) which, paradoxically, the search engines do not always reach. The use of inappropriate terms in the formulation of queries and the fragmentation of repositories in this area of investigation does not allow to retrieve information on a large scale. The full paper, after a first introductory section, will be organized in two sections: 1) the first dedicated to the methodology for searching and tracing open access resources and to the criteria for analyzing and selecting the online documentation; 2) the second devoted to a description of the state-of-the-art of Open Access Grey Literature material in a statistical and thematic scenario. As things stand, standardization of computational systems interconnected by links and tools of various nature allowing Internet users to easily retrieve the information that the web naturally makes available would then be essential. 
Topics: Sustainability, Public Accessible Resources, Product and Service enhancements, Open Access, Curation and Preservation}, KEYWORDS = {Open Access Movement. Natural Language Processing}, PAGES = {161-165}, URL = {https://publications.cnr.it/doc/254484}, PUBLISHER = {TEXTRELEASE, GL PROGRAM \& CONFERENCE BUREAU (Amsterdam, NLD)}, ISBN = {978-90-77484-20-3}, CONFERENCE_NAME = {GL14 Fourteenth International Conference on Grey Literature. Tracking Innovation Through Grey Literature}, CONFERENCE_PLACE = {Roma, Italy (CNR)}, CONFERENCE_DATE = {29-30 November 2012}, EDITOR = {Farace, D. J. and Frantzen, J. and Greynet}, } @INPROCEEDINGS{SASSI_2013_INPROCEEDINGS_SBP_254230, AUTHOR = {Sassi, M. and Biagioni, S. and Pardelli, G.}, TITLE = {A linguistic and gender approach to 1841 Tuscany population Census}, YEAR = {2013}, ABSTRACT = {The Census of 1841 in Tuscany was the first official data registry which tried to describe Tuscan population as a whole on granducal basis. With the use of special ad hoc created forms all demographic and socioeconomic characteristics of families and single persons in "Granducato di Toscana" were described. These data of Census, now kept by the State Archive of Florence, supply a precious source for studies of all different aspects of the population and include following information: name, surname, age, gender, marital status, employment, religion, schooling, "social status". In the registers for each community and parish a full account is given of homes, resident families, and composition of families including family servants. Each of those entities had a proper incremental code number. [Registers were generated and updated by priests, who at that time were only surely scholarised officers widespread on territory, that is why they are divided by parish, which is an administrative unit typical of canonic right, instead of quarters or "rioni" or "contrade" which instead had been long practiced in civil right. 
] During the early 1980s the research group of prof. Biagioli of Department of Modern History of Pisa University, charged the computational linguistic Institute of CNR with digitalization and the electronic processing of these data as well as of data from "Catasto" [public registry of buildings and land ownership] to enable statistical, demographical, historical, sociological and economic analysis. In this work the authors have used the only partially usable subset of data left of that work, concerning four communities in the province of Pisa i.e. present-day Bièntina, Càscina, Pontedera and San Giuliano Terme (at that time named "Baths of San Giuliano") and is more concerned with terminological and lexical issues a gender related analysis of work and craftmanships. Each of the four communities has its own peculiar profile. Work is developed in 5 points: a) Informatics retrieval of linguistic information from Tuscany of 1800 focused by the arts and craftmanships more in use in families of that time, b) gender division of works and craftmanships, c) observation of lexical disparity in the four communities and terminological curiosities of that historical period, d) actually no longer existing craftmanships, e) diachronic analysis of communities, where possible. In this scenery the authors will introduce the methodology they employed for data analysis. Tables and graphs will be used to better focus different moments and results of work. 
The authors give the English translation of the terms extracted from the Corpus (see Appendix Glossary).}, KEYWORDS = {1841 Tuscany Population Census, Terminology}, PAGES = {200-205}, URL = {https://publications.cnr.it/doc/254230}, PUBLISHER = {Centro de Lingüística Aplicada, Ministerio de Ciencia, Tecnología y Medio Ambiente (Santiago de Cuba, CUB)}, ISBN = {978-959-7174-22-6}, CONFERENCE_NAME = {XIII Simposio Internacional de Comunicación Social-Actualizaciones en Comunicación Social}, CONFERENCE_PLACE = {Santiago de Cuba}, CONFERENCE_DATE = {21-25 Jan 2013}, EDITOR = {Ruiz Miyares, L. and Álvarez Silva, M. R. and Muñoz Alvarado, A.}, } @INPROCEEDINGS{GOGGI_2013_INPROCEEDINGS_GPGB_277513, AUTHOR = {Goggi, S. and Pardelli, G. and Giannini, S. and Biagioni, S.}, TITLE = {Grey literature in European Commission projects}, YEAR = {2013}, ABSTRACT = {The latest recommendations issued by the European Commission go towards the revision of their policy on dissemination and preservation of scientific information in order to promote the access to the results of the community funded research by especially implementing the open access policy within 'Horizon 2020', the EU Framework Programme for Research and Innovation (2014-2020). The aim of the survey is to identify, measure and evaluate the usability and availability of grey literature provided by the European Commission projects web sites in order to verify whether this type of literature is compliant with EU recommendations.}, KEYWORDS = {Grey literature, EU Projects, A. 1 INTRODUCTORY AND SURVEY}, PAGES = {154-159}, URL = {https://publications.cnr.it/doc/277513}, ISBN = {978-90-77484-21-0}, CONFERENCE_NAME = {Fifteenth International Conference on Grey Literature. 
The Grey Audit: a field assessment in grey literature}, CONFERENCE_PLACE = {Bratislava, Slovak Republic}, CONFERENCE_DATE = {2-3 Dicembre 2013}, BOOKTITLE = {GL Program Books}, } @TECHREPORT{PARDELLI_2013_TECHREPORT_P_242269, AUTHOR = {Pardelli, G.}, TITLE = {Un modello bibliografico saussuriano}, YEAR = {2013}, ABSTRACT = {Il modello bibliografico saussuriano, presentato il 21 settembre 2012 al Seminario Internazionale organizzato dall'Università di Firenze presso la Facoltà di Lettere a conclusione del progetto, ha le caratteristiche di un repertorio in quanto volto a una fonte primaria di conoscenza legata a uno specifico autore e a una sola tipologia documentaria. Ciascuna scheda è strutturata per contenere i formati digitali e per divenire strumento di estrazione informativa dai vari ambienti indicizzati. Nella sostanza trattasi di un database bibliografico al passo con l'era delle risorse documentarie cartacee che migrano progressivamente nei formati richiesti dalla rete telematica: una trasposizione verso il digitale resa possibile anche dai numerosi progetti di ricerca nazionali e comunitari di cui un esempio prezioso è il Progetto PRIN coordinato dal Professor Daniele Gambarara. Il Web si configura così come strumento di reference per recuperi veloci di materiale bibliografico. 
La descrizione dell'involucro tecnologico di questo particolare segmento della bibliografia saussuriana è il tema argomentale del presente scritto, mirato a una raccolta di informazioni da convogliare e frammentare in un centinaio di record aventi tutti eguale struttura e organizzati puntualmente in campi e sotto campi, al fine di soddisfare bisogni conoscitivi attraverso una maschera di interrogazione disponibile in Internet grazie ad un vocabolario controllato di termini in linguaggio naturale .}, KEYWORDS = {Saussure Ferdinand, Bibliografia}, PAGES = {1-9}, URL = {https://publications.cnr.it/doc/242269}, } @INPROCEEDINGS{PARDELLI_2012_INPROCEEDINGS_PGS_218940, AUTHOR = {Pardelli, G. and Goggi, S. and Sassi, M.}, TITLE = {Grey Literature Between Tradition and Innovation: Is There a Continuum?}, YEAR = {2012}, ABSTRACT = {This study wants to explore ways of social media communication for Grey Literature. In particular it describes the role of social media in relation with traditional channels and how social media applications can be used for Grey.}, KEYWORDS = {Grey Literature, Communication Networks, Knowledge Networking, Knowledge Exchange}, PAGES = {165-169}, URL = {https://publications.cnr.it/doc/218940}, VOLUME = {13}, CONFERENCE_NAME = {Thirteenth International Conference on Grey Literature: The Grey Circuit, From Social Networking to Wealth Creation (GL 13)}, CONFERENCE_PLACE = {Washington D. C. USA}, CONFERENCE_DATE = {5-6 December 2011}, } @INPROCEEDINGS{PARDELLI_2012_INPROCEEDINGS_PSGB_217173, AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S. and Biagioni, S.}, TITLE = {From medical language processing to BioNLP domain}, YEAR = {2012}, ABSTRACT = {This paper presents the results of a terminological work on a reference corpus in the domain of Biomedicine. 
In particular, the research tends to analyse the use of certain terms in Biomedicine in order to verify their change over the time with the aim of retrieving from the net the very essence of documentation. The terminological sample contains words used in BioNLP and biomedicine and identifies which terms are passing from scientific publications to the daily press and which are rather reserved to scientific production. The final scope of this work is to determine how scientific dissemination to an ever larger part of the society enables a public of common citizens to approach communication on biomedical research and development; and its main source is a reference corpus made up of three main repositories from which information related to BioNLP and Biomedicine is extracted. The paper is divided in three sections: 1) an introduction dedicated to data extracted from scientific documentation; 2) the second section devoted to methodology and data description; 3) the third part containing a statistical representation of terms extracted from the archive: indexes and concordances allow to reflect on the use of certain terms in this field and give possible keys for having access to the extraction of knowledge in the digital era.}, KEYWORDS = {Information Extraction, Information Retrieval, Text mining, Digital Libraries}, PAGES = {2049-2055}, URL = {http://www.lrec-conf.org/proceedings/lrec2012/pdf/687_Paper.pdf}, VOLUME = {7}, PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)}, ISBN = {978-2-9517408-7-7}, CONFERENCE_NAME = {Eighth International Conference on Language Resources and Evaluation. LREC'12}, CONFERENCE_PLACE = {Istanbul, Turkey}, CONFERENCE_DATE = {21-27 May 2012}, BOOKTITLE = {Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC'12)}, EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Doğan, M. U. and Maegaard, B. and Mariani, J. 
and Odijk, J. and Piperidis, S.}, } @INPROCEEDINGS{PARDELLI_2012_INPROCEEDINGS_P_221541, AUTHOR = {Pardelli, G.}, TITLE = {Lineamenti di Linguistica Computazionale per il recupero informativo}, YEAR = {2012}, ABSTRACT = {Le ricerche linguistiche a partire dal secondo dopoguerra hanno avuto un ritmo di evoluzione e di espansione molto rapido grazie anche ai metodi di analisi introdotti, come l'uso dei metodi statistici o quantitativi nello studio delle lingue e delle opere letterarie. Nacquero nuovi settori di applicazione, la linguistica incontrò altre scienze e l'interdisciplinarità venne sempre più praticata fino a diventare indispensabile. L'introduzione di sistemi di automazione delle ricerche nelle analisi linguistiche vide la nascita della Linguistica Computazionale LC che mise in connessione lo studio della lingua e l'elaboratore elettronico. Dalla fine degli anni '40 all'inizio degli anni '60 gli utilizzi del calcolo elettronico per l'elaborazione di dati linguistici si articolarono in due filoni principali: - Gli spogli elettronici dei testi che diedero impulso alla lessicografia computazionale, avviata da Padre Roberto Busa nel 1951 con la compilazione delle concordanze dell'opera omnia di Tommaso d'Aquino; - I tentativi di traduzione automatica TA, in inglese machine translation MT, avviati da Weaver nel 1949 con la pubblicazione del memorandum "Translation". La TA divenne da subito nucleo e centro di spinta della LC utilizzando il calcolatore per trasportare un testo da una lingua naturale all'altra. Il contenuto argomentale dei testi della Biblioteca dell'Istituto di Linguistica Computazionale si sviluppa per lo più sulle tematiche sopra descritte. 
L'articolo darà enfasi alla terminologia della LC, nella prima parte, quella introduttiva; nella seconda parte saranno fornite informazioni inerenti il patrimonio bibliografico, il software di gestione usato e indicazioni per il recupero informativo; la terza parte andrà a presentare il "Fondo Antonio Zampolli", preziosa collezione di testi, alcuni unici in Italia, nel settore del trattamento automatico della lingua, che va ad arricchire e completare la Biblioteca ILC. In appendice sarà fornita una tabella riassuntiva dei termini estratti dai titoli degli articoli presentati alle conferenze di Linguistica Computazionale COLING, dal 1965 - anno della prima conferenza tenuta a New York - al 2010, conferenza tenuta a Pechino. Trattasi di 23 conferenze internazionali di Linguistica Computazionale, fondamentali nella storia della disciplina. L'estrazione terminologica del corpus COLING è stata operata con gli strumenti di analisi testuale del laboratorio DylanLab dell'Istituto di Linguistica Computazionale.}, KEYWORDS = {Linguistica Computazionale, Terminologia, Repository}, URL = {https://publications.cnr.it/doc/221541}, CONFERENCE_NAME = {Seminario di Studi-Benvenuti in Biblioteca! Umanesimo e società nelle collezioni librarie del CNR}, CONFERENCE_PLACE = {Roma}, CONFERENCE_DATE = {29-30 maggio 2012}, } @INPROCEEDINGS{PARDELLI_2012_INPROCEEDINGS_PE_221547, AUTHOR = {Pardelli, G. and Enea, A.}, TITLE = {Per un'edizione digitale dei manoscritti di Ferdinand de Saussure: Verso la Costruzione del prototipo bibliografico}, YEAR = {2012}, ABSTRACT = {Per un'edizione digitale dei manoscritti di Ferdinand de Saussure - PRIN 2008 Unità operativa CNR-ILC Responsabile dott. Nilda Ruimy Relazione attività svolta da Gabriella Pardelli Obiettivo: costruzione del prototipo bibliografico saussurriano compatibile con le applicazioni sviluppate per il progetto e volte alla rete telematica. 
In particolare il prototipo si integra con l' ontologia di dominio sviluppata per la creazione del lessico saussurriano (ILC) e con l'applicazione di Natural Language Processing nata per il recupero della terminologia multilingue da immagini digitali (ILC). Metodologia: 1) scelta del software; 2) recupero delle informazioni bibliografiche ; 3) digitalizzazione 4) collegamento testo/immagine. 1) Il prototipo bibliografico degli scritti di Ferdinand de Saussure si avvale del software CDS/ISIS Computerised Documentation Service / Integrated Set of Information Systems. Il software è sviluppato, mantenuto e distribuito dall'UNESCO. L'applicazione permette l'associazione di file esterni (immagini e testi) oltre alla creazione di link tra record e archivi diversi. L'esportazione dei dati segue lo standard internazionale ISO2709. 2) La ricca bibliografia è stata elaborata dal coordinatore nazionale del progetto. Il recupero delle fonti saussurriane è stato svolto nella Biblioteca della Scuola Normale Superiore di Pisa e nella Biblioteca del Dipartimento di Linguistica di Pisa. 3) Le immagini sono state acquisite con la collaborazione di un fotografo professionista - fonti di prima generazione -. Invece per le fonti non recuperabili sul territorio italiano, l'acquisizione è frutto di portali europei dedicati a Saussure (Gallica) - fonti di seconda generazione - Con l'abbinamento della descrizione bibliografica alla rispettiva fonte digitalizzata il prototipo è stato ultimato. L'applicazione è stata presentata il 21 settembre 2012 al seminario internazionale organizzato dall'Università di Firenze, presso la Facoltà di Lettere , a conclusione del progetto. Consistenza: Il database contiene 150 record corredati dalla rispettiva immagine. 
Ogni record, diviso in campi e in ulteriori sotto campi, è stato pensato per organizzare e frammentare l'informazione e consentire indicizzazioni puntuali per recuperi informativi sui titoli, sulle lingue indagate da Saussure e oggetto di argomentazione linguistica (latino, greco, tedesco...), sulla tipologia della fonte documentaria, sulla data della comunicazione, sulla data della pubblicazione, sui commenti, sulle note, sulle riedizioni ...}, KEYWORDS = {Ferdinand de Saussure Banca dati bibliografica}, URL = {https://publications.cnr.it/doc/221547}, CONFERENCE_NAME = {Seminario internazionale Per un'edizione digitale dei manoscritti di Ferdinand de Saussure-Conclusione}, CONFERENCE_PLACE = {Università di Firenze}, CONFERENCE_DATE = {21-22 settembre 2012}, } @INPROCEEDINGS{PARDELLI_2012_INPROCEEDINGS_PSG_220806, AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S.}, TITLE = {Open Grey for Language Technology: a ride on the network}, YEAR = {2012}, ABSTRACT = {The aim of this paper is to introduce the Open Access movement for Natural Language Processing (NLP) by means of a wide range of open access Grey Literature documentation available on the web. In 2008 Robert Dale, in the last issue of volume 35 of Computational Linguistics said: "There are a number of definitions of the term 'open access' in circulation, but almost all share the key principle that scientific literature should be freely available for all to read, download, copy, distribute, and use (with appropriate attribution) without restriction". At first glance it might seem that the Open Access movement has gradually become more influential in the field of language technology by building repositories accessible through the network. Today's digital archives are niches of intellectual production spread by means of a wide range of documents (such as journal articles and proceedings) which, paradoxically, the search engines do not always reach. 
The use of inappropriate terms in the formulation of queries and the fragmentation of repositories in this area of investigation does not allow to retrieve information on a large scale. The full paper, after a first introductory section, will be organized in two sections: 1) the first dedicated to the methodology for searching and tracing open access resources and to the criteria for analyzing and selecting the online documentation; 2) the second devoted to a description of the state-of-the-art of Open Access Grey Literature material in a statistical and thematic scenario. As things stand, standardization of computational systems interconnected by links and tools of various nature allowing Internet users to easily retrieve the information that the web naturally makes available would then be essential. Topics: Sustainability, Public Accessible Resources, Product and Service enhancements, Open Access, Curation and Preservation}, KEYWORDS = {Open Access Movement Natural Language Processing}, PAGES = {89-94}, URL = {https://publications.cnr.it/doc/220806}, VOLUME = {14}, CONFERENCE_NAME = {GL14 Fourteenth International Conference on Grey Literature (GL14)}, CONFERENCE_PLACE = {National Research Council, Rome, Italy}, CONFERENCE_DATE = {29-30 November 2012}, } @ARTICLE{MARZI_2011_ARTICLE_MPS_186118, AUTHOR = {Marzi, C. and Pardelli, G. and Sassi, M.}, TITLE = {A terminology based re-definition of Grey Literature}, YEAR = {2011}, ABSTRACT = {The conventionally accepted definition of Grey Literature, as Information produced and distributed by non-commercial publishing, does not take into consideration either the increasing availability of forms of grey knowledge, or the growing importance of computer-based encoding and management as the standard mode of creating and developing grey literature. 
Semi-automated terminological analysis of almost twenty years of terminological creativity in the proceedings of eleven GL International Conferences offers the opportunity to pave the way to a bottom-up redefinition of Grey Literature stemming from attested terminological creativity and lexical innovation. In this paper, we focus on a set of automatically-acquired terms obtained by subjecting our reference Corpus to a number of pre-processing steps of automated text analysis, such as concordances, frequency lists and lexical association scores. Acquired terms allow us to throw in sharp relief developing trends and important shifts of emphasis in the current understanding of the notion of Grey Literature.}, KEYWORDS = {Grey Literature, Terminology extraction}, PAGES = {19-23}, URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84869064979\&origin=inward}, VOLUME = {7}, PUBLISHER = {TextRelease (Amsterdam, Paesi Bassi)}, ISSN = {1574-1796}, JOURNAL = {The Grey journal (Print)}, } @INPROCEEDINGS{MARZI_2011_INPROCEEDINGS_MPS_176389, AUTHOR = {Marzi, C. and Pardelli, G. and Sassi, M.}, TITLE = {A terminology based re-definition of Grey Literature}, YEAR = {2011}, ABSTRACT = {The conventionally accepted definition of Grey Literature, as Information produced and distributed by non-commercial publishing, does not take into consideration either the increasing availability of forms of grey knowledge, or the growing importance of computer-based encoding and management as the standard mode of creating and developing grey literature. Semi-automated terminological analysis of almost twenty years of terminological creativity in the proceedings of eleven GL International Conferences offers the opportunity to pave the way to a bottom-up redefinition of Grey Literature stemming from attested terminological creativity and lexical innovation. 
In this paper, we focus on a set of automatically-acquired terms obtained by subjecting our reference Corpus to a number of pre-processing steps of automated text analysis, such as concordances, frequency lists and lexical association scores. Acquired terms allow us to throw in sharp relief developing trends and important shifts of emphasis in the current understanding of the notion of Grey Literature.}, KEYWORDS = {GL conference corpus, Grey literature definition, Terminology extraction}, PAGES = {27-31}, URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84883303651\&origin=inward}, VOLUME = {12}, PUBLISHER = {TextRelease (Amsterdam, NLD)}, ISSN = {1386-2316}, ISBN = {9789077484166}, CONFERENCE_NAME = {Twelfth International Conference on Grey Literature: Transparency in Grey Literature, Grey Tech Approaches to High Tech Issues}, CONFERENCE_PLACE = {Praga}, CONFERENCE_DATE = {6-7 dicembre 2010}, BOOKTITLE = {Transparency in Grey Literature, Grey Tech Approaches to High Tech Issues}, EDITOR = {Farace, D. J. and Frantzen, J.}, } @INPROCEEDINGS{PARDELLI_2011_INPROCEEDINGS_PSOBG_199282, AUTHOR = {Pardelli, G. and Sassi, M. and Orsolini, P. and Biagioni, S. and Giannini, S.}, TITLE = {An open archive of scientific communication}, YEAR = {2011}, ABSTRACT = {This paper presents the results of a terminological work conducted by the authors on a Digital Archives Net of the Italian National Research Council (CNR) in the field of Computer Science. In particular, the research tends to analyse the use of certain terms in Computer Science in order to verify their change over the time with the aim of retrieving from the net the very essence of documentation. Its main source is a reference corpus made up of 13,500 documents which collects the scientific productions of three CNR research Institutes. 
They are ISTI (Institute of Information Science and Technologies), IIT (Institute of Informatics and Telematics) and ILC (Institute of Computational Linguistics), all of them born from the "Centro Studi sulle Calcolatrici Elettroniche (CSCE)" and now belonging to the CNR Department of Information \& Communication Technologies and Cultural Identity. This study is divided in three sections: an introductory one dedicated to the data extracted from the scientific documentation: the data have in common the use of some terms proper of the Computer Science lexicon although these term belong to different branches (Linguistics, Informatics and Telematics); the second section is devoted to the description of the contents managed by the PUMA (Publication Management System) system; the third section contains a statistical representation of terms extracted from archive: some comparison tables between the occurrences of the most used terms in the scientific documentation produced by the three Institutes will be created and diagrams with percentages about the most frequently used terms will be displayed too. Lastly, indexes and concordances will allow to reflect on the use of certain terms in this field and give possible keys for having access to the extraction of knowledge in the digital era.},
  KEYWORDS = {Digital Archives, Communication, Terminology, Open Access},
  PAGES = {914--918},
  URL = {http://www.santiago.cu/hosting/linguistica/simposios.php?s=XII},
  VOLUME = {II},
  PUBLISHER = {Centro de linguística aplicada, Ministerio de ciencia, tecnología y medio ambiente (Santiago de Cuba, CUB)},
  ISBN = {978-959-7174-19-6},
  CONFERENCE_NAME = {Comunicación Social en el Siglo XXI. XII Simposio Internacional de Comunicacion Social},
  CONFERENCE_PLACE = {Santiago de Cuba},
  CONFERENCE_DATE = {17-21 gennaio 2011},
  BOOKTITLE = {Comunicacion social en el siglo XXI, vol. II},
  EDITOR = {Miyares, L. R. and Silva, M. R. Á.},
}

% Conference paper: Thirteenth International Conference on Grey Literature (2011).
% NOTE(review): record has no BOOKTITLE; standard inproceedings styles expect one.
@INPROCEEDINGS{PARDELLI_2011_INPROCEEDINGS_PSG_205788,
  AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S.},
  TITLE = {Grey Literature Between Tradition and Innovation: Is there a Continuum?},
  YEAR = {2011},
  ABSTRACT = {This study wants to explore ways of social media communication for Grey Literature. In particular it describes the role of social media in relation with traditional channels and how social media applications can be used for Grey.},
  KEYWORDS = {Grey Literature, Communication networks, Knowledge networking, knowledge exchange},
  PAGES = {64--65},
  URL = {https://publications.cnr.it/doc/205788},
  VOLUME = {13},
  ISBN = {978-90-77484-00-5},
  CONFERENCE_NAME = {Thirteenth International Conference on Grey Literature: The Grey Circuit, From Social Networking to Wealth Creation},
  CONFERENCE_PLACE = {Washington D. C. USA-Library of Congress},
  CONFERENCE_DATE = {5-6 december 2011},
  EDITOR = {Farace, D. J. and Frantzen, J.},
}

% Journal article: The Grey journal, volume 6 (2010).
@ARTICLE{MARZI_2010_ARTICLE_MPS_64555,
  AUTHOR = {Marzi, C. and Pardelli, G. and Sassi, M.},
  TITLE = {Grey literature and computational linguistics: From paper to net},
  YEAR = {2010},
  ABSTRACT = {The advent and exponential development of the World Wide Web has led to an increasing availability of unstructured knowledge and distributed information sources, meeting general public requirements that are hardly addressed by other more traditional information channels. This trend has concurrently raised a considerable interest in the application of Computational Linguistics (CL) methodologies to document access and retrieval, as they offer the unprecedented opportunity to make the subjective, user-centred information demands of Net citizens meet the ever changing and heterogeneous information flow of the web.
Over the last five years, more and more Italian Universities have introduced CL courses into their Humanities curricula, making available on-line teaching materials, tutorials and language engineering software that appear to supply the lack of offer from traditional Italian publishing houses. In this paper, we consider in some detail the role played by this type of Grey Literature in bringing up a wider and increasingly more aware community of web users in Italy.},
  KEYWORDS = {Grey Literature},
  PAGES = {145--148},
  URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-78149461778\&origin=inward},
  VOLUME = {6},
  PUBLISHER = {TextRelease (Amsterdam, Paesi Bassi)},
  ISSN = {1574-1796},
  JOURNAL = {The Grey journal (Print)},
}

% Conference paper: Eleventh International Conference on Grey Literature.
% NOTE(review): same title, authors, pages and conference as MARZI_2009_INPROCEEDINGS_MPS_112950
% (different year and ISBN) -- possibly a duplicate record; confirm before merging.
@INPROCEEDINGS{MARZI_2010_INPROCEEDINGS_MPS_84790,
  AUTHOR = {Marzi, C. and Pardelli, G. and Sassi, M.},
  TITLE = {Grey Literature and Computational Linguistics: From Paper to Net},
  YEAR = {2010},
  ABSTRACT = {The advent and exponential development of the World Wide Web has led to an increasing availability of unstructured knowledge and distributed information sources, meeting general public requirements that are hardly addressed by other more traditional information channels. This trend has concurrently raised a considerable interest in the application of Computational Linguistics (CL) methodologies to document access and retrieval, as they offer the unprecedented opportunity to make the subjective, user-centred information demands of Net citizens meet the ever changing and heterogeneous information flow of the web. Over the last five years, more and more Italian Universities have introduced CL courses into their Humanities curricula, making available on-line teaching materials, tutorials and language engineering software that appear to supply the lack of offer from traditional Italian publishing houses.
In this paper, we consider in some detail the role played by this type of Grey Literature in bringing up a wider and increasingly more aware community of web users in Italy.},
  KEYWORDS = {Computational Linguistics, Grey, Web-based information},
  PAGES = {81--84},
  URL = {https://publications.cnr.it/doc/84790},
  VOLUME = {11},
  PUBLISHER = {TextRelease (Amsterdam, NLD)},
  ISSN = {1386-2316},
  ISBN = {978-90-77484-13-5},
  CONFERENCE_NAME = {Eleventh International Conference on Grey Literature. The Grey Mosaic, Piecing it All Together},
  CONFERENCE_PLACE = {Washington, DC},
  CONFERENCE_DATE = {14-15 dicembre 2009},
  BOOKTITLE = {The Grey Mosaic, Piecing it All Together},
  EDITOR = {Farace, D. J. and Frantzen, J.},
}

% Conference paper: Seventh International Conference on Language Resources and Evaluation (Valletta, 2010).
@INPROCEEDINGS{SASSI_2010_INPROCEEDINGS_SPBCG_171547,
  AUTHOR = {Sassi, M. and Pardelli, G. and Biagioni, S. and Carlesi, C. and Goggi, S.},
  TITLE = {A Digital Archive of Research Papers in Computer Science},
  YEAR = {2010},
  ABSTRACT = {This paper presents the results of a terminological work conducted by the authors on a Digital Archives Net of the Italian National Research Council (CNR) in the field of Computer Science. In particular, the research tends to analyse the use of certain terms in Computer Science in order to verify their change over the time with the aim of retrieving from the net the very essence of documentation. Its main source is a reference corpus made up of 13,500 documents which collects the scientific productions of three CNR research Institutes. They are ISTI (Institute of Information Science and Technologies), IIT (Institute of Informatics and Telematics) and ILC (Institute of Computational Linguistics), all of them born from the "Centro Studi sulle Calcolatrici Elettroniche (CSCE)" and now belonging to the CNR Department of Information \& Communication Technologies and Cultural Identity.
This study is divided in three sections: 1) an introductory one dedicated to the data extracted from the scientific documentation: the data have in common the use of some terms proper of the Computer Science lexicon although these term belong to different branches (Linguistics, Informatics and Telematics); 2) the second section is devoted to the description of the contents managed by the PUMA (Publication Management System) system; 3) the third part contains a statistical representation of terms extracted from archive: some comparison tables between the occurrences of the most used terms in the scientific documentation produced by the three Institutes will be created and diagrams with percentages about the most frequently used terms will be displayed too. Lastly, indexes and concordances will allow to reflect on the use of certain terms in this field and give possible keys for having access to the extraction of knowledge in the digital era.},
  KEYWORDS = {Digital libraries, Document Classification, Text categorisation, Text mining, Natural Language Processing, Text analysis},
  PAGES = {1245--1248},
  URL = {http://www.lrec-conf.org/proceedings/lrec2010/summaries/945.html},
  PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
  ISBN = {2-9517408-6-7},
  CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
  CONFERENCE_PLACE = {Valletta, Malta},
  CONFERENCE_DATE = {17-23 Maggio 2010},
  BOOKTITLE = {Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10)},
  EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Rosner, M. and Tapias, D.},
}

% Conference paper: Twelfth International Conference on Grey Literature (Prague, 2010).
% NOTE(review): same title, authors and conference as MARZI_2011_INPROCEEDINGS_MPS_176389
% (different pages and ISBN) -- possibly two records of one work; confirm before merging.
@INPROCEEDINGS{MARZI_2010_INPROCEEDINGS_MPS_186131,
  AUTHOR = {Marzi, C. and Pardelli, G. and Sassi, M.},
  TITLE = {A Terminology Based Re-Definition of Grey Literature},
  YEAR = {2010},
  ABSTRACT = {The Luxembourg Convention on Grey Literature held in 1997 offered the following definition of Grey Literature (expanded in New York, 2004): "Information produced and distributed on all levels of government, academics, business and industry in electronic and print formats not controlled by commercial publishing, i.e. where publishing is not the primary activity of the producing body". Is this definition still valuable? Is it so far completely satisfactory? Or does it rather need important modifications? We suggest that an interesting re-definition of GL can be based upon careful examination of the longitudinal trend of 10 years of terminological creativity in the proceedings of the GL international Conference. Our empirical basis is the Corpus of GreyText Inhouse Archive, available on http://www.greynet.org/opensiglerepository.html consisting of titles, themes, keywords and full abstracts, for a total amount of more than sixty thousand word tokens. In the full version of our paper, we intend to focus on a set of automatically-acquired terms (both single-word and multi-word terms) obtained by subjecting our reference Corpus to a number of pre-processing steps of automated text analysis, such as concordances, frequency lists and lexical association scores (e.g. Mutual Information on word pairs). To anticipate some of our results, the following three terms, that appear to be shared by various disciplinary sub-fields, mark, in our view, important stages in the evolution of our current understanding of GL: digital, access and web. The attribute digital, an increasingly popular synonym of the now obsolete electronic, emphasises the growing importance of computer-based encoding as the standard medium of GL.
The noun access (defining the process of accessing text documents) is seen in the company of adjectives like easy, full, grey and open to shape up important conceptual innovations in the way GL material is distributed: e.g. open access focuses on the free accessibility of digital contents. Coupled with information, document and repository (note, however, that repository is generally understood as a technical synonym of open archive), access points to a conception of world-wide available, structured cultural contents. Finally, reference to the web lays emphasis on the huge importance of the World Wide Web as the standard means of disseminating GL. All these aspects are not fully taken into account in the standard definition of GL reported above. Our inquiry is intended to pave the way to a bottom-up re-definition of GL, stemming from the terminological creativity and lexical innovation monitored over ten years of technical work in the field.},
  KEYWORDS = {Terminology extraction, Grey Literature definition, GL Conference corpus},
  PAGES = {24--28},
  URL = {https://publications.cnr.it/doc/186131},
  VOLUME = {12},
  ISSN = {1385-2308},
  ISBN = {978-90-77484-15-9},
  CONFERENCE_NAME = {Twelfth International Conference on Grey Literature: Transparency in Grey Literature, Grey Tech Approaches to High Tech Issues},
  CONFERENCE_PLACE = {Prague},
  CONFERENCE_DATE = {6-7/12/2010},
  BOOKTITLE = {Transparency in Grey Literature, Grey Tech Approaches to High Tech Issues},
  EDITOR = {Farace, D. J. and Frantzen, J.},
}

% Miscellaneous record: item of the PRIN 2008 research project named in the abstract.
@MISC{RUIMY_2010_MISC_RP_157474,
  AUTHOR = {Ruimy, N. and Pardelli, G.},
  TITLE = {Un modello lessicale da customizzare per lo sviluppo di un thesaurus lessico elettronico della terminologia saussuriana},
  YEAR = {2010},
  ABSTRACT = {Progetto di ricerca PRIN 2008: Per un'edizione digitale dei manoscritti di Ferdinand de Saussure. Unità di Ricerca Istituto di Linguistica Computazionale Antonio Zampolli CNR -Pisa Linea di attività II.},
  KEYWORDS = {Ontology, Computational Semantics},
  PAGES = {1},
  URL = {https://publications.cnr.it/doc/157474},
}

% Conference paper: Tenth International Conference on Grey Literature (Amsterdam, December 2008).
% NOTE(review): same title, authors and conference as CIGNONI_2008_INPROCEEDINGS_CPS_112937
% (different year, pages and ISBN) -- confirm whether these are distinct publications.
@INPROCEEDINGS{CIGNONI_2009_INPROCEEDINGS_CPS_84740,
  AUTHOR = {Cignoni, L. and Pardelli, G. and Sassi, M.},
  TITLE = {Grey Literature for Natural Language Processing: a Terminological and Statistical Approach},
  YEAR = {2009},
  ABSTRACT = {This paper presents the results of a study on grey literature (GL) in the field of Natural Language Processing (NLP). Our data has been collected in a corpus of ca 13,000 records corresponding to the titles of papers presented at International Conferences from 1950 to June 2008. A statistical representation of the most significant terms relative to GL in NLP and other interrelated disciplines associates old and new words, highlighting the terminological changes that have taken place in the course of time. Aim of our study is to contribute to the creation of language resources for the extraction of GL coming from the Web in order to help prevent the disappearance of documents containing NLP words that have undergone rapid development over the last decades. This paper is organised as follows: after a general introduction to our work, section 2 provides a historical overview of NLP; sections 3 and 4 offer an account of the most relevant terms used by specialists in different periods, and indicative of the changes that have taken place; section 5 describes the methodology we have used and also contains information on our GL database and a graphical representation of the data.
Finally, the conclusions stress the need to integrate pre-existing or obsolete words and expressions, creating NLP synonym relations.},
  KEYWORDS = {Computational Linguistics, Terminology, Grey Literature},
  PAGES = {93--100},
  URL = {https://publications.cnr.it/doc/84740},
  VOLUME = {10},
  PUBLISHER = {TextRelease (Amsterdam, NLD)},
  ISBN = {978-90-77484-11-1},
  CONFERENCE_NAME = {Tenth International Conference on Grey Literature: Designing the Grey Grid for Information Society},
  CONFERENCE_PLACE = {Amsterdam},
  CONFERENCE_DATE = {DEC 08-09, 2008},
  BOOKTITLE = {Designing the Grey Grid for Information Society},
  EDITOR = {Farace, D. J. and Frantzen, J.},
}

% Conference paper: XI Simposio Internacional de Comunicacion Social (Santiago de Cuba, 2009).
% NOTE(review): record has no BOOKTITLE; standard inproceedings styles expect one.
@INPROCEEDINGS{PARDELLI_2009_INPROCEEDINGS_PSGO_84738,
  AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S. and Orsolini, P.},
  TITLE = {Computational Linguistics Terminology},
  YEAR = {2009},
  ABSTRACT = {The aim of this article is to provide a statistical representation of significant terms used in the field of Natural Language Processing from the 1960's till nowadays, in order to draft a survey on the most significant research trends in that period. By retrieving these keywords it should be possible to highlight the ebb and flow of some thematic topics. The NLP terminological sample derives from a database - created for this purpose using the DBT software (Textual Data Base, ILC patent).
Scientific presentations at the above-mentioned conferences point out a frequent recurrence of expressions such as mécanisation des études lexicologique, les machines à cartes perforées et leurs application lexicologique which trace back to the origin of electronic processing of linguistic data and to some solutions of linguistic-literary problems, to lexicographic researches, to the scientific terminology, to automatic dictionaries, to homographs, synonyms and the possibility of producing indexes and concordances by means of an electronic processor: Terms such as meccanizzazione, mechanical translation, machine à traduire used by experts of the field in the 1950s and 1960s seem to well testify the change, the shift, the beginning and then the final consecration of a rapidly evolving field: Natural Language Processing.},
  KEYWORDS = {Computational Linguistics, Terminology},
  PAGES = {303--307},
  URL = {https://publications.cnr.it/doc/84738},
  PUBLISHER = {Centro de linguística aplicada, Ministerio de ciencia, tecnología y medio ambiente (Santiago de Cuba, CUB)},
  ISBN = {978-959-7174-14-1},
  CONFERENCE_NAME = {XI Simposio Internacional de Comunicación Social},
  CONFERENCE_PLACE = {Santiago de Cuba},
  CONFERENCE_DATE = {19-23 de enero de 2009},
  EDITOR = {Silva, M. R. A. and Moreno, C. A. and Miyares, L. R.},
}

% Conference paper: 4th Language Technology Conference (Poznan, 2009).
% NOTE(review): record has no BOOKTITLE; standard inproceedings styles expect one.
@INPROCEEDINGS{SASSI_2009_INPROCEEDINGS_SPG_84757,
  AUTHOR = {Sassi, M. and Pardelli, G. and Goggi, S.},
  TITLE = {Terminology Extraction from the web},
  YEAR = {2009},
  ABSTRACT = {This paper presents the results of a study on textual resources in the field of Human Language Technology (HLT). A statistical representation of the most significant terms in HLT and other interrelated disciplines associates old and new words, highlighting the terminological changes that have taken place in the course of time.
Aim of our study is to contribute to the creation of language resources for the extraction of documentation coming from the Web in order to help preventing the disappearance of documents containing HLT words that have undergone rapid development over the last decades. This paper is organised as follows: after a general introduction to our work, section 2 provides a historical overview of HLT; sections 3 and 4 offer an account of the most relevant terms used by specialists in different periods, and those indicative of the changes that have taken place; section 5 describes the methodology we have used and also contains information on our database and a graphical representation of the data. Finally, the conclusions stress the need to integrate pre-existing or obsolete words and expressions, creating HLT synonym relations.},
  KEYWORDS = {Terminology, Computational Linguistics, Web-based information},
  PAGES = {417--420},
  URL = {https://publications.cnr.it/doc/84757},
  ISBN = {978-83-7177-746-2},
  CONFERENCE_NAME = {4th Language Technology Conference: Human Language Technology as a challenge for Computer Science and Linguistics},
  CONFERENCE_PLACE = {Poznan, PL},
  CONFERENCE_DATE = {November 6-8, 2009},
  EDITOR = {Vetulani, Z.},
}

% Conference paper: Eleventh International Conference on Grey Literature (Washington, DC, December 2009).
% NOTE(review): same title, authors, pages and conference as MARZI_2010_INPROCEEDINGS_MPS_84790
% (different year and ISBN) -- possibly a duplicate record; confirm before merging.
@INPROCEEDINGS{MARZI_2009_INPROCEEDINGS_MPS_112950,
  AUTHOR = {Marzi, C. and Pardelli, G. and Sassi, M.},
  TITLE = {Grey Literature and Computational Linguistics: From Paper to Net},
  YEAR = {2009},
  ABSTRACT = {The advent and exponential development of the World Wide Web has led to an increasing availability of unstructured knowledge and distributed information sources, meeting general public requirements that are hardly addressed by other more traditional information channels.
This trend has concurrently raised a considerable interest in the application of Computational Linguistics (CL) methodologies to document access and retrieval, as they offer the unprecedented opportunity to make the subjective, user-centred information demands of Net citizens meet the ever changing and heterogeneous information flow of the web. Over the last five years, more and more Italian Universities have introduced CL courses into their Humanities curricula, making available on-line teaching materials, tutorials and language engineering software that appear to supply the lack of offer from traditional Italian publishing houses. In this paper, we consider in some detail the role played by this type of Grey Literature in bringing up a wider and increasingly more aware community of web users in Italy. Theme: Impact of Grey Literature on Net Citizens},
  KEYWORDS = {Computational Linguistics, Grey Literature, Web-based information},
  PAGES = {81--84},
  URL = {https://publications.cnr.it/doc/112950},
  VOLUME = {11},
  ISBN = {978-90-77484-14-2},
  CONFERENCE_NAME = {Eleventh International Conference on Grey Literature "The Grey Mosaic, Piecing it All Together"},
  CONFERENCE_PLACE = {Washington, DC},
  CONFERENCE_DATE = {14-15 December 2009},
  BOOKTITLE = {Eleventh International Conference on Grey Literature ``The Grey Mosaic, Piecing it All Together''},
  EDITOR = {Farace, D. J. and Frantzen, J.},
}

% Conference paper: international seminar on publishing the Saussure manuscripts (Arcavacata, 2009).
% NOTE(review): record has no BOOKTITLE; standard inproceedings styles expect one.
@INPROCEEDINGS{RUIMY_2009_INPROCEEDINGS_RBP_112946,
  AUTHOR = {Ruimy, N. and Bozzi, A. and Pardelli, G.},
  TITLE = {Modèle lexical pour un thésaurus-lexique électronique de la terminologie saussurienne},
  YEAR = {2009},
  ABSTRACT = {Le modèle lexical SIMPLE que nous nous proposons d'adopter pour la création d'un thésaurus-lexique de la terminologie linguistique saussurienne a été créé dans le cadre du projet européen éponyme et a permis le développement de lexiques sémantiques monolingues harmonisés pour douze langues de l'Union Européenne.
Dès sa création, il s'est imposé comme standard de facto et a ainsi inspiré de manière déterminante le standard international ISO pour les lexiques du Traitement Automatique des Langues. Dans le panorama de la Lexicographie Computationnelle, ce modèle lexical se distingue par certains aspects particulièrement novateurs. L'approche théorique adoptée pour la représentation de l'information sémantique est basée sur les principes fondamentaux de la théorie du Lexique Génératif (J. Pustejovsky, 1995 ; 2001 ). L'architecture flexible du modèle ainsi que la méthodologie de construction du lexique permettent d'encoder dans les entrées lexicales une ample gamme d'informations hautement structurées couvrant tous les aspects de la sémantique lexicale des mots ; ceci de manière cohérente, et au degré de granularité souhaité. La structuration conceptuelle du lexique est confiée à une ontologie linguistique mettant en relief le caractère multidimensionnel du sens lexical. L'ontologie SIMPLE est formée de types sémantiques indépendants des langues et a été conçue en prévision d'expansions ou de spécialisations visant à satisfaire aux exigences de domaines d'intérêt particuliers. Outre la classification ontologique et un certain nombre de traits sémantiques, les unités lexicales sont caractérisées par un réseau de relations sémantiques qui sont en majeure partie le fruit d'une relecture de la structure des qualia que Pustejovsky emprunte à Moravcsik, 1975 . Ces relations permettent de modéliser l'information concernant les différentes composantes sémantiques qui concourent à définir la structure interne d'une unité lexicale. Elles explicitent ses liens hyperonymiques et méronymiques mais aussi, sur l'axe syntagmatique, les liens aux différents prédicats qui contribuent à éclairer son sens, et en particulier l'origine et la fonction de l'entité dénotée. D'autres relations, telles que la synonymie, la polysémie logique et la dérivation morphologique sont également définies.
Les lexèmes prédicatifs, et en particulier les verbes, sont de surcroît caractérisés par le scénario sémantique dans lequel ils sont impliqués. Celui-ci est décrit en termes de classe aspectuelle et de structure argumentale du prédicat, avec indication du rôle sémantique et des restrictions de sélection de chacun des arguments.},
  KEYWORDS = {Computational Lexicon, Thesaurus},
  PAGES = {1--17},
  URL = {https://publications.cnr.it/doc/112946},
  CONFERENCE_NAME = {Séminaire international "Publier les manuscrits de Ferdinand de Saussure"},
  CONFERENCE_PLACE = {Arcavacata, Università della Calabria},
  CONFERENCE_DATE = {1-3 ottobre 2009},
}

% Conference paper: Tenth International Conference on Grey Literature (Amsterdam, December 2008).
% NOTE(review): same title, authors and conference as CIGNONI_2009_INPROCEEDINGS_CPS_84740
% (different year, pages and ISBN) -- confirm whether these are distinct publications.
% NOTE(review): record has no BOOKTITLE; standard inproceedings styles expect one.
@INPROCEEDINGS{CIGNONI_2008_INPROCEEDINGS_CPS_112937,
  AUTHOR = {Cignoni, L. and Pardelli, G. and Sassi, M.},
  TITLE = {Grey Literature for Natural Language Processing: a Terminological and Statistical Approach},
  YEAR = {2008},
  ABSTRACT = {This paper presents the results of a study on grey literature (GL) in the field of Natural Language Processing (NLP). Our data has been collected in a corpus of ca 13,000 records corresponding to the titles of papers presented at International Conferences from 1950 to June 2008. A statistical representation of the most significant terms relative to GL in NLP and other interrelated disciplines associates old and new words, highlighting the terminological changes that have taken place in the course of time. Aim of our study is to contribute to the creation of language resources for the extraction of GL coming from the Web in order to help prevent the disappearance of documents containing NLP words that have undergone rapid development over the last decades.
This paper is organised as follows: after a general introduction to our work, section 2 provides a historical overview of NLP; sections 3 and 4 offer an account of the most relevant terms used by specialists in different periods, and indicative of the changes that have taken place; section 5 describes the methodology we have used and also contains information on our GL database and a graphical representation of the data. Finally, the conclusions stress the need to integrate pre-existing or obsolete words and expressions, creating NLP synonym relations.},
  KEYWORDS = {Computational Linguistics, Grey Literature},
  PAGES = {116--120},
  URL = {http://hdl.handle.net/10068/697993},
  ISBN = {978-90-77484-12-8},
  CONFERENCE_NAME = {Tenth International Conference on Grey Literature: Designing the Grey Grid for Information Society},
  CONFERENCE_PLACE = {Amsterdam},
  CONFERENCE_DATE = {December 8-9 2008},
  EDITOR = {Farace, D. J. and Frantzen, J.},
}

% Technical report (2008) on the "Antonio Zampolli Fund" bibliography and catalogue.
% NOTE(review): record has no INSTITUTION field, which standard techreport styles require.
@TECHREPORT{PARDELLI_2008_TECHREPORT_PSOP_255578,
  AUTHOR = {Pardelli, G. and Sassi, M. and Orsolini, P. and Parrinelli, V.},
  TITLE = {Verso la costruzione di una Biblioteca Digitale},
  YEAR = {2008},
  ABSTRACT = {A data base of the "Antonio Zampolli Fund" has been created and the respective catalogue has been published. The work of analysis and selection of texts for cataloguing helped in creating this bibliography, in large part built on references extracted by books and journals. Very old bibliographical references have also been retrieved by curricula prepared by Professor Zampolli for various projects and commissions.},
  KEYWORDS = {Biblioteca Digitale, Linguistica Computazionale},
  PAGES = {1--43},
  URL = {https://publications.cnr.it/doc/255578},
}

% Conference paper: 3rd Language and Technology Conference (Poznan, 2007).
@INPROCEEDINGS{PARDELLI_2007_INPROCEEDINGS_PSG_84678,
  AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S.},
  TITLE = {A survey on Human Language Technology Terminology},
  YEAR = {2007},
  ABSTRACT = {This article originates from the revision of a 1969 unpublished article by Professor Antonio Zampolli carried out by Gabriella Pardelli and Manuela Sassi, two of his collaborators at the Institute of Computational Linguistics in Pisa. It is a technical report titled "Due Conversazioni sul Panorama Attuale della Linguistica Computazionale", drawn up by Zampolli on the occasion of two lectures at the Istituto di Matematica Ulisse Dini of Florence in June 1969. A synthesis of the introductory part - mainly based on some classifications for the various areas of Computational Linguistics - is reported here because the most interesting from the point of view of the relationship between automatic processing of linguistic data and other sciences. The rich bibliographic part has been extracted as well from the report and used for a terminological statistical analysis. Some sections, for example those on the International Conference on Computational Linguistics of 1969 and on the "Sezione Linguistica" of CNUCE in Pisa, have not - or only partly - been taken into account because already published by Zampolli in other books and journals (and not because considered less important). The whole revised technical report will soon be published in the "Quaderni di Linguistica Computazionale" edited by the Istituto di Linguistica Computazionale. The paper is divided in three parts: the first section is a terminological overview on the use of terms such like Computational Linguistics, Applied Linguistics and Mathematical Linguistics; the second has a statistical approach and shows the graphical representation of terms extracted from bibliographies and used in the 1960s; lastly, the conclusions.
This contribution is a "historical" document which places itself at the beginning of a field which afterwards knew an exceptional development and it highlights both the continuity and the change which brought to the present Human Language Technology.},
  KEYWORDS = {Human Language Technology, Terminology},
  PAGES = {364--368},
  URL = {https://publications.cnr.it/doc/84678},
  PUBLISHER = {Wydawnictwo Poznanskie Sp. z o. o (Poznan, POL)},
  ISBN = {978-90-77484-17-3},
  CONFERENCE_NAME = {3rd Language \& Technology Conference},
  CONFERENCE_PLACE = {Poznan},
  CONFERENCE_DATE = {october 5-7, 2007},
  BOOKTITLE = {Human Language Technologies as a Challenge for Computer Science and Linguistics},
  EDITOR = {Vetulani, Z.},
}

% Conference paper: LREC 2006, 5th International Conference on Language Resources and Evaluation (Genoa).
% NOTE(review): record has no BOOKTITLE; standard inproceedings styles expect one.
@INPROCEEDINGS{PARDELLI_2006_INPROCEEDINGS_PSGO_84640,
  AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S. and Orsolini, P.},
  TITLE = {Natural Language Processing: A Terminological and Statistical Approach},
  YEAR = {2006},
  ABSTRACT = {The aim of this article is to provide a statistical representation of significant terms used in the field of Natural Language Processing from the 1960s till nowadays, in order to draft a survey on the most significant research trends in that period. By retrieving these keywords it should be possible to highlight the ebb and flow of some thematic topics. The NLP terminological sample derives from a database created for this purpose using the DBT software (Textual Data Base, ILC patent).},
  KEYWORDS = {Natural Language Processing, Terminology},
  PAGES = {2395--2398},
  URL = {https://publications.cnr.it/doc/84640},
  PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
  ISBN = {2-9517408-2-4},
  CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
  CONFERENCE_PLACE = {Genoa},
  CONFERENCE_DATE = {Genoa, 24-26 May},
}

% Journal article: Archives of Control Sciences (2005).
@ARTICLE{PARDELLI_2005_ARTICLE_PO_255647,
  AUTHOR = {Pardelli, G. and Orsolini, P.},
  TITLE = {Bibliography of Antonio Zampolli (from 1962 to 2004)},
  YEAR = {2005},
  KEYWORDS = {Bibliography, Computational Linguistics},
  PAGES = {501--517},
  URL = {https://publications.cnr.it/doc/255647},
  VOLUME = {15 (LI)},
  PUBLISHER = {Polish Scientific Publishers PWN (Warszawa, Polonia)},
  ISSN = {1230-2384},
  JOURNAL = {Archives of Control Sciences},
}

% Conference contribution: 2nd Language and Technology Conference in memory of Antonio Zampolli (Poznan, 2005).
% NOTE(review): record has no BOOKTITLE; standard inproceedings styles expect one.
@INPROCEEDINGS{PARDELLI_2005_INPROCEEDINGS_PO_84598,
  AUTHOR = {Pardelli, G. and Orsolini, P.},
  TITLE = {``Special Session in Memory of Antonio Zampolli''},
  YEAR = {2005},
  ABSTRACT = {It is certain that this bibliography needs to be further updates but it is with pleasure that we present it during this Special Session dedicated to Antonio Zampolli, along with a short Curriculum vitae. A special thanks goes to Nicoletta Calzolari, Director of the Institute of Computational Linguistics, who always encouraged and supported our work with precious advices.},
  PAGES = {1--50},
  URL = {https://publications.cnr.it/doc/84598},
  CONFERENCE_NAME = {L\&T'05-2nd Language Technologies as a Challenge for Computer Science and Linguistics in Memory of Antonio Zampolli},
  CONFERENCE_PLACE = {Poznan},
  CONFERENCE_DATE = {april 21-23, 2005},
}

% Miscellaneous record carrying only authors, title, year and URL.
@MISC{PARDELLI_2005_MISC_PSGO_151553,
  AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S. and Orsolini, P.},
  TITLE = {NLPterminology},
  YEAR = {2005},
  URL = {https://publications.cnr.it/doc/151553},
}

% Conference paper: LREC 2004, Fourth International Conference on Language Resources and Evaluation.
% NOTE(review): record has no BOOKTITLE; standard inproceedings styles expect one.
@INPROCEEDINGS{PARDELLI_2004_INPROCEEDINGS_PSG_84614,
  AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S.},
  TITLE = {From Weaver to the ALPAC Report},
  YEAR = {2004},
  ABSTRACT = {This paper presents a sample pertaining to the creation and the use of words in the field of Natural Language Processing (NLP) in the years 1949-1966.
These words have been statistically sorted and the results could be taken as a proof that electronic processing of linguistic data leads to the diffusion of clear and concise words for describing a complex concept which would need a circumlocution to be described instead. The aim of this article is to provide an evolutionary overview of these new lexical forms in the various languages for the period taken into account and, whereas possible, a data register and a tabular representation have been prepared as well.}, KEYWORDS = {Terminology, Natural Language Processing}, PAGES = {2005-2008}, URL = {https://publications.cnr.it/doc/84614}, PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)}, ISBN = {2-9517408-1-6}, CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation}, CONFERENCE_PLACE = {Lisbona}, CONFERENCE_DATE = {26th, 27th \& 28 May 2004}, EDITOR = {Lino, T. and Xavier, M. F. and Ferreira, F. and Costa, R. and Silvia, R.}, } @ARTICLE{PARDELLI_2003_ARTICLE_P_64490, AUTHOR = {Pardelli, G.}, TITLE = {BIBLOS: historical, philosophical and philological digital library of the Italian National Research Council}, YEAR = {2003}, ABSTRACT = {The BIBLOS project was established in 1996 for the purpose of creating an Internet site which would combine and organise all the information gathered by the various branches of the National Research Council (CNR) relating to the Humanities. The browsing system is based on a subject catalogue which represents the main access to the file, and which includes information on three different research topics: linguistics, philosophy and antiquities. 
The Istitutes have already made available the information collected from their research activity and the databases which have been developed, usually in the form of bibliographic catalogues and specialised bibliographies.}, KEYWORDS = {IT for Library, Biblioteche virtuali, Documentazione, Catalogazione, CNR}, PAGES = {519-549}, URL = {https://publications.cnr.it/doc/64490}, VOLUME = {Anno XVIII-XIX, 1998-1999}, DOI = {10.1400/18171}, PUBLISHER = {Giardini editori e stampatori (Pisa, Italia)}, ISSN = {0392-6907}, JOURNAL = {Linguistica computazionale (Testo stamp.)}, } @TECHREPORT{ENEA_2003_TECHREPORT_EPOF_157340, AUTHOR = {Enea, A. and Pardelli, G. and Orsolini, P. and Fiorentini, G.}, TITLE = {Pubblicazioni ILC sul WEB}, YEAR = {2003}, URL = {https://publications.cnr.it/doc/157340}, } @MISC{ENEA_2003_MISC_EPOF_157336, AUTHOR = {Enea, A. and Pardelli, G. and Orsolini, P. and Fiorentini, G.}, TITLE = {Banca dati delle Pubblicazioni ILC sul WEB}, YEAR = {2003}, ABSTRACT = {Il repertorio delle pubblicazioni scientifiche dell'Istituto di Linguistica Computazionale disponibile in Internet è strutturato per censire i prodotti dell'attività di ricerca: Libri e loro capitoli; Articoli su riviste scientifiche nazionali e internazionali; Articoli in atti di convegni nazionali e internazionali; Deliverable di progetti comunitari; Rapporti tecnici e CD-Rom. Da pochi anni si sono aggiunte anche le pubblicazioni fruibili da Internet, in particolare dalle riviste elettroniche. A questa nuova tipologia appartengono anche alcuni riferimenti bibliografici delle pubblicazioni ILC. 
I riferimenti bibliografici si riconducono al: 1) Trattamento Automatico della Lingua, comprendente: risorse linguistiche (corpora testuali, lessici, thesauri), reti concettuali, strumenti di analisi linguistica del testo, strumenti di estrazione e rappresentazione del contenuto testuale; 2) Analisi filologica, letteraria e linguistica del testo: sistemi di gestione di basi di dati testuali, lessicali e dialettali, strumenti multimediali per lo studio della tradizione del testo, strumenti per la documentazione, conservazione e fruizione del patrimonio linguistico-culturale; 3) Applicazioni di varia natura: Traduzione automatica; Strumenti multimediali per la didattica e la disabilità; Tecnologie per il filtraggio di contenuti internet a tutela dei minori; Strumenti multilingue; Generazione automatica; Ontologia; Web Semantico. La descrizione delle scelte tecnologiche e del software utilizzato è descritta nella pubblicazione allegata.}, KEYWORDS = {Bibliografia, Linguistica Computazionale}, URL = {http://www.ilc.cnr.it/viewpage.php/sez=ricerca/id=58/vers=ita}, } @BOOK{PARDELLI_2002_BOOK_POSEG_231725, AUTHOR = {Pardelli, G. and Orsolini, P. and Sassi, M. and Enea, A. and Gazzetti, S.}, TITLE = {TAL Bibliography (1951-2002). Parte I}, YEAR = {2002}, ABSTRACT = {Il presente catalogo contiene molte delle bibliografie del Trattamento Automatico della Lingua TAL a partire dal secondo dopoguerra ad oggi e diverse bibliografie di opere di linguistica generale variamente collegate alla linguistica Computazionale CL, in varie formulazioni: glossematica, grammatica trasformazionale-generativa, fonetica, stilistica linguistica, psicolinguistica, sociolinguistica, didattica delle lingue, filosofia del linguaggio, storia della lingua, funzionalismo praghese, prosodismo inglese, ecc.. Sono compresi, inoltre, alcuni riferimenti alla documentazione di alcuni linguaggi di programmazione evoluti adatti alla elaborazione di dati linguistici. 
La tipologia delle opere presenti nel seguente catalogo sinteticamente può ricondursi a: - Le prime testimonianze del trattamento automatico del linguaggio: Busa (1951); - Atti di Congressi e Conferenze di varie Associazioni Internazionali (ACL, ALLC, COLING, TAL, ACLA, AILA, ecc.), tra i principali possiamo citare quelli dei congressi di CL tenuti a Yorktown Heights (IBM-64), a Grenoble (CITAL-67), a Praga (1968) e a Bergen (COLING-78); - Opere generali o introduttive delle applicazioni del calcolatore alle ricerche umanistiche e letterarie. Un esempio è dato dalla pubblicazione di F. De Tollenaere: i lavori presentati in questo survey del 1962 si riferiscono a ricerche nel settore Humanities di vari paesi: Stati Uniti, Inghilterra, Francia, Italia, Belgio, Olanda, Unione Sovietica, Cecoslovacchia, ecc. In questo gruppo, per la lessicografia, ricordiamo i due colloqui di Praga (1967) e di Pisa (1970)0; - Opere sull'uso di modelli matematici nella linguistica (Garvin, Maegaard). Gli argomenti trattati in queste opere nella maggior parte dei casi fanno riferimento a: 1. Valutazione statistica: compilazione di liste, dizionari, indici e di ricerche statistiche in genere (livello distribuzionale); 2. Elaborazione algoritmica dei sistemi sintattici e di vari modelli di acquisizione del linguaggio (livello sintattico); 3. Elaborazione automatica del contenuto del linguaggio (livello semantico); 4. Traduzione automatica (per le varie lingue); 5. Lessicografia (classica, romanza, slava, germanica, biblica, concordanze, indici e studi dialettologici, ecc.). E' stato possibile individuare le tematiche principali e gli argomenti più ricorrenti della soggettazione attraverso l'analisi di circa 5000 documenti nel settore del TAL. Mantenere una terminologia comune (normalizzazione) della soggettazione non è stato sempre possibile. 
L'interdisciplinarietà, sempre più praticata dopo gli anni '50, dovuta all'incontro dei metodi della linguistica con altre discipline e la terminologia dei primi anni in questo settore di indagine, ci avrebbero condotto alla dispersione dei soggetti, che sono stati rivisti in funzione di una maggiore omogeinità. I testi che studiano il linguaggio e i sistemi di automazione nelle ricerche e nelle analisi linguistiche sono stati descritti nel database principalmente in inglese e occasionalmente in francese per casi particolari (v. nell'indice dei Soggetti: Traduction Mécanique /Traduction Automatique) per rispettarne le prime testimonianze. Abbiamo preferito mantenere descrittori simili per evidenziare l'evoluzione della terminologia usata nei testi nel corso degli anni (v.: Automatic ... /Automated ...). Abbiamo evitato, per quanto possibile, l'uso di termini di eccessivo tecnicismo: ciò per rendere più agevole la ricerca attraverso Internet da parte di un'utenza non sempre specialistica. Il lavoro di soggettazione, analisi e selezione dei documenti per la costruzione di questo archivio è stato svolto da Gabriella Pardelli. Il software CDS-ISIS dell'Unesco è stato utilizzato per gli standard catalografici e, allo scopo, è stato attivato un server per l'accesso simultaneo al database. Il supporto informatico, anche per ciò che concerne il rilevamento dei dati per le indagini statistiche come il recupero automatico dei tag di sottocampo dei record bibliografici (lingua, paese, argomento, ecc.) è stato fornito interamente da Alessandro Enea. Paola Orsolini e Silvia Gazzetti si sono occupate del lavoro di catalogazione. L'elaborazione del catalogo generato dal database ISIS è stata effettuata da Manuela Sassi.}, KEYWORDS = {Bibliografia, Linguistica Computazionale}, PAGES = {1-187}, URL = {http://www.biblos.cnr.it/04_2_TALb.html}, PUBLISHER = {S. T. A. R. Servizio Tecnografico Area Ricerca CNR (Pisa, ITA)}, } @MISC{CECCOTTI_2002_MISC_CPS_242344, AUTHOR = {Ceccotti, M. 
L. and Pardelli, G. and Sassi, M.}, TITLE = {Per un'analisi del lessico linguistico-computazionale: da Weaver all'ALPAC Report}, YEAR = {2002}, ABSTRACT = {In questo report proponiamo una breve presentazione della 'preistoria' della linguistica computazionale, del periodo compreso tra la pubblicazione del memorandum di Warren Weaver del 1949 e del Report dell'Alpac del 1966. La preistoria della CL vuol dire essenzialmente traduzione automatica, dizionari di macchina, etc., attività di ricerca svolte da matematici, fisici. L'inglese è la lingua veicolo di tutto ciò e continuerà ad esserlo ancora per anni prima che anche in Europa - eccezione è l'Inghilterra - e nel resto del mondo siano tentate traduzioni, adattamenti, proposte, che guidano i primi passi della ricerca in questi ambiti.}, KEYWORDS = {Lessico linguistico-computazionale}, URL = {https://publications.cnr.it/doc/242344}, } @TECHREPORT{PARDELLI_2001_TECHREPORT_PC_241747, AUTHOR = {Pardelli, G. and Cignoni, L.}, TITLE = {Entrate Lessicali per il trattamento automatico del linguaggio (TAL)}, YEAR = {2001}, KEYWORDS = {Strumenti informatici, didattiche disciplinari}, PAGES = {1-9}, URL = {https://publications.cnr.it/doc/241747}, } @ARTICLE{LANZA_2000_ARTICLE_LP_229315, AUTHOR = {Lanza, C. and Pardelli, G.}, TITLE = {Una soggettazione automatica di letteratura grigia con algoritmi di rete neurale artificiale. Due esperimenti ICAS e ILC}, YEAR = {2000}, ABSTRACT = {The aim of this work is to create an automatic subject classification of grey literature documents using an artificial neural network. In particular, a software simulator of neural network with back-propagation learning scheme was used; training of the network was carried out on around 300 documents. The prototype developed follows the steps which were performed during the learning, the processing and the network querying phase. 
The analysis of the final tests provides targets to be referred to the percentage of document classification error for each subject. From this data it is possible to evince possible document-subject correlations and/or subject-subject correlations in order to construct a relational Database of the scientific documents available at the Institute of Computational Linguistics and at the Institute of Instrumental Analitical Chemistry.}, KEYWORDS = {Artificial Neural Network, IT for Library, Data Mining}, PAGES = {52-56}, URL = {https://publications.cnr.it/doc/229315}, VOLUME = {67}, PUBLISHER = {Istituto superiore di sanità (Roma, Italia)}, ISSN = {0393-5620}, JOURNAL = {ISTISAN congressi}, } @INPROCEEDINGS{CECCOTTI_2000_INPROCEEDINGS_CSP_228142, AUTHOR = {Ceccotti, M. L. and Sassi, M. and Pardelli, G.}, TITLE = {Un laboratorio multimediale dedicato a Carlo Emilio Gadda: il modello e i primi dati implementati in formato XML}, YEAR = {2000}, ABSTRACT = {In this paper we present of the Italian National Council of Research titled "Gadda 's Electronic Archive: Lexicographical and bibliographical Tools in XML". The text is made of two sections: in the first, we present Gadda's Electronic Archive, implemented at the ILC, and in the second, we show the project's objectives and the results achieved in the first months of work.}, KEYWORDS = {Gadda's Electronic Archive}, PAGES = {267-271}, URL = {https://publications.cnr.it/doc/228142}, PUBLISHER = {Associazione Italiana per l'Informatica ed il Calcolo Automatico (AICA) (Milano, ITA)}, CONFERENCE_NAME = {XXXVIII Congresso Annuale AICA: Le tecnologie dell'Informazione e della Comunicazione come sviluppo del Paese}, CONFERENCE_PLACE = {Taormina}, CONFERENCE_DATE = {27-30 Settembre}, } @INPROCEEDINGS{CECCOTTI_2000_INPROCEEDINGS_CSP_231335, AUTHOR = {Ceccotti, M. L. and Sassi, M. and Pardelli, G.}, TITLE = {Il soccorso informatico per lo studio di un autore difficile, C. E. 
Gadda}, YEAR = {2000}, ABSTRACT = {Nella prima parte di questo contributo si illustreranno le caratteristiche dell'Archivio Gadda in DBT, frutto di un lungo lavoro redazionale di transcodifica e di codifica. Nella seconda sarà brevemente descritta e motivata la realizzabilità di un sito web su Gadda, un modello di 'laboratorio culturale' che costituito inizialmente da alcuni brani gaddiani, da nostre recenti pubblicazioni, da dati bibliografici, potrebbe essere arricchito dall'apporto del lettore di Gadda, studioso,. studente, curioso...}, KEYWORDS = {Gadda C. E}, PAGES = {149-154}, URL = {https://publications.cnr.it/doc/231335}, PUBLISHER = {Associazione Italiana per l'Informatica ed il Calcolo Automatico (AICA) (Milano, ITA)}, CONFERENCE_NAME = {DIDAMATICA 2000, Informatica per la Didattica}, CONFERENCE_PLACE = {Cesena}, CONFERENCE_DATE = {4-5-6 maggio 2000}, BOOKTITLE = {Atti 1. Lavori Scientifici}, EDITOR = {Andronico, A. and Casadei, G. and Sacerdoti, G.}, } @INPROCEEDINGS{LANZA_2000_INPROCEEDINGS_LP_226416, AUTHOR = {Lanza, C. and Pardelli, G.}, TITLE = {Una soggettazione automatica di letteratura grigia con algoritmi di rete neurale artificiale. Due esperimenti ICAS e ILC}, YEAR = {2000}, ABSTRACT = {The aim of this work is to create an automatic subject classification of grey literature documents using an artificial neural network. In particular, a software simulator of neural network with back-propagation learning scheme was used; training of the network was carried out on around 300 documents. The prototype developed follows the steps which were performed during the learning, the processing and the network querying phase. The analysis of the final tests provides targets to be referred to the percentage of document classification error for each subject. 
From this data it is possible to evince possible document-subject correlations and/or subject-subject correlations in order to construct a relational Database of the scientific documents available at the Institute of Computational Linguistics and at the Institute of Instrumental Analitical Chemistry.}, KEYWORDS = {Artificial Neural Network, IT for Library, Data Mining}, PAGES = {52-56}, URL = {https://publications.cnr.it/doc/226416}, VOLUME = {67}, PUBLISHER = {Istituto Superiore di Sanità (Roma, ITA)}, CONFERENCE_NAME = {La letteratura grigia: politica e pratica. 3° Convegno Nazionale}, CONFERENCE_PLACE = {Roma}, CONFERENCE_DATE = {25-26 novembre 1999}, BOOKTITLE = {La letteratura grigia: politica e pratica}, EDITOR = {Alberani, V. and De Castro, P.}, } @INPROCEEDINGS{PARDELLI_1999_INPROCEEDINGS_P_241865, AUTHOR = {Pardelli, G.}, TITLE = {I risultati del Progetto BIBLOS}, YEAR = {1999}, ABSTRACT = {Il sito di BIBLOS e' entrato ufficialmente in servizio con questa Conferenza quando e' stato presentato presso la Sede Centrale del CNR (Aula Marconi). In tale occasione i responsabili delle Unità Operative degli Istituti del Comitato 08 hanno presentato i risultati raggiunti, in particolare il catalogo a soggetto. In tale occasione è stato presentato il soggettario e il prototipo bibliografico dell'unità operativa ILC.}, KEYWORDS = {Biblos Project}, URL = {https://publications.cnr.it/doc/241865}, CONFERENCE_NAME = {BIBLOS Biblioteca virtuale del settore Storico Filosofico e Filologico del Consiglio Nazionale delle Ricerche: I risultati del Progetto BIBLOS: la telematica al servizio della cultura umanistica}, CONFERENCE_PLACE = {Roma}, CONFERENCE_DATE = {16 novembre 1999}, } @BOOK{PARDELLI_1998_BOOK_PS_255948, AUTHOR = {Pardelli, G. and Sassi, M.}, TITLE = {I. L. C. Library}, YEAR = {1998}, ABSTRACT = {La stampa del catalogo dell'archivio librario dell'Istituto di Linguistica Computazionale I.L.C. è tratta dall'archivio elettronico. 
La registrazione del materiale bibliografico viene effettuata con il software CDS/ISIS dell'UNESCO. Tale sistema ci permette di descrivere il documento secondo gli standard internazionali. I dati bibliografici dell'archivio sono stati curati da Gabriella Pardelli, responsabile della Biblioteca dell'Istituto, le procedure informatiche relative all'indicizzazione e alla stampa complessiva del catalogo sono state effettuate da Manuela Sassi, Tecnologo dell'Istituto.}, KEYWORDS = {Catalogo, Linguistica Computazionale}, PAGES = {i-253}, URL = {https://publications.cnr.it/doc/255948}, PUBLISHER = {S. T. A. R. Servizio Tecnografico Area Ricerca CNR (Pisa, ITA)}, } @INPROCEEDINGS{LANZA_1998_INPROCEEDINGS_LP_241761, AUTHOR = {Lanza, C. and Pardelli, G.}, TITLE = {Sviluppo delle raccolte e procedure di gestione nelle Biblioteche dell'ICAS e dell'ILC}, YEAR = {1998}, ABSTRACT = {La gestione del materiale bibliografico è rappresentata da una serie di procedure che vanno dall'acquisizione all'accessibilità dei documenti. 
Nel presente articolo abbiamo cercato di illustrare la situazione attuale delle nostre Biblioteche, il contenuto argomentativo, il servizio informativo, l'importanza della cooperazione tra Biblioteche e la necessità di aggiornamento professionale costante per un settore, l'IT for Libray, in continuo divenire.}, KEYWORDS = {Linguistica Computazionale, Chimica Analitica e Strumentale, Biblioteche}, URL = {https://publications.cnr.it/doc/241761}, CONFERENCE_NAME = {La Biblioteca, un Servizio in Rete}, CONFERENCE_PLACE = {Follonica}, CONFERENCE_DATE = {1-2 ottobre 1998}, } @TECHREPORT{PARDELLI_1998_TECHREPORT_P_241822, AUTHOR = {Pardelli, G.}, TITLE = {Verso la costruzione di un soggettario per il Progetto BIBLOS all'Istituto di Linguistica Computazionale}, YEAR = {1998}, ABSTRACT = {This document describes a methodology aimed at building a subject catalogue at the Institute for Computational Linguistics within the framework of the Biblos Project (Virtual Humanities Library of the National Research Council).}, KEYWORDS = {Subject Indexing, Cataloguing Documentation, Progetto BIBLOS}, PAGES = {1-6}, URL = {https://publications.cnr.it/doc/241822}, } @TECHREPORT{PARDELLI_1998_TECHREPORT_PR_241842, AUTHOR = {Pardelli, G. and Rini, S.}, TITLE = {Progetto BIBLOS: realizzazione del prototipo per la messa in linea con INTERNET della banca dati bibliografica dell'Istituto di Linguistica Computazionale}, YEAR = {1998}, ABSTRACT = {INTRODUZIONE Nel presente lavoro abbiamo cercato di illustrare la tipologia e il contenuto argomentativo del materiale documentario, le relative procedure di selezione, di registrazione e di scarto per arrivare alla costruzione del prototipo bibliografico del progetto BIBLOS. L'Istituto di Linguistica Computazionale (ILC) del Consiglio Nazionale delle Ricerche (CNR) afferisce al Comitato per le Scienze Storiche, Filosofiche e Filologiche. 
L' Istituto, nell'ambito della propria area disciplinare, gestisce il patrimonio documentario ed eroga i propri servizi in conformità a quanto previsto nel DPR n.475/87 1 e nel DPR n.417/95 2. La biblioteca dell'Istituto raccoglie e conserva: a) le pubblicazioni di consultazione generale o specializzate acquistate nell'ambito dell'attività scientifica del CNR, indispensabili per studi e ricerche; b) le pubblicazioni che riguardano la ricerca scientifica e tecnologica edita dal CNR o con il suo contributo o sotto il suo patrocinio. La biblioteca dell' Istituto ha quindi il compito di curare la raccolta e la catalogazione di tutto il materiale in suo possesso nonché quello di coordinare il servizio di informazione, mediante l'accesso alle banche dati, per rendere disponibile il recupero di documenti anche attraverso il ricorso alle procedure di prestito interbibliotecario. L'assolvimento di tali compiti e la necessità di soddisfare un'utenza esigente comportano una continua e attenta valutazione nell'acquisizione delle raccolte, di fatto spesso condizionata dal dinamismo dell'attività scientifica. Tale attività genera una letteratura spesso caratterizzata da rapida obsolescenza, benchè certi documenti possano essere richiesti anche dopo molti anni dalla loro pubblicazione, per il valore culturale e storico. 
Tutti questi fattori, non disgiunti dalla razionalizzazione dei fondi destinati alla biblioteca e dallo spazio fisico disponibile, determinano un'attenta valutazione dell'intera attività di gestione.}, KEYWORDS = {Biblos Project}, PAGES = {1-11}, URL = {https://publications.cnr.it/doc/241842}, } @TECHREPORT{PARDELLI_1995_TECHREPORT_P_242262, AUTHOR = {Pardelli, G.}, TITLE = {Verso una catalogazione dei testi della Biblioteca dell'ILC}, YEAR = {1995}, ABSTRACT = {Il report focalizza la titplogia del materiale bibliografico e la scelta dei criteri di soggettazione per la LC.}, KEYWORDS = {Linguistica Computazionale, soggetti argomentativi}, PAGES = {1-12}, URL = {https://publications.cnr.it/doc/242262}, } @BOOK{PARDELLI_1992_BOOK_PSM_241726, AUTHOR = {Pardelli, G. and Sassi, M. and Marinai, E.}, TITLE = {L'Archivio librario dell'I. L. C}, YEAR = {1992}, ABSTRACT = {Questo lavoro nasce dalla richiesta di colleghi e studenti di avere a disposizione un catalogo cartaceo per il reperimento di dati bibliografici del patrimonio librario dell'Istituto di Linguistica Computazionale. La Biblioteca dell'ILC fino a questo momento, infatti, si è avvalsa soltanto del catalogo on-line, attualmente gestito da un sistema informativo basato sulla procedura automatica di spoglio elettronico, DBT (Data Base Testuale), che permette il recupero delle informazioni contenute nell'archivio librario in tempo reale. Il catalogo segue questa strutturazione :a) Introduzione b) Premessa c) Criteri di catalogazione, d)I campi del database e) Esempi di interrogazione f) Indice per argomenti g) Indice per autori .}, KEYWORDS = {Linguistica Computazionale, Cataloghi, Sistema DBT}, PAGES = {1-131}, URL = {https://publications.cnr.it/doc/241726}, PUBLISHER = {S. T. A. R. Servizio Tecnografico Area Ricerca CNR (Pisa, ITA)}, } @MISC{ZAMPOLLI_1989_MISC_ZMP_242294, AUTHOR = {Zampolli, A. and Marinelli, R. 
and Pardelli, G.}, TITLE = {I sistemi di documentazione dell'ILC}, YEAR = {1989}, ABSTRACT = {Il documento si concentra sui punti seguenti: a) Recupero e trasformazione dei materiali codificati su archivi magnetici e costruzione di un sistema informativo per la gestione mista di archivi con dati catalografici normalizzati e dati bibliografici; b) Sistema di gestione dell' d'archivio scientifico per le varie lingue; c) Recupero e trasformazione di informazioni bibliografiche da VM a altro sistema informativo.}, KEYWORDS = {Documentazione, Linguistica Computazionale}, PAGES = {1-13}, URL = {https://publications.cnr.it/doc/242294}, }