[{"id":132242,"last_updated":"2018-09-06 17:57:44","id_people":382393,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"I corpora digitali: dall'obsolescenza tecnologica, alla salvaguardia e alla condivisione","year":2017,"authors_people":"Eva Sassolini, Sebastiana Cucurullo, Alessandra Cinini","authors_cnr":["Cinini, Alessandra","Sassolini, Eva","Cucurullo, Sebastiana"],"authors_cnr_id":["11032","11479"],"authors_cnr_institute":[""],"authors":["Sassolini, E.","Cucurullo, S.","Cinini, A."],"abstract":"Studio e implementazione di un protocollo di recupero, conservazione e valorizzazione di testi e corpora digitali interessati da problemi di obsolescenza tecnologica. Le strategie di salvaguardia adottate si spingono oltre il salvataggio dei testi e la conservazione in un formato di rappresentazione in linea con gli standard internazionali (XML TEI), si pongono come obiettivo la valorizzazione di questo patrimonio attraverso nuove modalit\u00e0 di fruizione dei contenuti. Lo scopo \u00e8 affiancare le funzionalit\u00e0 classiche di analisi testuale, che da sempre caratterizzano le nostre attivit\u00e0 di ricerca, a nuove modalit\u00e0 grafiche e visuali di fruizione dei dati e, in alcuni casi, migrare verso dispositivi mobili e tecnologie App. In questo articolo, oltre al protocollo di recupero, presentiamo due sperimentazioni di valorizzazione di contenuti testuali. Nel primo caso proponiamo tecniche di visual analytics applicate ad un corpus testuale semi strutturato riguardante corrispondenza redatta in lingua italiana del 1600. 
Nel secondo caso abbiamo realizzato un'applicazione per sistema Android finalizzata all'interrogazione di dati testuali relativi ad un progetto di censimento di architetture moderne della regione Liguria.","keywords":["Testi digitali","Analisi testuale","Preservazione dei dati","Diffusione dei risultati"],"pages":"31-35","url":"https:\/\/www.garr.it\/it\/documenti\/3529-conferenza-2016-selected-papers-sassolini-et-al\/file","volume":"","doi":"10.26314\/GARR-Conf16-proceeedings-06","editors_people":"","editors":[""],"published":"","publisher":"Consortium GARR (Roma, ITA)","issn":"","isbn":"978-88-905077-6-2","conference_name":"Conferenza GARR 2016-The CreActive Network","conference_place":"Firenze","conference_date":"30\/11\/2016-02\/12\/2016"},{"id":132246,"last_updated":"2018-09-06 17:57:45","id_people":382931,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Rapporto Tecnico: Standardizzazione del corpus testuale del PRIN Crusca","year":2017,"authors_people":"Alessandra Cinini, Sebastiana Cucurullo, Eva Sassolini","authors_cnr":["Cinini, Alessandra","Sassolini, Eva","Cucurullo, Sebastiana"],"authors_cnr_id":["11032","11479"],"authors_cnr_institute":[""],"authors":["Cinini, A.","Cucurullo, S.","Sassolini, E."],"abstract":"Attivit\u00e0 previste nella convenzione operativa tra ILC-CNR e Accademia della Crusca che riguardano la progettazione e lo sviluppo di una piattaforma Web modulare per l'archiviazione, la gestione e l'interrogazione di corpora testuali in lingua italiana, con funzionalit\u00e0 derivate dal DBT (Data Base Testuale) nelle sue diverse implementazioni.Il lavoro preliminare svolto riguarda anche la normalizzazione dei testi e la conversione nello standard di rappresentazione XML TEI.","keywords":["Codifica dei testi","Analisi testuale","formato XML 
TEI"],"pages":"1-21","url":"https:\/\/publications.cnr.it\/doc\/382931","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132134,"last_updated":"2017-03-01 11:09:01","id_people":359168,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"ALT Explored: Integrating an Online Dialectometric Tool and an Online Dialect Atlas","year":2016,"authors_people":"Martijn Wieling, Eva Sassolini, Sebastiana Cucurullo and Simonetta Montemagni","authors_cnr":["Montemagni, Simonetta","Sassolini, Eva","Cucurullo, Sebastiana"],"authors_cnr_id":["5595","11032","11479"],"authors_cnr_institute":[""],"authors":["Wieling, M.","Sassolini, E.","Cucurullo, S.","Montemagni, S."],"abstract":"In this paper, we illustrate the integration of an online dialectometric tool, Gabmap, together with an online dialect atlas, the Atlante Lessicale Toscano (ALT-Web). By using a newly created url-based interface to Gabmap, ALT-Web is able to take advantage of the sophisticated dialect visualization and exploration options incorporated in Gabmap. For example, distribution maps showing the distribution in the Tuscan dialect area of a specific dialectal form (selected via the ALT-Web website) are easily obtainable. Furthermore, the complete ALT-Web dataset as well as subsets of the data (selected via the ALT-Web website) can be automatically uploaded and explored in Gabmap. 
By combining these two online applications, macro- and micro-analyses of dialectal data (respectively offered by Gabmap and ALT-Web) are effectively and dynamically combined.","keywords":["Lexicon","Lexical Database","Tools","Systems","Applications"],"pages":"3265-3272","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2016\/index.html","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-2-9517408-9-1","conference_name":"LREC 2016","conference_place":"Portoro\u017e, Slovenia","conference_date":"23\/10\/2016"},{"id":132243,"last_updated":"2018-09-06 17:57:47","id_people":382394,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"I corpora digitali: dall'obsolescenza tecnologica, alla salvaguardia e alla condivisione","year":2016,"authors_people":"Eva Sassolini, Sebastiana Cucurullo, Alessandra Cinini","authors_cnr":["Cinini, Alessandra","Sassolini, Eva","Cucurullo, Sebastiana"],"authors_cnr_id":["11032","11479"],"authors_cnr_institute":[""],"authors":["Sassolini, E.","Cucurullo, S.","Cinini, A."],"abstract":"Il progetto di recupero, nato pochi anni fa come iniziativa fortemente voluta da ILC, prosegue oggi con la collaborazione di molte istituzioni pubbliche e private, impegnate sullo stesso fronte. Approccio al recupero a tappe: inizialmente lavorando su testi che erano stati prodotti per essere indicizzati con le prime procedure di analisi testuale presenti all'ILC sin dalla fine degli anni '70 del secolo scorso. 
Definizione di criteri da adottare per la scelta dei testi, basati sullo studio di casi significativi e sull'importanza dei materiali, spesso legati alla realizzazione di autorevoli progetti nazionali e internazionali.","keywords":["recupero testi","conversione in formato XML","valorizzazione dei risultati"],"pages":"1-3","url":"https:\/\/www.eventi.garr.it\/it\/conf16\/home\/materiali-conferenza-2016\/paper","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Conferenza GARR 2016-The CreActive Network","conference_place":"Firenze","conference_date":"30\/11\/2016-02\/12\/2016"},{"id":131805,"last_updated":"2016-04-12 15:45:21","id_people":353217,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Sviluppo di funzioni software per il recupero di testi dell'Archivio Testuale dell'ILC e conversione in un formato di rappresentazione XML\/TEI","year":2015,"authors_people":"Cucurullo Sebastiana","authors_cnr":["Cucurullo, Sebastiana"],"authors_cnr_id":["11479"],"authors_cnr_institute":[""],"authors":["Cucurullo, S."],"abstract":"Il presente rapporto documenta le attivit\u00e0 svolte nell'ambito della Convenzione Operativa relativa allo sviluppo di funzioni software per il recupero di testi dell'Archivio Testuale dell'ILC e la conversione in un formato di rappresentazione XML\/TEI, stipulata all'interno dell'Accordo di Collaborazione Scientifica ILC-CNR - Accademia della Crusca. In particolare, il rapporto si focalizza sui seguenti punti oggetto della Convenzione Operativa: 1. definizione di un formato di rappresentazione XML\/TEI che tenga conto da un lato della tipologia di annotazioni presenti nei testi di partenza e dall'altro delle analisi ed elaborazioni a cui i testi convertiti dovranno essere sottoposti; 2. sviluppo di procedure di conversione dal formato dei \"Periodici Milanesi\" al formato XML\/TEI e verifica dei risultati mediante parsing XML. 
Il Rapporto ripercorre le diverse fasi del lavoro, con particolare attenzione all'analisi dell'archivio testuale di partenza e ai risultati raggiunti, per arrivare a una discussione delle questioni che rimangono al momento aperte e degli sviluppi che possono prospettarsi per tali attivit\u00e0.","keywords":["banca-dati testuale","Periodici Milanesi"],"pages":"43","url":"https:\/\/publications.cnr.it\/doc\/353217","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132106,"last_updated":"2016-04-19 13:05:23","id_people":353218,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Sviluppo di funzioni software per il recupero di testi dell'Archivio Testuale dell' ILC e conversione in un formato di rappresentazione XML\/TEI Fase 2","year":2015,"authors_people":"Cucurullo Sebastiana","authors_cnr":["Cucurullo, Sebastiana"],"authors_cnr_id":["11479"],"authors_cnr_institute":[""],"authors":["Cucurullo, S."],"abstract":"Il presente rapporto documenta le attivit\u00e0 svolte nell'ambito della Convenzione Operativa relativa allo sviluppo di funzioni software per il recupero di testi dell'Archivio Testuale dell'ILC e la conversione in un formato di rappresentazione XML\/TEI, stipulata all'interno dell'Accordo di Collaborazione Scientifica ILC-CNR - Accademia della Crusca. In particolare, questo rapporto si focalizza sul seguente oggetto della Convenzione Operativa: \"sviluppo di procedure di conversione dal formato DBT al formato XML\/TEI, secondo le indicazioni contenute nel Report relativo alla Fase 1 e verifica dei risultati mediante parsing XML costituito dal corpus dell'800 e '900 di testi estratto dal Patrimonio Testuale ILC, la cui composizione \u00e8 stata concordata con l'Accademia della Crusca\". 
Buona parte delle soluzioni adottate per quella tipologia di testi \u00e8 stata scelta per essere utilizzata anche in testi non lemmatizzati, come nel caso di opere di autori italiani dell'Ottocento e del Novecento. La strutturazione generale del documento XML TEI in header e body e la definizione dei principali TAG utilizzati \u00e8 condivisa sia dai testi di questo Corpus che da quelli lemmatizzati dei Periodici Milanesi, da cui siamo partiti perch\u00e9 presentavano una maggiore casistica di codifiche e contemporaneamente un formato di origine pi\u00f9 lontano nel tempo. Si tratta infatti di formati e supporti di memorizzazione che precedono l'era del Personal Computer e che hanno gi\u00e0 subito la trasformazione da EBCDIC ad ASCII.","keywords":["Archivi Testuali"],"pages":"21","url":"https:\/\/publications.cnr.it\/doc\/353218","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132306,"last_updated":"2018-09-07 12:08:15","id_people":319040,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Industrial Philology: Problems and techniques of data and archives preservation for future generations","year":2014,"authors_people":"Sassolini, Eva; Sassi, Manuela; Cucurullo, Sebastiana; Cinini, Alessandra; Sbrulli, Stefano","authors_cnr":["Cucurullo, Sebastiana","Cinini, Alessandra","Sbrulli, Stefano","Sassolini, Eva","Sassi, Manuela"],"authors_cnr_id":["11032","19592"],"authors_cnr_institute":[""],"authors":["Sassolini, E.","Sassi, M.","Cucurullo, S.","Cinini, A.","Sbrulli, S."],"abstract":"The main objective of digital archiving of texts is their re-use and preservation. 
The concept that guides these initiatives is linked to structural and organizational needs which heavily influence the definition of the format specifications that describe the organisation of the archives at various levels and consists of a more or less complex document. A format specification provides the details needed to build a file from a text, establishes the admitted encodings and software applications that can decode the file and make its content accessible. These structural specifications can have an extremely variable size and they depend on the complexity of the format. Although some format specifications are, for the most part, independent of the specific software (for example, ASCII and Unicode codes), many of them are related to the historical period in which the texts were acquired and also by dated software technologies. The file format specification should evolve hand in hand with the related software, and the fate of one is in fact often linked to that of the other. It is therefore appropriate to face the issue of obsolescence of software together with the obsolescence of file formats and of storage medium.","keywords":["text management","text analysis"],"pages":"168-172","url":"https:\/\/publications.cnr.it\/doc\/319040","volume":"","doi":"","editors_people":"","editors":[""],"published":"The GL-conference series. 
Conference proceedings","publisher":"TransAtlantic (Amsterdam, Paesi Bassi)","issn":"1386-2316","isbn":"978-90-77484-22-7","conference_name":"GL15: Fifteenth International Conference on Grey Literature","conference_place":"Bratislava","conference_date":"2, 3 december 2013"},{"id":131797,"last_updated":"2016-05-20 12:04:33","id_people":353214,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Il Contributo Tecnologico dell'ILC al Progetto LinCi","year":2013,"authors_people":"Cucurullo Sebastiana, Sassi Manuela","authors_cnr":["Cucurullo, Sebastiana","Sassi, Manuela"],"authors_cnr_id":["11479","19592"],"authors_cnr_institute":["048","048"],"authors":["Cucurullo, S.","Sassi, M."],"abstract":"Il progetto \"la Lingua delle Citt\u00e0 (LinCi)\" ha l'obiettivo di mettere in luce alcuni fenomeni rilevanti - sia dal punto di vista lessicale che grammaticale - dell'italiano comune e informale, secondo l'opinione sull'uso dei parlanti intervistati. A tale scopo il gruppo dei linguisti che ha ideato il progetto ha elaborato un questionario di 200 domande riconducibili a vari campi semantici. La struttura del questionario consente inoltre al raccoglitore di ricavare informazioni di tipo grammaticale (per esempio sull'uso di certe forme pronominali o verbali), nonch\u00e9 giudizi di carattere metalinguistico sulla \"dialettalit\u00e0\" o meno di certe forme, sulle differenze tra registro formale e informale, sulla frequenza d'uso.","keywords":["lingua italiana","banche dati"],"pages":"81-99","url":"https:\/\/publications.cnr.it\/doc\/353214","volume":"","doi":"","editors_people":"Annalisa Nesi, Teresa Poggi Salani","editors":["Nesi, A.","Salani, T. P."],"published":"La lingua delle citt\u00e0 LinCi. 
La banca dati","publisher":"Accademia della Crusca (Firenze, ITA)","issn":"","isbn":"978-88-89369-51-7","conference_name":"","conference_place":"","conference_date":""},{"id":131807,"last_updated":"2016-05-20 12:04:32","id_people":353219,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"ASPETTI TECNICO-METODOLOGICI DEL PROGETTO LinCi","year":2013,"authors_people":"Cucurullo Sebastiana, Sassi Manuela","authors_cnr":["Cucurullo, Sebastiana","Sassi, Manuela"],"authors_cnr_id":["11479","19592"],"authors_cnr_institute":["048","048"],"authors":["Cucurullo, S.","Sassi, M."],"abstract":"Il progetto \"la Lingua delle Citt\u00e0 (LinCi)\" ha l'obiettivo di mettere in luce i cambiamenti e l'evoluzione dei diversi dialetti italiani regionali, sia dal punto di vista grammaticale che lessicale. A tale scopo, \u00e8 stato elaborato un questionario di 200 domande su vari campi semantici: determinazioni temporali; forme di saluto; corpo umano; mestieri; oggetti domestici; cibi, frutta e verdura; rapporti sociali, ecc. La struttura del questionario consente inoltre al raccoglitore di ricavare informazioni di tipo grammaticale (per esempio sull'uso di certe forme pronominali e verbali), nonch\u00e9 giudizi di carattere metalinguistico, sulla \"dialettalit\u00e0\" o meno di certe forme, sulle differenze tra registro formale e informale, ecc. 
La collaborazione dell'Istituto di Linguistica Computazionale (ILC) al Progetto LinCi ha come obiettivo quello di fornire il supporto informatico all'unit\u00e0 di coordinamento per la creazione e gestione della banca-dati e la sua consultazione tramite il sito dedicato.","keywords":["Sociolinguistica","banca-dati DBT"],"pages":"47-50","url":"https:\/\/publications.cnr.it\/doc\/353219","volume":"11","doi":"","editors_people":"Annalisa Nesi","editors":["Nesi, A."],"published":"La lingua delle citt\u00e0 Raccolta di studi","publisher":"Franco Cesati Editore (Firenze, ITA)","issn":"","isbn":"9788876674563","conference_name":"","conference_place":"","conference_date":""},{"id":131717,"last_updated":"2015-08-04 12:31:38","id_people":206469,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Archivio Elettronico delle Concordanze Diacroniche dell'Orlando Furioso","year":2011,"authors_people":"Sebastiana Cucurullo, Manuela Sassi","authors_cnr":["Cucurullo, Sebastiana","Sassi, Manuela"],"authors_cnr_id":["11479","19592"],"authors_cnr_institute":["048","048"],"authors":["Cucurullo, S.","Sassi, M."],"abstract":"The project to build a digital electronic archiving of the concordances diachronic Orlando Furioso began in the '70s and had as its objective the study of a computational method for the treatment of variants.The basic text, provided by the \"Accademia della Crusca\", refers to the latest edition published in 1532 by the author, while the first 2 editions, published respectively in 1516 and in 1521, had not yet been the subject of electronic transcription. 
This has directed the staff of the project towards a reconstruction of the previous witnesses through accurate recording of the critical apparatus Debenedetti - Segre, 1960.","keywords":["DBT","Orlando Furioso","banca-dati testuale"],"pages":"11","url":"https:\/\/publications.cnr.it\/doc\/206469","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131380,"last_updated":"2015-08-04 12:31:42","id_people":136468,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Visual information to improve a lexical-semantic terminological resource","year":2010,"authors_people":"Marinelli R.; Spadoni G.; Cucurullo S.","authors_cnr":["Cucurullo, Sebastiana","Marinelli, Rita"],"authors_cnr_id":["11479","13100"],"authors_cnr_institute":[""],"authors":["Marinelli, R.","Spadoni, G.","Cucurullo, S."],"abstract":"The lexical semantic database MariTerm contains structured information about the specialized terminology of the maritime domain (maritime navigation and transport). This paper describes the main phases of a project which aims to enhance the terminological database by means of a set of images: a) the structure of the terminological database; b) the domain conceptual modelling; c) the database management tool which, among its various features, allows visualization on demand of the image which is associated with the term being sought, contributing to clarification of the meaning of the term and increasing its information and communication potential.","keywords":["terminology","computational resources","terminological databases","visual information"],"pages":"493-500","url":"https:\/\/publications.cnr.it\/doc\/136468","volume":"1","doi":"","editors_people":"Rosario Caballero Rodriguez, M. Jesus Pinar Sanz","editors":["Rodriguez, R. C.","Sanz, M. J. 
P."],"published":"Modos y formas de la comunicaci\u00f2n humana-Ways and modes of human communication","publisher":"","issn":"","isbn":"978-84-8427-759-0","conference_name":"","conference_place":"","conference_date":""},{"id":131216,"last_updated":"2015-08-04 12:31:41","id_people":84770,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Lexical Semantic Resources in a Terminological Network","year":2010,"authors_people":"Marinelli R.; Roventini A.; Spadoni G.; Cucurullo S.","authors_cnr":["Cucurullo, Sebastiana","Marinelli, Rita","Roventini, Adriana"],"authors_cnr_id":["11479","13100","18411"],"authors_cnr_institute":[""],"authors":["Marinelli, R.","Roventini, A.","Spadoni, G.","Cucurullo, S."],"abstract":"A research has been carried on and is still in progress aimed at the construction of three specialized lexicons organized as databases of relational type. The three databases contain terms belonging to the specialized knowledge fields of maritime terminology (technical-nautical and maritime transport domain), taxation law, and labour law with union labour rules, respectively. The EuroWordNet\/ItalWordNet model was firstly used to structure the terminological database of maritime domain. The methodology experimented for its construction was applied to construct the next databases. It consists in i) the management of corpora of specialized languages and ii) the use of generic databases to identify and extract a set of candidate terms to be codified in the terminological databases. The three specialized resources are described highlighting the various kinds of lexical semantic relations linking each term to the others within the single terminological database and to the generic resources WordNet and ItalWordNet. 
The construction of these specialized lexicons was carried on in the framework of different projects; but they can be seen as a first nucleus of an organized network of generic and specialized lexicons with the purpose of making the meaning of each term clearer from a cognitive point of view.","keywords":["Lexicon","Semantics","Lexical database","Ontologies"],"pages":"2288-2291","url":"https:\/\/publications.cnr.it\/doc\/84770","volume":"","doi":"","editors_people":"Nicoletta Calzolari, Khalid Choukri, Bente Maegaard, Joseph Mariani, Jan Odjik, Stelios Piperidis, Mike Rosner, Daniel Tapias","editors":["Calzolari, N.","Choukri, K.","Maegaard, B.","Mariani, J.","Odjik, J.","Piperidis, S.","Rosner, M.","Tapias, D."],"published":"LREC'10-Seventh International Conference on Language Resources and Evaluation (La Valletta, Malta, 17-23 May 2010). Proceedings","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"2-9517408-6-7","conference_name":"Seventh International Conference on Language Resources and Evaluation","conference_place":"La Valletta, Malta","conference_date":"17-23 May 2010"},{"id":131237,"last_updated":"2015-08-04 12:31:39","id_people":84795,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Adding information to a terminological database by means of image files","year":2010,"authors_people":"Marinelli R.; Spadoni G.; Cucurullo S.","authors_cnr":["Cucurullo, Sebastiana","Marinelli, Rita"],"authors_cnr_id":["11479","13100"],"authors_cnr_institute":["048","048"],"authors":["Marinelli, R.","Spadoni, G.","Cucurullo, S."],"abstract":"A lexical semantic database containing terms belonging to the specialized lexicon of the maritime navigation and maritime transport was built according to WordNet\/EuroWordNet model. Our paper present a project planning the enrichment of the terminological database by means of a set of images. 
A short description is given about a) the structure of the terminological database and the domain conceptual modelling; b) the various features of the database management tool, and, among all, the possibility of visualizing, on demand, the image which is associated with the term being sought, contributing to clarify and refine the meaning of the term, increasing its information and communication effectiveness.","keywords":["terminology","lexical databases","computational resources","images"],"pages":"347-353","url":"http:\/\/www.cfilt.iitb.ac.in\/gwc2010\/pdfs\/30_adding_image_info_to_wordnet__Marinelli.pdf","volume":"","doi":"","editors_people":"P. Bhattacharyya; C. Fellbaum; P. Vossen.","editors":["Bhattacharyya, P.","Fellbaum, C.","Vossen, P."],"published":"Proceedings of the 5th Global WordNet Conference, Mumbai India, 2010","publisher":"Narosa Publishing House (New Delhi, IND)","issn":"","isbn":"978-81-8487-083-1","conference_name":"5th Global WordNet Conference","conference_place":"Mumbai","conference_date":"January 31-February 4 2010"},{"id":131609,"last_updated":"2015-08-04 12:31:40","id_people":157479,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Descrizione attivit\u00e0 Progetto Servizi innovativi di Business Intelligence e p. m. 
i.: la costituzione di un Sistema di Aziende Estese (BISAE): il modulo ILC","year":2010,"authors_people":"Marinelli R.; Roventini A.; Cucurullo S.","authors_cnr":["Cucurullo, Sebastiana","Marinelli, Rita","Roventini, Adriana"],"authors_cnr_id":["11479","13100","18411"],"authors_cnr_institute":[""],"authors":["Marinelli, R.","Roventini, A.","Cucurullo, S."],"abstract":"","keywords":["Risorse linguistiche, terminologia, database semantico-lessicali, corpora"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157479","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131305,"last_updated":"2015-08-04 12:31:43","id_people":112949,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Visual information to improve a lexical-semantic terminological resource","year":2009,"authors_people":"Marinelli R.; Spadoni G.; Cucurullo S.","authors_cnr":["Cucurullo, Sebastiana","Marinelli, Rita"],"authors_cnr_id":["11479","13100"],"authors_cnr_institute":[""],"authors":["Marinelli, R.","Spadoni, G.","Cucurullo, S."],"abstract":"The lexical semantic database MariTerm contains structured information about the specialized terminology of the maritime domain (maritime navigation and transport). 
This paper describes the main phases of a project which aims to enhance the terminological database by means of a set of images: a) the structure of the terminological database; b) the domain conceptual modelling; c) the database management tool which, among its various features, allows visualization on demand of the image which is associated with the term being sought, contributing to clarification of the meaning of the term and increasing its information and communication potential","keywords":["Lexical Semantic Data Bases","Visual Information","Terminology"],"pages":"159-160","url":"https:\/\/publications.cnr.it\/doc\/112949","volume":"1","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"XXVII AESLA Conference \"Modos y formas de la comunicacion humana-Ways and modes of human communication\"","conference_place":"Ciudad Real","conference_date":"2009"},{"id":131603,"last_updated":"2015-08-04 12:31:44","id_people":157473,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"WP3. 
1 Tecniche di analisi semantica per l'estrazione di ontologie bio-medicali","year":2009,"authors_people":"Picchi Eugenio, Sassolini Eva, Cucurullo Sebastiana, Ensini Monica","authors_cnr":["Sassolini, Eva","Cucurullo, Sebastiana","Picchi, Eugenio"],"authors_cnr_id":["11032","11479","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Sassolini, E.","Cucurullo, S.","Ensini, M."],"abstract":"","keywords":["Ontologie","Semantica computazionale","Terminologia medica"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157473","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131170,"last_updated":"2017-06-21 16:47:29","id_people":84719,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Mining the News with Semantic Press","year":2008,"authors_people":"Picchi E.; Sassolini E.; Cucurullo S.; Bertagna F.","authors_cnr":["Bertagna, Francesca","Cucurullo, Sebastiana","Sassolini, Eva","Cucurullo, Sebastiana","Picchi, Eugenio"],"authors_cnr_id":["11032","11479","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Sassolini, E.","Cucurullo, S.","Bertagna, F."],"abstract":"","keywords":["Text mining","Press review"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84719","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"LangTech 2008","conference_place":"Roma","conference_date":"2008"},{"id":131178,"last_updated":"2015-08-04 12:31:46","id_people":84727,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Semantic Press","year":2008,"authors_people":"Picchi E.; Sassolini E.; Cucurullo S.; Bertagna F.; Baroni P.","authors_cnr":["Bertagna, Francesca","Sassolini, Eva","Baroni, Paola","Cucurullo, Sebastiana","Picchi, 
Eugenio"],"authors_cnr_id":["11032","11332","11479","16688"],"authors_cnr_institute":["048","048","048","048","048"],"authors":["Picchi, E.","Sassolini, E.","Cucurullo, S.","Bertagna, F.","Baroni, P."],"abstract":"In this paper Semantic Press, a tool for the automatic press review, is introduced. It is based on Text Mining technologies and is tailored to meet the needs of the eGovernment and eParticipation communities. First, a general description of the application demands emerging from the eParticipation and eGovernment sectors is offered. Then, an introduction to the framework of the automatic analysis and classification of newspaper content is provided, together with a description of the technologies underlying it.","keywords":["Text Mining","Tools","Systems","Applications"],"pages":"2752-2756","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2008\/","volume":"","doi":"","editors_people":"Nicoletta Calzolari (Conference Chair); Khalid Choukri; Bente Maegaard; Joseph Mariani; Jan Odjik; Stelios Piperidis; Daniel Tapias","editors":["Calzolari, N.","Choukri, K.","Maegaard, B.","Mariani, J.","Odjik, J.","Piperidis, S.","Tapias, D."],"published":"Proceedings of the Sixth International Conference on Language Resources and Evaluation","publisher":"European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)","issn":"","isbn":"2-9517408-4-0","conference_name":"LREC 2008-Sixth International Conference on Language Resources and Evaluation","conference_place":"Marrakech","conference_date":"26\/05\/2008-01\/06\/2008"},{"id":131438,"last_updated":"2009-09-24 00:00:00","id_people":151564,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Lessico italiano radiofonico 1995-2003","year":2008,"authors_people":"Cucurullo S., Picchi E., Biffi M.","authors_cnr":["Cucurullo, Sebastiana","Picchi, Eugenio"],"authors_cnr_id":["16688"],"authors_cnr_institute":[""],"authors":["Cucurullo, 
S.","Picchi, E.","Biffi, M."],"abstract":"","keywords":["Lessico radiofonico","Corpus parlato"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151564","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131439,"last_updated":"2009-09-24 00:00:00","id_people":151565,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Le concordanze diacroniche dell'Orlando Furioso","year":2008,"authors_people":"Cucurullo S., Picchi E., Sassi M., Segre C., Martignoni C., Morini L.","authors_cnr":["Cucurullo, Sebastiana","Picchi, Eugenio","Sassi, Manuela"],"authors_cnr_id":["16688","19592"],"authors_cnr_institute":[""],"authors":["Cucurullo, S.","Picchi, E.","Sassi, M.","Segre, C.","Martignoni, C.","Morini, L."],"abstract":"","keywords":["Furioso, Orlando","Concordanze diacroniche"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151565","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131442,"last_updated":"2009-09-24 00:00:00","id_people":151568,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Semantic Press","year":2008,"authors_people":"Picchi E., Cucurullo S., Sassolini E.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Picchi, Eugenio"],"authors_cnr_id":["11032","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Cucurullo, S.","Sassolini, E."],"abstract":"","keywords":["Rassegna stampa","Estrazione di informazione"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151568","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131556,"last_updated":"2017-06-21 
16:04:11","id_people":157426,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Implementazione di procedure per la Named Entity Recognition","year":2007,"authors_people":"Picchi E., Sassolini E., Cucurullo S.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Cucurullo, Sebastiana","Picchi, Eugenio"],"authors_cnr_id":["11479","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Sassolini, E.","Cucurullo, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157426","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131557,"last_updated":"2017-06-21 16:04:15","id_people":157427,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Implementazione di procedure di Clustering","year":2007,"authors_people":"Picchi E., Sassolini E., Cucurullo S.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Cucurullo, Sebastiana","Picchi, Eugenio"],"authors_cnr_id":["11479","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Sassolini, E.","Cucurullo, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157427","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131558,"last_updated":"2017-06-21 16:04:19","id_people":157428,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Implementazione di procedure di Spidering per sistemi di Alerting","year":2007,"authors_people":"Picchi E., Sassolini E., Cucurullo S.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Cucurullo, Sebastiana","Picchi, Eugenio"],"authors_cnr_id":["11479","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Sassolini, 
E.","Cucurullo, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157428","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131566,"last_updated":"2017-06-21 16:04:27","id_people":157436,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"ALT-Web. Sito dell\u2019Atlante Lessicale Toscano (ALT) in rete","year":2007,"authors_people":"Picchi E., Montemagni S., Cucurullo S., Sassolini E., Paoli M.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Montemagni, Simonetta","Cucurullo, Sebastiana","Picchi, Eugenio"],"authors_cnr_id":["5595","11479","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Montemagni, S.","Cucurullo, S.","Sassolini, E.","Paoli, M."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157436","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131559,"last_updated":"2017-06-21 16:04:23","id_people":157429,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Legislazione Toscana raccolta e illustrata da Lorenzo Cantini","year":2007,"authors_people":"Picchi E., Sassolini E., Cucurullo S. 
(a cura di)","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Cucurullo, Sebastiana","Picchi, Eugenio"],"authors_cnr_id":["11479","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Sassolini, E.","Cucurullo, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157429","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131087,"last_updated":"2017-06-21 16:22:12","id_people":84625,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Next Generation Language Resources using Grid","year":2006,"authors_people":"Calzolari F., Sassolini E., Sassi M., Cucurullo S., Picchi E., Bertagna F., Enea A., Monachini M., Soria C., Calzolari N.","authors_cnr":["Bertagna, Francesca","Cucurullo, Sebastiana","Sassolini, Eva","Enea, Alessandro","Monachini, Monica","Soria, Claudia","Cucurullo, Sebastiana","Picchi, Eugenio","Sassi, Manuela","Zamorani, Nicoletta"],"authors_cnr_id":["8533","8945","9887","11479","16688","19592","26123"],"authors_cnr_institute":[""],"authors":["Calzolari, F.","Sassolini, E.","Sassi, M.","Cucurullo, S.","Picchi, E.","Bertagna, F.","Enea, A.","Monachini, M.","Soria, C.","Calzolari, N."],"abstract":"This paper presents a case study concerning the challenges and requirements posed by next generation language resources, realized as an overall model of open, distributed and collaborative language infrastructure. If a sort of \"new paradigm\" for language resource sharing is required, we think that the emerging and still evolving technology connected to Grid computing is a very interesting and suitable one for a concrete realization of this vision. 
Given the current limitations of Grid computing, it is very important to test the new environment on basic language analysis tools, in order to get the feeling of what are the potentialities and possible limitations connected to its use in NLP. For this reason, we have done some experiments on a module of the Linguistic Miner, i.e. the extraction of linguistic patterns from restricted domain corpora. The Grid environment has produced the expected results (reduction of the processing time, huge storage capacity, data redundancy) without any additional cost for the final user.","keywords":["grid","acquisition","topic classification"],"pages":"1858-1861","url":"https:\/\/publications.cnr.it\/doc\/84625","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"2-9517408-2-4","conference_name":"LREC 2006: 5th International Conference on Language Resources and Evaluation","conference_place":"Genova","conference_date":"24-26 Maggio 2006"},{"id":131091,"last_updated":"2012-05-31 18:50:31","id_people":84629,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Dialectal resources on-line: the ALT-Web experience","year":2006,"authors_people":"Cucurullo S., Montemagni S., Paoli M., Picchi E., Sassolini E.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":["048","048","048","048"],"authors":["Cucurullo, S.","Montemagni, S.","Paoli, M.","Picchi, E.","Sassolini, E."],"abstract":"The paper presents an on-line dialectal resource, ALT-Web, which gives access to the linguistic data of the Atlante Lessicale Toscano, a specially designed linguistic atlas in which lexical data have both a diatopic and diastratic characterisation. 
The paper focuses on: the dialectal data representation model; the access modalities to the ALT dialectal corpus; ontology-based search.","keywords":["Computational dialectology","Dialectal databases","Construction of lexical resources"],"pages":"1846-1851","url":"http:\/\/www.lrec-conf.org\/lrec2006\/","volume":"Proceedings","doi":"","editors_people":"","editors":[""],"published":"Dialectal resources on-line: the ALT-Web experience","publisher":"","issn":"","isbn":"2-9517408-2-4","conference_name":"LREC 2006: 5th International Conference on Language Resources and Evaluation","conference_place":"Genoa","conference_date":"24-25-26 Maggio 2006"},{"id":131121,"last_updated":"2012-05-07 15:39:56","id_people":84661,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Atlante Dialettale in rete: ALT-Web","year":2006,"authors_people":"Cucurullo S., Montemagni S., Paoli M., Picchi E., Sassolini E.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":["048","048","048","048"],"authors":["Cucurullo, S.","Montemagni, S.","Paoli, M.","Picchi, E.","Sassolini, E."],"abstract":"The paper presents an on-line dialectal resource, ALT-Web, which gives access to the linguistic data of the Lexical Atlas of Tuscany or Atlante Lessicale Toscano, a specially designed linguistic atlas in which lexical data have both a diatopic and diastratic characterisation. The paper illustrates ALT-Web with particular emphasis on: 1) the dialectal data representation model; 2) the access modalities to the ALT dialectal corpus designed to produce an output tailored to the specific needs of the different classes of users (both professionals and common citizens); 3) ontology-based search. 
These represent three main features which differentiate ALT-Web both from the previous digitalised ALT version and, most interestingly, from other on-line dialectal resources. At the time of writing, this is the first resource of this type in Italy, and one of the few at the international level.","keywords":["dialectal resources","information retrieval"],"pages":"661-672","url":"http:\/\/www.euralex.org\/publications\/","volume":"2","doi":"","editors_people":"E. Corino, C. Marello, C. Onesti","editors":["Corino, E.","Marello, C.","Onesti, C."],"published":"Proceedings in 12\u00b0 EURALEX International Congress, Congresso internazionale di lessicografia","publisher":"Edizioni dell'ORSO (Alessandria, ITA)","issn":"","isbn":"8876949186","conference_name":"12\u00b0 EURALEX International Congress","conference_place":"Torino","conference_date":"6-9 Settembre 2006"},{"id":131432,"last_updated":"2017-06-21 16:27:13","id_people":151557,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"ALTWEB","year":2006,"authors_people":"Picchi E., Montemagni S., Sassolini E., Cucurullo S., Paoli M.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Montemagni, Simonetta","Cucurullo, Sebastiana","Picchi, Eugenio"],"authors_cnr_id":["5595","11479","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Montemagni, S.","Sassolini, E.","Cucurullo, S.","Paoli, M."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151557","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131435,"last_updated":"2023-03-13 08:46:16","id_people":151561,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Linguistic Miner","year":2006,"authors_people":"Picchi E., Sassi M., Ceccotti M.L., Sassolini E., Cucurullo S.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Ceccotti, 
Maria Luigia","Cucurullo, Sebastiana","Picchi, Eugenio","Sassi, Manuela"],"authors_cnr_id":["3099","11479","16688","19592"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Sassi, M.","Ceccotti, M. L.","Sassolini, E.","Cucurullo, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151561","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131504,"last_updated":"2009-06-16 00:00:00","id_people":157373,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Atlante Lessicale Toscano in rete (ALT-Web). Relazione finale","year":2005,"authors_people":"Cucurullo S., Montemagni S., Paoli M., Picchi E., Sassolini E.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":[""],"authors":["Cucurullo, S.","Montemagni, S.","Paoli, M.","Picchi, E.","Sassolini, E."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157373","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131409,"last_updated":"2009-06-18 00:00:00","id_people":151532,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"ALTWEB","year":2005,"authors_people":"Picchi E., Montemagni S., Sassolini E., Cucurullo S., Paoli M.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Montemagni, S.","Sassolini, E.","Cucurullo, S.","Paoli, 
M."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151532","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131410,"last_updated":"2018-01-22 16:59:01","id_people":151533,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Linguistic Miner","year":2005,"authors_people":"Picchi E., Sassi M., Ceccotti M.L., Sassolini E., Cucurullo S.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Ceccotti, Maria Luigia","Cucurullo, Sebastiana","Picchi, Eugenio","Sassi, Manuela"],"authors_cnr_id":["3099","11479","16688","19592"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Sassi, M.","Ceccotti, M. L.","Sassolini, E.","Cucurullo, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151533","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131077,"last_updated":"2017-06-21 15:52:00","id_people":84615,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Linguistic Miner. An Italian Linguistic Knowledge System","year":2004,"authors_people":"Picchi E., Ceccotti M.L., Cucurullo S., Sassi M., Sassolini E.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Ceccotti, Maria Luigia","Cucurullo, Sebastiana","Picchi, Eugenio","Sassi, Manuela"],"authors_cnr_id":["3099","11479","16688","19592"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Ceccotti, M. 
L.","Cucurullo, S.","Sassi, M.","Sassolini, E."],"abstract":"Linguistic Miner is a project carried out at ILC whose objective is the development of an integrated system to build, organise and manage a corpus of Italian texts (of various origins and formats), and to design and constantly add new tools for the automatic extraction of tiered linguistic knowledge to be made available for many teaching, publishing, and other cultural purposes. The project is based on a notion that is preliminary to all the systems for corpus-based linguistic analysis: a language represented by the largest possible collection of heterogeneous texts is the best source of linguistic information at any level of analysis considered. The first goals of such a system are the semi-automated construction of an Italian data mine for the extraction of linguistic information, the validation of linguistic patterns, the installation of useful tools and resources for a range of different categories of Italian language users. The main feature of the project is its purpose of building large language reference corpora allowing for the creation and use of effective tools for the handling and processing, as well as the automatic linguistic synthesis, of such corpora.","keywords":["linguistic analysis","information extraction"],"pages":"1811-1814","url":"http:\/\/www.lrec-conf.org\/lrec2004\/","volume":"V","doi":"","editors_people":"","editors":[""],"published":"Proceedings of the 4th International Conference on Language Resources and Evaluation","publisher":"","issn":"","isbn":"2-9517408-1-6","conference_name":"LREC 2004: Fourth International Conference on Language Resources and Evaluation","conference_place":"Lisbona","conference_date":"26-27-28 Maggio 2004"},{"id":130952,"last_updated":"2014-11-27 13:57:27","id_people":64493,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Risorse monolingui e multilingui. 
Corpus bilingue italiano-arabo","year":2003,"authors_people":"Picchi E. , Sassolini E. , Nahli O. , Cucurullo S.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Nahli, Ouafae","Picchi, Eugenio"],"authors_cnr_id":["16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Sassolini, E.","Nahli, O.","Cucurullo, S."],"abstract":"Abstract - The objective of the project is twofold: on the one hand, the creation and elaboration of software procedures for the Arabic language and, on the other hand, the creation of linguistic resources for the management of large Arabic corpora. The linguistic resources are substantially the following: a) Morphological engine for the Arabic language. The engine is constituted by a number of modules: the algorithms and modules for generation and analysis, an appropriate encoding system for the representation of lexical data and of morphological characteristics of Arabic, the so-called \u201clemmario\u201d, i.e. the archive of lemmas; b) The automatic alignment of parallel texts in Italian and Arabic language; c) Automatic tagging of Arabic texts, performed by using the above morphological engine; d) Systems for accessing and querying (raw and\/or tagged) Arabic texts and parallel Italian-Arabic corpora.","keywords":["Morfologia araba","Corpora bilingui","Analisi testuale","Aligner","Tagger"],"pages":"629-678","url":"https:\/\/publications.cnr.it\/doc\/64493","volume":"18-19","doi":"","editors_people":"","editors":[""],"published":"Linguistica computazionale (Online)","publisher":"Istituti Editoriali e Poligrafici Internazionali (Ghezzano La Fontina, Italia)","issn":"1824-1573","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131968,"last_updated":"2015-08-04 12:31:47","id_people":288585,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Italian Arabic Linguistic Tools","year":2002,"authors_people":"Picchi, Eugenio; Sassolini, Eva; Nahli, 
Ouafae; Cucurullo Sebastiana; Vargas, Isabel Maria","authors_cnr":["Nahli, Ouafae","Sassolini, Eva","Cucurullo, Sebastiana","Picchi, Eugenio"],"authors_cnr_id":["11032","11479","16688"],"authors_cnr_institute":["048","048","048","048"],"authors":["Picchi, E.","Sassolini, E.","Nahli, O.","Cucurullo, S.","Vargas, I. M."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/288585","volume":"Volume II","doi":"","editors_people":"","editors":[""],"published":"Third International Conference on Language Resources and Evaluation","publisher":"","issn":"","isbn":"","conference_name":"LREC 2002","conference_place":"Las Palmas de Gran Canaria, Spain","conference_date":"30th & 31 May 2002"}]