[{"id":366730,"last_updated":"2024-01-10 11:01:36","id_people":490948,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Il lemmario del \u00abGDLI\u00bb: dati quantitativi e prime osservazioni","year":2023,"authors_people":"Marco Biffi, Elisa Guadagnini, Simonetta Montemagni ed Eva Sassolini","authors_cnr":["Montemagni, Simonetta","Sassolini, Eva","Guadagnini, Elisa"],"authors_cnr_id":["5595","11032","12720"],"authors_cnr_institute":[""],"authors":["Biffi, M.","Guadagnini, E.","Montemagni, S.","Sassolini, E."],"abstract":"Dopo la realizzazione della versione elettronica del solo testo del \"Grande dizionario della lingua italiana\" (GDLI), si \u00e8 avviato un progetto di graduale informatizzazione della sua struttura. Questo articolo ne presenta il primo risultato, vale a dire l'estrazione automatica del lemmario che \u00e8 cos\u00ec per la prima volta quantificabile e individuabile. Una prima parte del testo \u00e8 dedicata all'illustrazione della strutturazione dei contenuti del dizionario e la loro rappresentazione secondo standard internazionalmente riconosciuti (XML-TEI); la seconda presenta una prima elaborazione dei dati del lemmario estratto; la terza propone una prima analisi comparativa con i lemmari di altri dizionari della lingua italiana.","keywords":["Lessicografia","Lessicografia digitale","Lessicografia storica"],"pages":"331-351","url":"https:\/\/accademiadellacrusca.it\/it\/riviste\/articoli\/slei-xl-2023\/8679","volume":"40","doi":"","editors_people":"","editors":[""],"published":"Studi di lessicografia italiana","publisher":"Le Lettere (Firenze, Italia)","issn":"0392-5218","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":354899,"last_updated":"2023-04-19 15:24:29","id_people":477716,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Parole in rete \/ reti di parole. 
Possibili impieghi didattici dei grandi vocabolari storici digitalizzati","year":2022,"authors_people":"Marco Biffi, Francesca De Blasi, Manuel Favaro, Elisa Guadagnini, Simonetta Montemagni e Eva Sassolini","authors_cnr":["Favaro, Manuel","De Blasi, Francesca","Montemagni, Simonetta","Sassolini, Eva","Guadagnini, Elisa"],"authors_cnr_id":["5595","11032","12720"],"authors_cnr_institute":[""],"authors":["Biffi, M.","De Blasi, F.","Favaro, M.","Guadagnini, E.","Montemagni, S.","Sassolini, E."],"abstract":"After a brief presentation of the great historical dictionaries of Italian, which are free to use online thanks to the digitalisation work carried out by the Accademia della Crusca, the contribution offers a number of examples of how these tools can be used for educational purposes. Finally, further didactic uses are described, which will be made possible thanks to the advanced digital tools that the Accademia della Crusca and the Istituto di Linguistica Computazionale \"Antonio Zampolli\" del Consiglio Nazionale delle Ricerche (ILC) are currently working on.","keywords":["Lessicografia italiana","Didattica dell'italiano","Lessicografia digitale"],"pages":"143-188","url":"https:\/\/italianoascuola.unibo.it\/article\/view\/14866","volume":"4","doi":"10.6092\/issn.2704-8128\/14866","editors_people":"","editors":[""],"published":"Italiano a scuola","publisher":"ABIS-AlmaDL (Bologna, Italia)","issn":"2704-8128","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":343148,"last_updated":"2022-10-21 15:19:30","id_people":472294,"institutes":["ILC","IGSG"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Making Italian Parliamentary Records Machine-Actionable: the Construction of the ParlaMint-IT corpus","year":2022,"authors_people":"Tommaso Agnoloni, Roberto Bartolini, Francesca Frontini, Simonetta Montemagni, Carlo Marchetti, Valeria Quochi, Manuela Ruisi, Giulia Venturi","authors_cnr":["Montemagni, 
Simonetta","Bartolini, Roberto","Agnoloni, Tommaso","Quochi, Valeria","Frontini, Francesca","Venturi, Giulia"],"authors_cnr_id":["5595","10441","11403","11893","15911","17692"],"authors_cnr_institute":[""],"authors":["Agnoloni, T.","Bartolini, R.","Frontini, F.","Montemagni, S.","Marchetti, C.","Quochi, V.","Ruisi, M.","Venturi, G."],"abstract":"This paper describes the process of acquisition, cleaning, interpretation, coding and linguistic annotation of a collection of parliamentary debates from the Senate of the Italian Republic covering the COVID-19 pandemic emergency period and a former period for reference and comparison according to the CLARIN ParlaMint prescriptions. The corpus contains 1199 sessions and 79,373 speeches for a total of about 31 million words, and was encoded according to the ParlaCLARIN TEI XML format. It includes extensive metadata about the speakers, sessions, political parties and parliamentary groups. As required by the ParlaMint initiative, the corpus was also linguistically annotated for sentences, tokens, POS tags, lemmas and dependency syntax according to the universal dependencies guidelines. Named entity annotation and classification is also included. All linguistic annotation was performed automatically using state-of-the-art NLP technology with no manual revision. The Italian dataset is freely available as part of the larger ParlaMint 2.1 corpus deposited and archived in CLARIN repository together with all other national corpora. 
It is also available for direct analysis and inspection via various CLARIN services and has already been used both for research and educational purposes.","keywords":["parliamentary debates","CLARIN ParlaMint","corpus creation","corpus annotation"],"pages":"117-124","url":"https:\/\/aclanthology.org\/2022.parlaclarin-1.17\/","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"","conference_name":"Workshop ParlaCLARIN III within the 13th Language Resources and Evaluation Conference","conference_place":"Marseille, France","conference_date":"20\/06\/2022"},{"id":132456,"last_updated":"2022-02-17 18:43:13","id_people":455303,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"La digitalizzazione del GDLI: un approccio linguistico per la corretta acquisizione del testo?","year":2021,"authors_people":"Sassolini Eva, Biffi Marco, De Blasi Francesca, Guadagnini Elisa, Montemagni Simonetta","authors_cnr":["De Blasi, Francesca","Montemagni, Simonetta","Sassolini, Eva","Guadagnini, Elisa"],"authors_cnr_id":["5595","11032","12720"],"authors_cnr_institute":[""],"authors":["Sassolini, E.","Biffi, M.","De Blasi, F.","Guadagnini, E.","Montemagni, S."],"abstract":"In questo articolo sono discussi metodi e strategie in via di elaborazione per la correzione (propedeutica alla successiva strutturazione) dei contenuti del Grande dizionario della lingua italiana (GDLI) fondato da Salvatore Battaglia, estratti da un formato digitale non standard. La presenza, in questo formato, di errori distribuiti di vario tipo ha condizionato la scelta dell'approccio all'estrazione e messo in luce tutte le difficolt\u00e0 dell'operazione. 
Le sperimentazioni fatte sino a oggi portano a privilegiare una strategia di correzione multilivello, che procede scomponendo in sezioni distinte l'individuazione e la correzione degli errori, in modo da rendere gestibili interventi complessi di correzione semi-automatica, altrimenti improponibili, e consentire un loro raffinamento progressivo. Parallelamente alla definizione di regole di riconoscimento di struttura e formato, stiamo analizzando metodi e procedure in grado di migliorare la qualit\u00e0 dell'input e specializzare i moduli di estrazione per i singoli campi della voce a partire dal \"lemma\". Le finalit\u00e0 del lavoro sono duplici: l'estrazione e strutturazione dei contenuti e la produzione di un formato standard di rappresentazione dei dati. Si tratta di un percorso difficile perch\u00e9 il formato dei dati rende l'uso di strumenti reperibili in letteratura non applicabile. Solamente al termine del lavoro potremo capire se esistono le condizioni per trasformare l'approccio adottato in un protocollo di intervento replicabile.","keywords":["dizionari digitali","risorse linguistiche","estrazione dell'informazione","correzione del testo post OCR"],"pages":"159-166","url":"https:\/\/aiucd2021.labcd.unipi.it\/wp-content\/uploads\/2021\/05\/AIUCD2021_BOA-versione3A.pdf","volume":"","doi":"10.6092\/unibo\/amsacta\/6712","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"9788894253559","conference_name":"AIUCD 2021-DH per la societ\u00e0: e-guaglianza, partecipazione, diritti e valori nell'era digitale","conference_place":"Pisa","conference_date":"19-22\/01\/2021"},{"id":132489,"last_updated":"2022-05-05 11:44:08","id_people":463861,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Linguistically annotated multilingual comparable corpora of parliamentary debates ParlaMint.ana 2.1","year":2021,"authors_people":"Toma\u017e 
Erjavec, Maciej Ogrodniczuk, Petya Osenova, Nikola Ljube\u0161i\u0107, Kiril Simov, Vladislava Grigorova, Micha\u0142 Rudolf, Andrej Pan\u010dur, Maty\u00e1\u0161 Kopp, Starka\u00f0ur Barkarson, Stein\u00feor Steingr\u00edmsson, Henk van der Pol, Griet Depoorter, Jesse de Does, Bart Jongejan, Dorte Haltrup Hansen, Costanza Navarretta, Mar\u00eda Calzada P\u00e9rez, Luciana D. de Macedo, Ruben van Heusden, Maarten Marx, \u00c7a\u011fr\u0131 \u00c7\u00f6ltekin, Matthew Coole, Tommaso Agnoloni, Francesca Frontini, Simonetta Montemagni, Valeria Quochi, Giulia Venturi, Manuela Ruisi, Carlo Marchetti, Roberto Battistoni, Mikl\u00f3s Seb\u0151k, Orsolya Ring, Roberts Dar\u0123is, Andrius Utka, Mindaugas Petkevi\u010dius, Monika Briedien\u0117, Tomas Krilavi\u010dius, Vaidas Morkevi\u010dius, Roberto Bartolini, Andrea Cimino, Sascha Diwersy, Giancarlo Luxardo, Paul Rayson","authors_cnr":["Cimino, Andrea","Montemagni, Simonetta","Bartolini, Roberto","Agnoloni, Tommaso","Quochi, Valeria","Frontini, Francesca","Venturi, Giulia"],"authors_cnr_id":["5595","10441","11403","11893","15911","17692"],"authors_cnr_institute":[""],"authors":["Erjavec, T.","Ogrodniczuk, M.","Osenova, P.","Ljube\u0161i\u0107, N.","Simov, K.","Grigorova, V.","Rudolf, M.","Pan\u010dur, A.","Kopp, M.","Barkarson, S.","Steingr\u00edmsson, S.","Van Der Pol, H.","Depoorter, G.","De Does, J.","Jongejan, B.","Haltrup Hansen, D.","Navarretta, C.","Calzada P\u00e9rez, M.","De Macedo, L. D.","Van Heusden, R.","Marx, M.","\u00c7\u00f6ltekin, \u00c7.","Coole, M.","Agnoloni, T.","Frontini, F.","Montemagni, S.","Quochi, V.","Venturi, G.","Ruisi, M.","Marchetti, C.","Battistoni, R.","Seb\u0151k, M.","Ring, O.","Dar\u0123is, R.","Utka, A.","Petkevi\u010dius, M.","Briedien\u0117, M.","Krilavi\u010dius, T.","Morkevi\u010dius, V.","Diwersy, S.","Luxardo, G.","Rayson, P."],"abstract":"ParlaMint 2.1 is a multilingual set of 17 comparable corpora containing parliamentary debates mostly starting in 2015 and extending to mid-2020, with each corpus being about 20 million words in size. 
The sessions in the corpora are marked as belonging to the COVID-19 period (from November 1st 2019), or being \"reference\" (before that date). The corpora have extensive metadata, including aspects of the parliament; the speakers (name, gender, MP status, party affiliation, party coalition\/opposition); are structured into time-stamped terms, sessions and meetings; with speeches being marked by the speaker and their role (e.g. chair, regular speaker). The speeches also contain marked-up transcriber comments, such as gaps in the transcription, interruptions, applause, etc. Note that some corpora have further information, e.g. the year of birth of the speakers, links to their Wikipedia articles, their membership in various committees, etc. The corpora are encoded according to the Parla-CLARIN TEI recommendation (https:\/\/clarin-eric.github.io\/parla-clarin\/), but have been validated against the compatible, but much stricter ParlaMint schemas. This entry contains the linguistically marked-up version of the corpus, while the text version is available at http:\/\/hdl.handle.net\/11356\/1432. The ParlaMint.ana linguistic annotation includes tokenization, sentence segmentation, lemmatisation, Universal Dependencies part-of-speech, morphological features, and syntactic dependencies, and the 4-class CoNLL-2003 named entities. 
Some corpora also have further linguistic annotations, such as PoS tagging or named entities according to language-specific schemes, with their corpus TEI headers giving further details on the annotation vocabularies and tools.","keywords":["dibattiti parlamentari","covid-19","ParlaCLARIN","parlamenti","discorso politico","CLARIN","linguistic annotation","pos-tagging","ner","linguistic dependency annotation","UD"],"pages":"","url":"http:\/\/hdl.handle.net\/11356\/1432","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132490,"last_updated":"2022-05-05 11:44:28","id_people":463865,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Multilingual comparable corpora of parliamentary debates ParlaMint 2.1","year":2021,"authors_people":"Toma\u017e Erjavec, Maciej Ogrodniczuk, Petya Osenova, Nikola Ljube\u0161i\u0107, Kiril Simov, Vladislava Grigorova, Micha\u0142 Rudolf, Andrej Pan\u010dur, Maty\u00e1\u0161 Kopp, Starka\u00f0ur Barkarson, Stein\u00feor Steingr\u00edmsson, Henk van der Pol, Griet Depoorter, Jesse de Does, Bart Jongejan, Dorte Haltrup Hansen, Costanza Navarretta, Mar\u00eda Calzada P\u00e9rez, Luciana D. de Macedo, Ruben van Heusden, Maarten Marx, \u00c7a\u011fr\u0131 
\u00c7\u00f6ltekin, Matthew Coole, Tommaso Agnoloni, Francesca Frontini, Simonetta Montemagni, Valeria Quochi, Giulia Venturi, Manuela Ruisi, Carlo Marchetti, Roberto Battistoni, Mikl\u00f3s Seb\u0151k, Orsolya Ring, Roberts Dar\u0123is, Andrius Utka, Mindaugas Petkevi\u010dius, Monika Briedien\u0117, Tomas Krilavi\u010dius, Vaidas Morkevi\u010dius, Roberto Bartolini, Andrea Cimino, Sascha Diwersy, Giancarlo Luxardo, Paul Rayson","authors_cnr":["Montemagni, Simonetta","Agnoloni, Tommaso","Quochi, Valeria","Frontini, Francesca","Venturi, Giulia"],"authors_cnr_id":["5595","11403","11893","15911","17692"],"authors_cnr_institute":[""],"authors":["Erjavec, T.","Ogrodniczuk, M.","Osenova, P.","Ljube\u0161i\u0107, N.","Simov, K.","Grigorova, V.","Rudolf, M.","Pan\u010dur, A.","Kopp, M.","Barkarson, S.","Steingr\u00edmsson, S.","Van Der Pol, H.","Depoorter, G.","De Does, J.","Jongejan, B.","Haltrup Hansen, D.","Navarretta, C.","Calzada P\u00e9rez, M.","De Macedo, L. D.","Van Heusden, R.","Marx, M.","\u00c7\u00f6ltekin, \u00c7.","Coole, M.","Agnoloni, T.","Frontini, F.","Montemagni, S.","Quochi, V.","Venturi, G.","Ruisi, M.","Marchetti, C.","Battistoni, R.","Seb\u0151k, M.","Ring, O.","Dar\u0123is, R.","Utka, A.","Petkevi\u010dius, M.","Briedien\u0117, M.","Krilavi\u010dius, T.","Morkevi\u010dius, V.","Diwersy, S.","Luxardo, G.","Rayson, P."],"abstract":"ParlaMint 2.1 is a multilingual set of 17 comparable corpora containing parliamentary debates mostly starting in 2015 and extending to mid-2020, with each corpus being about 20 million words in size. The sessions in the corpora are marked as belonging to the COVID-19 period (after November 1st 2019), or being \"reference\" (before that date). The corpora have extensive metadata, including aspects of the parliament; the speakers (name, gender, MP status, party affiliation, party coalition\/opposition); are structured into time-stamped terms, sessions and meetings; with speeches being marked by the speaker and their role (e.g. 
chair, regular speaker). The speeches also contain marked-up transcriber comments, such as gaps in the transcription, interruptions, applause, etc. Note that some corpora have further information, e.g. the year of birth of the speakers, links to their Wikipedia articles, their membership in various committees, etc. The corpora are encoded according to the Parla-CLARIN TEI recommendation (https:\/\/clarin-eric.github.io\/parla-clarin\/), but have been validated against the compatible, but much stricter ParlaMint schemas. This entry contains the ParlaMint TEI-encoded corpora with the derived plain text version of the corpus along with TSV metadata on the speeches. Also included is the 2.0 release of the data and scripts available at the GitHub repository of the ParlaMint project. Note that there also exists the linguistically marked-up version of the corpus, which is available at http:\/\/hdl.handle.net\/11356\/1431.","keywords":["dibattiti parlamentari","covid-19","discorso politico","CLARIN","parlamenti","ParlaCLARIN"],"pages":"","url":"http:\/\/hdl.handle.net\/11356\/1431","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132486,"last_updated":"2023-11-06 19:31:48","id_people":463828,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Linguistically-driven Selection of Difficult-to-Parse Dependency Structures","year":2020,"authors_people":"Chiara Alzetta, Felice Dell'Orletta, Simonetta Montemagni, Giulia Venturi","authors_cnr":["Alzetta, Chiara","Montemagni, Simonetta","Dell'Orletta, Felice","Venturi, Giulia"],"authors_cnr_id":["5595","14329","17692"],"authors_cnr_institute":[""],"authors":["Alzetta, C.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"The paper illustrates a novel methodology meeting a twofold goal, namely quantifying the reliability of automatically generated 
dependency relations without using gold data on the one hand, and identifying which are the linguistic constructions negatively affecting the parser performance on the other hand. These represent objectives typically investigated in different lines of research, with different methods and techniques. Our methodology, at the crossroads of these perspectives, allows not only to quantify the parsing reliability of individual dependency types but also to identify and weight the contextual properties making relation instances more or less difficult to parse. The proposed methodology was tested in two different and complementary experiments, aimed at assessing the degree of parsing difficulty across (a) different dependency relation types, and (b) different instances of the same relation. The results show that the proposed methodology is able to identify difficult-to-parse dependency relations without relying on gold data and by taking into account a variety of intertwined linguistic factors. These findings pave the way to novel applications of the methodology, both in the direction of defining new evaluation metrics based purely on automatically parsed data and towards the automatic creation of challenge sets.","keywords":["Linguistic Complexity","Syntactic Parsing","Evaluation metrics"],"pages":"37-60","url":"https:\/\/journals.openedition.org\/ijcol\/719","volume":"6","doi":"10.4000\/ijcol.719","editors_people":"","editors":[""],"published":"Italian Journal of Computational Linguistics","publisher":"aAccademia University Press, Torino (Italia)","issn":"2499-4553","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132413,"last_updated":"2023-11-06 19:31:50","id_people":441971,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Metodi e Tecniche di Trattamento Automatico della Lingua per l'Estrazione di Conoscenza dalla Documentazione Scolastica","year":2020,"authors_people":"Venturi G., Dell'Orletta 
F., Montemagni S., Morini E. e Sagri M.T.","authors_cnr":["Montemagni, Simonetta","Dell'Orletta, Felice","Venturi, Giulia"],"authors_cnr_id":["5595","14329","17692"],"authors_cnr_institute":[""],"authors":["Venturi, G.","Dell'Orletta, F.","Montemagni, S.","Morini, E.","Sagri, M. T."],"abstract":"Il contributo riguarda la creazione di un sistema integrato di \"knowledge management\", per la gestione e condivisione della conoscenza prodotta e utilizzata dalla scuola.","keywords":["Estrazione di informazione","Documenti scolastici","Indicizzazione","Terminology extraction"],"pages":"49-68","url":"https:\/\/publications.cnr.it\/doc\/441971","volume":"2","doi":"10.3280\/CAD2020-002005","editors_people":"","editors":[""],"published":"Cadmo (Testo stamp.)","publisher":"Franco Angeli (Napoli, Italia)","issn":"1122-5165","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132411,"last_updated":"2023-11-06 19:32:01","id_people":441967,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Verba et Acta. Un esperimento per promuovere l'evoluzione delle competenze linguistiche degli studenti degli istituti professionali","year":2020,"authors_people":"Vertecchi, Benedetto; Agrusti, Francesco; Dell'Orletta, Felice; Montemagni, Simonetta; Venturi, Giulia","authors_cnr":["Montemagni, Simonetta","Dell'Orletta, Felice","Venturi, Giulia"],"authors_cnr_id":["5595","14329","17692"],"authors_cnr_institute":[""],"authors":["Vertecchi, B.","Agrusti, F.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"Ricerche in corso. Verba et Acta. 
Un esperimento per promuovere l'evoluzione delle competenze linguistiche degli studenti degli istituti professionali","keywords":["Evoluzione competenze linguistiche","Annotazione linguistica","Previsione dello sviluppo delle competenze di scrittura"],"pages":"109-117","url":"https:\/\/publications.cnr.it\/doc\/441967","volume":"","doi":"10.3280\/CAD2020-001008","editors_people":"","editors":[""],"published":"Cadmo (Testo stamp.)","publisher":"Franco Angeli (Napoli, Italia)","issn":"1122-5165","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132426,"last_updated":"2023-11-06 19:31:55","id_people":444113,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Quantitative linguistic investigations across universal dependencies treebanks","year":2020,"authors_people":"Alzetta C.; Dell'Orletta F.; Montemagni S.; Osenova P.; Simov K.; Venturi G.","authors_cnr":["Alzetta, Chiara","Montemagni, Simonetta","Dell'Orletta, Felice","Venturi, Giulia"],"authors_cnr_id":["5595","14329","17692"],"authors_cnr_institute":[""],"authors":["Alzetta, C.","Dell'Orletta, F.","Montemagni, S.","Osenova, P.","Simov, K.","Venturi, G."],"abstract":"The paper illustrates a case study aimed at identifying cross-lingual quantitative trends in the distribution of dependency relations in treebanks for typologically different languages. Preliminary results show interesting differences rooted either in language-specific peculiarities or cross-lingual annotation inconsistencies, with a potential impact on different application scenarios.","keywords":["Universal Dependencies Treebanks","Cross-linguistic analysis","Typology"],"pages":"1-7","url":"http:\/\/ceur-ws.org\/Vol-2769\/paper_59.pdf","volume":"2769","doi":"","editors_people":"","editors":[""],"published":"CEUR workshop proceedings","publisher":"M. 
Jeusfeld c\/o Redaktion Sun SITE, Informatik V, RWTH Aachen (Aachen, Germania)","issn":"1613-0073","isbn":"979-12-80136-28-2","conference_name":"7th Italian Conference on Computational Linguistics (CLiC-it)","conference_place":"Online","conference_date":"1-3\/03\/2021"},{"id":132427,"last_updated":"2023-11-06 19:31:38","id_people":444114,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"AcCompl-it @ EVALITA2020: Overview of the acceptability & complexity evaluation task for Italian","year":2020,"authors_people":"Brunato D.; Chesi C.; Dell'Orletta F.; Montemagni S.; Venturi G.; Zamparelli R.","authors_cnr":["Brunato, Dominique Pierina","Montemagni, Simonetta","Dell'Orletta, Felice","Venturi, Giulia"],"authors_cnr_id":["5595","14329","17692"],"authors_cnr_institute":[""],"authors":["Brunato, D.","Chesi, C.","Dell'Orletta, F.","Montemagni, S.","Venturi, G.","Zamparelli, R."],"abstract":"The Acceptability and Complexity evaluation task for Italian (AcCompl-it) was aimed at developing and evaluating methods to classify Italian sentences according to Acceptability and Complexity. It consists of two independent tasks asking participants to predict either the acceptability or the complexity rate (or both) of a given set of sentences previously scored by native speakers on a 1-to-7 points Likert scale. In this paper, we introduce the datasets distributed to the participants, we describe the different approaches of the participating systems and provide a first analysis of the obtained results.","keywords":["Shared Task","Linguistic Complexity","Acceptability"],"pages":"1-8","url":"http:\/\/ceur-ws.org\/Vol-2765\/paper163.pdf","volume":"2765","doi":"","editors_people":"","editors":[""],"published":"CEUR workshop proceedings","publisher":"M. 
Jeusfeld c\/o Redaktion Sun SITE, Informatik V, RWTH Aachen (Aachen, Germania)","issn":"1613-0073","isbn":"","conference_name":"EVALITA '20, Evaluation of NLP and Speech Tools for Italian","conference_place":"Online","conference_date":"17\/12\/2020"},{"id":132394,"last_updated":"2023-11-06 19:31:54","id_people":435966,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Profiling-UD: a Tool for Linguistic Profiling of Texts","year":2020,"authors_people":"Dominique Brunato, Andrea Cimino, Felice Dell'Orletta, Simonetta Montemagni, Giulia Venturi","authors_cnr":["Cimino, Andrea","Brunato, Dominique Pierina","Montemagni, Simonetta","Dell'Orletta, Felice","Venturi, Giulia"],"authors_cnr_id":["5595","14329","17692"],"authors_cnr_institute":[""],"authors":["Brunato, D.","Cimino, A.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"In this paper, we introduce Profiling-UD, a new text analysis tool inspired to the principles of linguistic profiling that can support language variation research from different perspectives. It allows the extraction of more than 130 features, spanning across different levels of linguistic description. Beyond the large number of features that can be monitored, a main novelty of Profiling-UD is that it has been specifically devised to be multilingual since it is based on the Universal Dependencies framework. 
In the second part of the paper, we demonstrate the effectiveness of these features in a number of theoretical and applicative studies in which they were successfully used for text and author profiling.","keywords":["Computational Language Variation Analysis","Linguistic Profiling","Universal Dependencies"],"pages":"7145-7151","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2020\/pdf\/2020.lrec-1.883.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"979-10-95546-34-4","conference_name":"Conference on Language Resources and Evaluation (LREC)","conference_place":"","conference_date":"11-16\/05\/2020"},{"id":132393,"last_updated":"2023-11-06 19:32:02","id_people":435958,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Voices of the Great War: A Richly Annotated Corpus of Italian Texts on the First World War","year":2020,"authors_people":"Alessandro Lenci, Simonetta Montemagni, Federico Boschetti, Irene De Felice, Stefano dei Rossi, Felice Dell'Orletta, Michele Di Giorgio, Martina Miliani, Lucia C. Passaro, Angelica Puddu, Giulia Venturi, Nicola Labanca","authors_cnr":["Montemagni, Simonetta","Dell'Orletta, Felice","Boschetti, Federico","Venturi, Giulia"],"authors_cnr_id":["5595","14329","14630","17692"],"authors_cnr_institute":[""],"authors":["Lenci, A.","Montemagni, S.","Boschetti, F.","De Felice, I.","Dei Rossi, S.","Dell'Orletta, F.","Di Giorgio, M.","Miliani, M.","Passaro, L. C.","Puddu, A.","Venturi, G.","Labanca, N."],"abstract":"Voci della Grande Guerra (\"Voices of the Great War\") is the first large corpus of Italian historical texts dating back to the period of First World War. This corpus differs from other existing resources in several respects. 
First, from the linguistic point of view it gives account of the wide range of varieties in which Italian was articulated in that period, namely from a diastratic (educated vs. uneducated writers), diaphasic (low\/informal vs. high\/formal registers) and diatopic (regional varieties, dialects) points of view. From the historical perspective, through a collection of texts belonging to different genres it represents different views on the war and the various styles of narrating war events and experiences. The final corpus is balanced along various dimensions, corresponding to the textual genre, the language variety used, the author type and the typology of conveyed contents. The corpus is annotated with lemmas, part-of-speech, terminology, and named entities. Significant corpus samples representative of the different \"voices\" have also been enriched with meta-linguistic and syntactic information. The layer of syntactic annotation forms the first nucleus of an Italian historical treebank complying with the Universal Dependencies standard. The paper illustrates the final resource, the methodology and tools used to build it, and the Web Interface for navigating it.","keywords":["Historical Corpora","Linguistic and Meta-linguistic Annotation","Information Extraction"],"pages":"911-918","url":"https:\/\/www.aclweb.org\/anthology\/2020.lrec-1.114.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"979-10-95546-34-4","conference_name":"Conference on Language Resources and Evaluation (LREC)","conference_place":"","conference_date":"11-16\/05\/2020"},{"id":132356,"last_updated":"2023-11-06 19:32:08","id_people":423880,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"INFERRING QUANTITATIVE TYPOLOGICAL TRENDS FROM MULTILINGUAL TREEBANKS. 
A CASE STUDY","year":2019,"authors_people":"Alzetta, Chiara; Dell'Orletta, Felice; Montemagni, Simonetta; Venturi, Giulia","authors_cnr":["Alzetta, Chiara","Montemagni, Simonetta","Dell'Orletta, Felice","Venturi, Giulia"],"authors_cnr_id":["5595","14329","17692"],"authors_cnr_institute":[""],"authors":["Alzetta, C.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"In the past decades, linguistic typology went through a renewing phase that involved a significant change in the research questions and methods of the discipline, which is now interested in fine-grained features underlying language diversity. In this paper, we propose a novel approach to address the newly defined needs of linguistic typology by extracting qualitative and quantitative information about a wide range of features from multilingual annotated corpora based on Natural Language Processing methods and techniques. We tested our method in a case study focusing on word order variation in two widely investigated constructions, VERB-SUBJ(ect) and NOUN-ADJ(ective), with a specific view to structural and functional factors underlying the preference for one or the other order, both intra- and cross-linguistically, and their interaction. Preliminary experiments have been carried out aimed at acquiring typological evidence from a selection of linguistically annotated treebanks for three different languages, namely Italian, Spanish and English. 
Our results show the effectiveness of the method in letting similarities and differences also emerge from typologically close languages.","keywords":["language typology","multilingual annotated corpora","linguistic knowledge extraction and modelling","word order variation"],"pages":"209-242","url":"https:\/\/www.rivisteweb.it\/doi\/10.1418\/95391","volume":"18","doi":"10.1418\/95391","editors_people":"","editors":[""],"published":"Lingue e linguaggio","publisher":"Il Mulino, Bologna (Italia)","issn":"1720-9331","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132354,"last_updated":"2023-11-06 19:32:10","id_people":423874,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Le parole del miglioramento. Come le scuole descrivono il cambiamento","year":2019,"authors_people":"Dell'Orletta F., Greco S., Montemagni S., Morini E., Rossi F., Sagri M.T., Venturi G.","authors_cnr":["Montemagni, Simonetta","Dell'Orletta, Felice","Venturi, Giulia"],"authors_cnr_id":["5595","14329","17692"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Greco, S.","Montemagni, S.","Morini, E.","Rossi, F.","Sagri, M. T.","Venturi, G."],"abstract":"Il presente contributo intende illustrare i risultati di una ricerca condotta con l'uso di strumenti di trattamento automatico del linguaggio (Natural Language Processing: nlp) su quanto dichiarato dalle scuole in circa 2500 Piani di Miglioramento (modello indire ) con l'obiettivo di comprendere le scelte strategiche in un'ottica di miglioramento continuo. 
Il disegno d'analisi permette di restituire sia una visione complessiva dei Piani di Miglioramento che approfondimenti qualitativi di confronto tra tipologie di scuola e aree geografiche e relativi a tematiche strategiche quali formazione e innovazione.","keywords":["Piano di Miglioramento","Natural Language Processing","Formazione","Innovazione"],"pages":"47-68","url":"https:\/\/www.rivistainfanzia.it\/pvw\/app\/default\/pvw_sito.php?sede_codice=1PWPSE01&page=2432193","volume":"1\/2019","doi":"","editors_people":"","editors":[""],"published":"Psicologia dell'educazione","publisher":"Edizioni Centro Studi Erickson (Gardolo (TN), Italia)","issn":"1971-3711","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132357,"last_updated":"2023-11-06 19:32:06","id_people":423881,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Dissecting Treebanks to Uncover Typological Trends. A Multilingual Comparative Approach","year":2019,"authors_people":"Alzetta C., Dell'Orletta F., Montemagni S., Venturi G.","authors_cnr":["Alzetta, Chiara","Montemagni, Simonetta","Dell'Orletta, Felice","Venturi, Giulia"],"authors_cnr_id":["5595","14329","17692"],"authors_cnr_institute":[""],"authors":["Alzetta, C.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"Over the last years, linguistic typology started attracting the interest of the community working on cross- and multi-lingual NLP as a way to tackle the bottleneck deriving from the lack of annotated data for many languages. Typological information is mostly acquired from publicly accessible typological databases, manually constructed by linguists. As reported in Ponti et al. (2018), despite the abundant information contained in them for many languages, these resources suffer from two main shortcomings, i.e. 
their limited coverage and the discrete nature of features (only \"the majority value rather than the full range of possible values and their corresponding frequencies\" is reported). Corpus-based studies can help to automatically acquire quantitative typological evidence which might be exploited for polyglot NLP. Recently, the availability of corpora annotated following a cross-linguistically consistent annotation scheme such as the one developed in the Universal Dependencies project is prompting new comparative linguistic studies aimed to identify similarities as well as idiosyncrasies among typologically different languages (Nivre, 2015). The line of research described here is aimed at acquiring quantitative typological evidence from UD treebanks through a multilingual contrastive approach.","keywords":["Natural Language Processing","Linguistic Typology"],"pages":"1-3","url":"https:\/\/typology-and-nlp.github.io\/2019\/assets\/2019\/papers\/5.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-1-950737-29-1","conference_name":"1st TyP-NLP: The Workshop on Typology for Polyglot NLP, ACL workshop","conference_place":"Firenze","conference_date":"01\/08\/2019"},{"id":132307,"last_updated":"2023-11-06 19:32:19","id_people":391617,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Assessing the Impact of Iterative Error Detection and Correction. 
A Case Study on the Italian Universal Dependency Treebank","year":2018,"authors_people":"Alzetta C., Dell'Orletta F., Montemagni S., Simi M., Venturi G.","authors_cnr":["Alzetta, Chiara","Montemagni, Simonetta","Dell'Orletta, Felice","Venturi, Giulia"],"authors_cnr_id":["5595","14329","17692"],"authors_cnr_institute":[""],"authors":["Alzetta, C.","Dell'Orletta, F.","Montemagni, S.","Simi, M.","Venturi, G."],"abstract":"Detection and correction of errors and inconsistencies in \"gold treebanks\" are becoming more and more central topics of corpus annotation. The paper illustrates a new incremental method for enhancing treebanks, with particular emphasis on the extension of error patterns across different textual genres and registers. Impact and role of corrections have been assessed in a dependency parsing experiment carried out with four different parsers, whose results are promising. For both evaluation datasets, the performance of parsers increases, in terms of the standard LAS and UAS measures and of a more focused measure taking into account only relations involved in error patterns, and at the level of individual dependencies.","keywords":["Error Detection","Universal Dependency Treebanks","Syntactic parsing"],"pages":"1-7","url":"http:\/\/universaldependencies.org\/udw18\/PDFs\/39_Paper.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-1-948087-84-1","conference_name":"Universal Dependencies Workshop 2018 (UDW 2018)","conference_place":"Brussels","conference_date":"01\/11\/2018"},{"id":132241,"last_updated":"2023-11-06 19:32:22","id_people":382333,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Dangerous Relations in Dependency Treebanks","year":2018,"authors_people":"Chiara Alzetta, Felice Dell'Orletta, Simonetta Montemagni, Giulia Venturi","authors_cnr":["Venturi, Giulia","Alzetta, Chiara","Montemagni, Simonetta","Dell'Orletta, 
Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Alzetta, C.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"The paper illustrates an effective and innovative method for detecting erroneously annotated arcs in gold dependency treebanks based on an algorithm originally developed to measure the reliability of automatically produced dependency relations. The method permits to significantly restrict the error search space and, more importantly, to reliably identify patterns of systematic recurrent errors which represent dangerous evidence to a parser which tendentially will replicate them. Achieved results demonstrate effectiveness and reliability of the method.","keywords":["Dependency treebanks","Error Detection","Linguistic Annotation"],"pages":"201-210","url":"http:\/\/aclweb.org\/anthology\/W\/W17\/W17-7624.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-80-88132-04-2","conference_name":"16th International Workshop on Treebanks and Linguistic Theories","conference_place":"Praga","conference_date":"23-24 gennaio 2018"},{"id":132252,"last_updated":"2023-11-06 19:32:36","id_people":385342,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Universal Dependencies and Quantitative Typological Trends. A Case Study on Word Order","year":2018,"authors_people":"Chiara Alzetta, Felice Dell'Orletta, Simonetta Montemagni, Giulia Venturi","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Alzetta, C.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"The paper presents a new methodology aimed at acquiring typological evidence from \"gold\" treebanks for different languages. 
In particular, it investigates whether and to what extent algorithms developed for assessing the plausibility of automatically produced syntactic annotations could contribute to shed light on key issues of the linguistic typological literature. It reports the first and promising results of a case study focusing on word order patterns carried out on three different languages (English, Italian and Spanish).","keywords":["Linguistic Knowledge Extraction","Dependency Treebanks","Linguistic Typology"],"pages":"4540-4549","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2018\/pdf\/1109.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"979-10-95546-00-9","conference_name":"Proceedings of the 11th Edition of the Language Resources and Evaluation Conference (LREC 2018)","conference_place":"Miyazaki (Japan)","conference_date":"7-12 maggio 2018"},{"id":132351,"last_updated":"2023-11-06 19:32:18","id_people":423871,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"A NLP-based analysis of reflective writings by Italian teachers","year":2018,"authors_people":"Chiriatti G.; Della Gala V.; Dell'Orletta F.; Montemagni S.; Pettenati M.C.; Sagri M.T.; Venturi G.","authors_cnr":["Montemagni, Simonetta","Dell'Orletta, Felice","Venturi, Giulia"],"authors_cnr_id":["5595","14329","17692"],"authors_cnr_institute":[""],"authors":["Chiriatti, G.","Della Gala, V.","Dell'Orletta, F.","Montemagni, S.","Pettenati, M. C.","Sagri, M. T.","Venturi, G."],"abstract":"This paper reports first results of a wider study devoted to exploit the potentialities of a NLP-based approach to the analysis of a corpus of reflective writings on teaching activities. 
We investigate how a wide set of linguistic features allows reconstructing the linguistic profile of the texts written by the Italian teachers and predicting whether they are reflective.","keywords":["Natural Language Processing","Reflective Writings","Linguistic Profiling","Document Classification"],"pages":"1-7","url":"http:\/\/www.scopus.com\/record\/display.url?eid=2-s2.0-85057733802&origin=inward","volume":"2253","doi":"","editors_people":"","editors":[""],"published":"CEUR workshop proceedings","publisher":"M. Jeusfeld c\/o Redaktion Sun SITE, Informatik V, RWTH Aachen (Aachen, Germania)","issn":"1613-0073","isbn":"","conference_name":"5th Italian Conference on Computational Linguistics (CLiC-it)","conference_place":"Torino","conference_date":"10-12\/12\/2018"},{"id":132352,"last_updated":"2023-11-06 19:32:27","id_people":423872,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Italian in the Trenches: Linguistic annotation and analysis of texts of the great war","year":2018,"authors_people":"De Felice I.; Dell'Orletta F.; Venturi G.; Lenci A.; Montemagni S.","authors_cnr":["Montemagni, Simonetta","Dell'Orletta, Felice","Venturi, Giulia"],"authors_cnr_id":["5595","14329","17692"],"authors_cnr_institute":[""],"authors":["De Felice, I.","Dell'Orletta, F.","Venturi, G.","Lenci, A.","Montemagni, S."],"abstract":"The paper illustrates the design and development of a textual corpus representative of the historical variants of Italian during the Great War, which was enriched with linguistic (lemmatization and pos-tagging) and meta-linguistic annotation. 
The corpus, after a manual revision of the linguistic annotation, was used for specializing existing NLP tools to process historical texts with promising results.","keywords":["Natural Language Processing","Automatic Linguistic Annotation"],"pages":"1-5","url":"http:\/\/www.scopus.com\/record\/display.url?eid=2-s2.0-85057734451&origin=inward","volume":"2253","doi":"","editors_people":"","editors":[""],"published":"CEUR workshop proceedings","publisher":"M. Jeusfeld c\/o Redaktion Sun SITE, Informatik V, RWTH Aachen (Aachen, Germania)","issn":"1613-0073","isbn":"","conference_name":"5th Italian Conference on Computational Linguistics (CLiC-it)","conference_place":"Torino","conference_date":"10-12\/12\/2018"},{"id":132236,"last_updated":"2023-11-06 19:32:43","id_people":382249,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"La qualit\u00e0 dei consensi informati. Un'analisi linguistico-computazionale della leggibilit\u00e0 dei testi","year":2017,"authors_people":"Venturi G., Dell'Orletta F., Montemagni S., Flore E., Bellandi T.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Venturi, G.","Dell'Orletta, F.","Montemagni, S.","Flore, E.","Bellandi, T."],"abstract":"La leggibilit\u00e0 dei testi delle informative di consenso per le procedure diagnostico-terapeutiche \u00e8 un requisito fondamentale, per offrire alle persone assistite l'accesso alle informazioni necessarie a una scelta consapevole delle opzioni disponibili per curare i diversi problemi di salute. 
La disponibilit\u00e0 di un testo leggibile \u00e8 inoltre un aiuto per i medici responsabili della comunicazione e della raccolta del consenso, che possono impiegarlo come un ausilio alle informazioni presentate in forma verbale durante il colloquio, in modo tale da poter condividere una base di conoscenze minime da condividere con il paziente e i suoi familiari. Seppure le evidenze siano limitate in merito alla relazione tra la qualit\u00e0 del consenso e l'attitudine al contenzioso da parte dei pazienti in caso di trattamenti che esitano in un danno attribuibile alle cure (Durand et al., 2015), si tratta di un ambito di ricerca di crescente interesse nella letteratura sulla sicurezza (Wu et al., 2005; Manta et al., 2017). Nella casistica regionale della Toscana sulle richieste di risarcimento, solo l'1% dei sinistri include problemi di consenso informato (dati Centro GRC), probabilmente anche a causa di una sottovalutazione del diritto all'informazione da parte dei cittadini che si sottopongono a interventi programmati, connessa con una limitata consapevolezza del potere di scegliere le proprie cure che ogni persona dovrebbe poter esercitare posta di fronte alle opzioni terapeutiche disponibili per i propri problemi di salute.","keywords":["Consenso informato","valutazione automatica della leggibilit\u00e0","Trattamento Automatico del Linguaggio"],"pages":"35-39","url":"http:\/\/www.formas.toscana.it\/rivistadellasalute\/fileadmin\/files\/fascicoli\/2017\/212\/SeT_fascicolo_212.pdf","volume":"212","doi":"","editors_people":"","editors":[""],"published":"Salute e territorio","publisher":"ETS (Pisa, Italia)","issn":"0392-4505","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132181,"last_updated":"2017-03-03 18:11:52","id_people":367892,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Exploring the role of extra-linguistic factors in defining dialectal variation patterns through cluster 
comparison","year":2017,"authors_people":"Simonetta Montemagni, Martijn Wieling","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S.","Wieling, M."],"abstract":"This paper contributes to two open issues in the dialectometric literature, i.e. i) whether and how patterns of linguistic variation are influenced by extra-linguistic features such as the geomorphology of the area, or cultural, administrative and political boundaries, and ii) whether and how the influence of extra-linguistic factors remains stable across linguistically-grounded partitions of data. To investigate these issues, a case study focusing on lexical variation has been carried out on a regional lexical atlas of Tuscan dialects. A variety of extra-linguistic features was taken into account, whose impact and role has been evaluated with respect to both the whole dialectal dataset and across different semantic fields.","keywords":["dialectometric literature","dialectology","linguistic variation","dialect","Tuscan","lexical atlas"],"pages":"241-251","url":"http:\/\/www.let.rug.nl\/festschriftnerbonne\/25.%20Montemagni%20&%20Wieling.pdf","volume":"Tributes 32","doi":"","editors_people":"Martijn Wieling, Martin Kroon, Gertjan van Noord and Gosse Bouma","editors":["Wieling, M.","Kroon, M.","Van Noord, G.","Bouma, G."],"published":"From Semantics to Dialectometry. 
Festschrift in honor of John Nerbonne","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132237,"last_updated":"2023-11-06 19:32:42","id_people":382252,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Identifying predictive features for textual genre classification: The key role of syntax","year":2017,"authors_people":"Cimino A.; Wieling M.; Dell'Orletta F.; Montemagni S.; Venturi G.","authors_cnr":["Venturi, Giulia","Cimino, Andrea","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Cimino, A.","Wieling, M.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"The paper investigates impact and role of different feature types for the specific task of Automatic Genre Classification with the final aim of identifying the most predictive ones. The goal was pursued by carrying out incremental feature selection through Grafting using different sets of linguistic features. Achieved results for discriminating among four traditional textual genres show the key role played by syntactic features, whose impact turned out to vary across genres.","keywords":["Textual Genre Classification","Feature Selection","Syntactic Features"],"pages":"1-6","url":"http:\/\/www.scopus.com\/record\/display.url?eid=2-s2.0-85037370866&origin=inward","volume":"2006","doi":"","editors_people":"","editors":[""],"published":"CEUR workshop proceedings","publisher":"M. 
Jeusfeld c\/o Redaktion Sun SITE, Informatik V, RWTH Aachen (Aachen, Germania)","issn":"1613-0073","isbn":"","conference_name":"Italian Conference on Computational Linguistics (CLiC-it)","conference_place":"Roma","conference_date":"11-12 dicembre 2017"},{"id":132251,"last_updated":"2023-11-06 19:32:57","id_people":385220,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Monitoraggio linguistico di Scritture Brevi: aspetti metodologici e primi risultati","year":2016,"authors_people":"D. BRUNATO, F. DELL'ORLETTA, S. MONTEMAGNI, G. VENTURI","authors_cnr":["Venturi, Giulia","Brunato, Dominique Pierina","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Brunato, D.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"Se da un lato le tecnologie del linguaggio svolgono un ruolo ormai indiscusso per l'accesso al contenuto testuale, ci\u00f2 non appare scontato quando si va a considerare il loro ruolo nella valutazione delle strutture linguistiche sottostanti al testo. Questo contributo si focalizza sulla definizione di una metodologia innovativa di monitoraggio linguistico della lingua italiana che a partire dall'output di strumenti di annotazione linguistica automatica permette di ricostruire un profilo linguistico di una collezione di testi rappresentativa di una specifica variet\u00e0 d'uso della lingua. 
Tale metodologia \u00e8 stata applicata a un corpus di tweet allo scopo di far luce su interrogativi aperti quali la possibilit\u00e0 di rintracciare tendenze lessicali, morfo-sintattiche e sintattiche peculiari all'interno di questa tipologia testuale; di studiare come queste tendenze si rapportino ai tratti caratterizzanti della lingua scritta e parlata; di individuare possibili differenze nella forma linguistica in cui si twittano contenuti di natura diversa.","keywords":["Trattamento Automatico del Linguaggio","Monitoraggio Linguistico","Variet\u00e0 d'Uso della Lingua","Lingua del Web"],"pages":"149-176","url":"https:\/\/publications.cnr.it\/doc\/385220","volume":"N. S. 5","doi":"","editors_people":"","editors":[""],"published":"Quaderni Aion","publisher":"Universit\u00e0 degli Studi di Napoli \"L'Orientale\" (Napoli, Italia)","issn":"1825-2796","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132178,"last_updated":"2017-03-03 18:18:12","id_people":367820,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Voci della Grande Guerra: An Annotated Corpus of Italian Texts on World War I","year":2016,"authors_people":"Alessandro Lenci, Nicola Labanca, Claudio Marazzini, Simonetta Montemagni","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Lenci, A.","Labanca, N.","Marazzini, C.","Montemagni, S."],"abstract":"Voci della Grande Guerra (Voices of the Great War) is a scientific and cultural initiative with the aim of preserving and promoting the memory of Italy in World War I through the creation of a corpus of digital texts selected by historians and linguists in order to be representative of the different ways to experience and describe the Italian war by its protagonists. 
With the help of advanced techniques of computational linguistics, semantic web and information visualization, the digitized historical materials will be explored with an online interface to enable easy but effective and innovative search modalities. The project will allow experts as well as non-experts to become acquainted with \"linguistic polyphony\" of Italy during World War I.","keywords":["Great War","World War","digital texts","corpus","Italian","Voci della Grande Guerra","Voices of the Great War"],"pages":"101-108","url":"http:\/\/www.ai-lc.it\/IJCoL\/v2n2\/6-lenci_et_al.pdf","volume":"2","doi":"","editors_people":"","editors":[""],"published":"Italian Journal of Computational Linguistics","publisher":"aAccademia University Press, Torino (Italia)","issn":"2499-4553","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132182,"last_updated":"2017-03-06 13:06:44","id_people":367809,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Tracking linguistic features underlying lexical variation patterns: A case study on Tuscan dialects","year":2016,"authors_people":"Simonetta Montemagni, Martijn Wieling","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S.","Wieling, M."],"abstract":"In this paper, we illustrate the application of hierarchical spectral partitioning of bipartite graphs in the study of lexical variation in Tuscany based on the data from a regional linguistic atlas. This method makes it possible not only to identify existing patterns of lexical variation in Tuscany, but also to uncover the underlying lexical features in terms of the most characteristic concept-lexicalization pairs. 
The results are promising, demonstrating the potential of the method for tracking the linguistic features underlying identified patterns of lexical variation and change across generations.","keywords":["tuscan","dialects","lexical variation","linguistic atlas"],"pages":"117-135","url":"http:\/\/langsci-press.org\/catalog\/view\/81\/146\/376-1","volume":"1","doi":"10.17169\/langsci.b81.146","editors_people":"Marie-H\u00e9l\u00e8ne C\u00f4t\u00e9, Remco Knooihuizen & John Nerbonne","editors":["C\u00f4t\u00e9, M.","Knooihuizen, R.","Nerbonne, J."],"published":"The future of dialects","publisher":"Language Science Press (Berlin, DEU)","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132180,"last_updated":"2017-03-06 14:38:01","id_people":367813,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Infrequent forms: Noise or not?","year":2016,"authors_people":"Martijn Wieling, Simonetta Montemagni.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Wieling, M.","Montemagni, S."],"abstract":"In this study we ask the question whether simplifying the data in dialectometrical studies by removing infrequent forms is advantageous to uncovering the geographical structure in dialect data. By investigating lexical variation in a large corpus of Tuscan dialect data via hierarchical bipartite spectral graph partitioning, we are able to identify the main geographical areas together with their linguistic basis. In order to assess the influence of infrequent forms, we conduct two analyses: one which includes only lexical variants used by at least 0.5% of the informants, and another which includes all lexical variants in the data. 
Using this approach we show that using all data enables us to find a geographical characterization with a more adequate linguistic basis than by using the trimmed data.","keywords":["dialectometrical studies","dialectology","dialect data","lexical variation","Tuscan"],"pages":"215-224","url":"http:\/\/langsci-press.org\/catalog\/view\/81\/78\/367-1","volume":"Language Variation 1","doi":"10.17169\/langsci.b81.78","editors_people":"Marie-H\u00e9l\u00e8ne C\u00f4t\u00e9, Remco Knooihuizen, John Nerbonne","editors":["C\u00f4t\u00e9, M.","Knooihuizen, R.","Nerbonne, J."],"published":"The Future of Dialects","publisher":"Language Science Press (Berlin, DEU)","issn":"","isbn":"978-3-946234-18-0","conference_name":"","conference_place":"","conference_date":""},{"id":132190,"last_updated":"2018-10-23 09:30:04","id_people":372004,"institutes":["ILC"],"type":"edited_volume","type_order":3,"type_people":"book","title":"Proceedings CLiC-it 2016 and EVALITA 2016","year":2016,"authors_people":"Simonetta Montemagni","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Montemagni, S."],"abstract":"Proceedings of Third Italian Conference on Computational Linguistics (CLiC-it 2016) & Fifth Evaluation Campaign of Natural Language Processing and Speech Tools for Italian. Final Workshop (EVALITA 2016)","keywords":["Computational Linguistics Natural Language Processing Speech Tools for Italian CLiC-it EVALITA"],"pages":"","url":"http:\/\/ceur-ws.org\/Vol-1749\/","volume":"1749","doi":"","editors_people":"","editors":[""],"published":"","publisher":"CEUR-WS. 
org (Aachen, DEU)","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132192,"last_updated":"2018-10-23 09:30:03","id_people":372022,"institutes":["ILC"],"type":"editorial","type_order":4,"type_people":"article","title":"Nota Editoriale","year":2016,"authors_people":"Roberto Basili, Simonetta Montemagni","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Basili, R.","Montemagni, S."],"abstract":"","keywords":["Computational Linguistics CLiC-it natural language processing"],"pages":"7-10","url":"http:\/\/www.ai-lc.it\/IJCoL\/v2n1\/00_nota_editoriale.pdf","volume":"2","doi":"","editors_people":"","editors":[""],"published":"Italian Journal of Computational Linguistics","publisher":"aAccademia University Press, Torino (Italia)","issn":"2499-4553","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132166,"last_updated":"2023-11-06 19:32:51","id_people":366749,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"CItA: an L1 Italian Learners Corpus to Study the Development of Writing Competence","year":2016,"authors_people":"Barbagli A., Lucisano P., Dell'Orletta F., Montemagni S., Venturi G.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Barbagli, A.","Lucisano, P.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"In this paper, we present the CItA corpus (Corpus Italiano di Apprendenti L1), a collection of essays written by Italian L1 learners collected during the first and second year of lower secondary school. 
The corpus was built in the framework of an interdisciplinary study jointly carried out by computational linguists and experimental pedagogists and aimed at tracking the development of written language competence over the years and students' background information.","keywords":["Italian Learner Corpus","Diachronic Evolution of Written Language Competence","Error Annotation"],"pages":"88-95","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2016\/pdf\/536_Paper.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"978-2-9517408-9-1","conference_name":"Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC 2016)","conference_place":"Portoroz (Slovenia)","conference_date":"23-28 maggio 2016"},{"id":132170,"last_updated":"2023-11-06 19:32:53","id_people":366757,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Esplorazioni computazionali nello spazio dell'interlingua: verso una nuova metodologia di indagine","year":2016,"authors_people":"Dell'Orletta F., Montemagni S. e Venturi G.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"Il presente contributo intende proporre un innovativo approccio all'identificazione delle caratteristiche linguistiche che aiutano a definire l'interlingua. 
Tale approccio consiste nella ricostruzione del profilo linguistico di corpora di produzioni scritte da apprendenti una lingua seconda basato su strumenti di trattamento automatico del linguaggio.","keywords":["interlingua","annotazione linguistica automatica","monitoraggio linguistico"],"pages":"143-161","url":"https:\/\/www.bulzoni.it\/it\/catalogo\/lingue-in-contatto-contact-linguistics.html","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"Bulzoni Editore (Roma, ITA)","issn":"","isbn":"978-88-6897-029-1","conference_name":"XLVIII Congresso Internazionale di Studi della Societ\u00e0 di Linguistica Italiana (SLI 2014)","conference_place":"Udine","conference_date":"25-27 settembre 2014"},{"id":132191,"last_updated":"2018-10-23 09:30:04","id_people":372010,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Preface","year":2016,"authors_people":"Simonetta Montemagni","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Montemagni, S."],"abstract":"Our very warm welcome to CLiC-it 2016 (http:\/\/clic-it2016.dieti.unina.it\/), the 3rd edition of the Italian Conference on Computational Linguistics, held on December 5th and 6th, in Naples, Italy, co-located with Evalita 2016 (http:\/\/www.evalita.it\/2016), hosted and locally organized by Universit\u00e0 Federico II, one of the oldest public and laic universities in the world. The organization of the conference is the result of a fruitful conjoint effort of different research groups (Istituto di Linguistica Computazionale \"Antonio Zampolli\" del CNR, Universit\u00e0 degli Studi di Bari Aldo Moro and Universit\u00e0 degli Studi di Napoli Federico II) showing the nationwide spreading of Computational Linguistics in Italy. 
The CLiC-it conference series is organized by the Italian Association for Computational Linguistics (AILC) and has clearly established itself as the premier national forum for research and development in the fields of Computational Linguistics (CL) and Natural Language Processing (NLP), where leading researchers and practitioners from academia and industry meet to share their challenges, solutions, research results, and experiences. CLiC-it covers all aspects of computational linguistics and natural language (both written and spoken) processing, and targets state-of-art theoretical results, experimental methodologies, technologies, as well as application perspectives, which may contribute to advance the field.","keywords":["Computational Linguistics Natural Language Processing Speech Tools for Italian CLiC-it EVALITA"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/372010","volume":"1749","doi":"","editors_people":"Simonetta Montemagni","editors":["Montemagni, S."],"published":"Proceedings CLiC-it 2016 and EVALITA 2016","publisher":"CEUR-WS. 
org (Aachen, DEU)","issn":"","isbn":"","conference_name":"CLiC-it & EVALITA 2016","conference_place":"Napoli","conference_date":"5-7\/12\/2016"},{"id":132168,"last_updated":"2023-11-06 19:32:52","id_people":366754,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Dieci sfumature di marcatezza sintattica: Verso una nozione computazionale di complessit\u00e0","year":2016,"authors_people":"Tusa E.; Dell'Orletta F.; Montemagni S.; Venturi G.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Tusa, E.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"In this work, we will investigate whether and to what extent algorithms typically used to assess the reliability of the output of syntactic parsers can be used to study the correlation between processing complexity and the linguistic notion of markedness. Although still preliminary, achieved results show the key role of features such as dependency direction and length in defining the markedness degrees of a given syntactic construction.","keywords":["marcatezza sintattica","complessit\u00e0 linguistica","annotazione linguistica automatica"],"pages":"1-6","url":"http:\/\/www.scopus.com\/record\/display.url?eid=2-s2.0-85009279517&origin=inward","volume":"1749","doi":"","editors_people":"","editors":[""],"published":"CEUR workshop proceedings","publisher":"M. 
Jeusfeld c\/o Redaktion Sun SITE, Informatik V, RWTH Aachen (Aachen, Germania)","issn":"1613-0073","isbn":"","conference_name":"Italian Conference on Computational Linguistics (CLiC-it)","conference_place":"Napoli","conference_date":"5-6 dicembre 2016"},{"id":132134,"last_updated":"2017-03-01 11:09:01","id_people":359168,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"ALT Explored: Integrating an Online Dialectometric Tool and an Online Dialect Atlas","year":2016,"authors_people":"Martijn Wieling, Eva Sassolini, Sebastiana Cucurullo and Simonetta Montemagni","authors_cnr":["Montemagni, Simonetta","Sassolini, Eva","Cucurullo, Sebastiana"],"authors_cnr_id":["5595","11032","11479"],"authors_cnr_institute":[""],"authors":["Wieling, M.","Sassolini, E.","Cucurullo, S.","Montemagni, S."],"abstract":"In this paper, we illustrate the integration of an online dialectometric tool, Gabmap, together with an online dialect atlas, the Atlante Lessicale Toscano (ALT-Web). By using a newly created url-based interface to Gabmap, ALT-Web is able to take advantage of the sophisticated dialect visualization and exploration options incorporated in Gabmap. For example, distribution maps showing the distribution in the Tuscan dialect area of a specific dialectal form (selected via the ALT-Web website) are easily obtainable. Furthermore, the complete ALT-Web dataset as well as subsets of the data (selected via the ALT-Web website) can be automatically uploaded and explored in Gabmap. 
By combining these two online applications, macro- and micro-analyses of dialectal data (respectively offered by Gabmap and ALT-Web) are effectively and dynamically combined.","keywords":["Lexicon","Lexical Database","Tools","Systems","Applications"],"pages":"3265-3272","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2016\/index.html","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-2-9517408-9-1","conference_name":"LREC 2016","conference_place":"Portoro\u017e, Slovenia","conference_date":"23\/10\/2016"},{"id":132200,"last_updated":"2023-11-06 19:33:14","id_people":366713,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"State of the Art Language Technologies for Italian: The EVALITA 2014 Perspective","year":2015,"authors_people":"Attardi, Giuseppe; Basile, Valerio; Bosco, Cristina; Caselli, Tommaso; Dell'Orletta, Felice; Montemagni, Simonetta; Patti, Viviana; Simi, Maria; Sprugnoli, Rachele","authors_cnr":["Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Attardi, G.","Basile, V.","Bosco, C.","Caselli, T.","Dell'Orletta, F.","Montemagni, S.","Patti, V.","Simi, M.","Sprugnoli, R."],"abstract":"Shared task evaluation campaigns represent a well established form of competitive evaluation, an important opportunity to propose and tackle new challenges for a specific research area and a way to foster the development of benchmarks, tools and resources. The advantages of this approach are evident in any experimental field, including the area of Natural Language Processing. An outlook on state-of-the-art language technologies for Italian can be obtained by reflecting on the results of the recently held workshop \"Evaluation of NLP and Speech Tools for Italian\", EVALITA 2014. 
The motivations underlying individual shared tasks, the level of knowledge and development achieved within each of them, the impact on applications, society and economy at large as well as directions for future research will be discussed from this perspective.","keywords":["Evaluation Campaign","Natural Language Processing","Dependency Parsing","Sentiment Analysis","Temporal Processing"],"pages":"43-61","url":"https:\/\/publications.cnr.it\/doc\/366713","volume":"9","doi":"10.3233\/IA-150076","editors_people":"","editors":[""],"published":"Intelligenza Artificiale","publisher":"Associazione Italiana per l'Intelligenza Artificiale (Bari, Italia)","issn":"1724-8035","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132127,"last_updated":"2023-11-06 19:33:10","id_people":357152,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Il ruolo delle tecnologie del linguaggio nel monitoraggio dell'evoluzione delle abilit\u00e0 di scrittura: primi risultati","year":2015,"authors_people":"Barbagli A., Lucisano P., Dell'Orletta F., Montemagni S., Venturi G.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Barbagli, A.","Lucisano, P.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"L'ultimo decennio ha visto l'affermarsi a livello internazionale dell'uso di tecnologie del linguaggio per lo studio dei processi di apprendimento. Questo contributo riporta i primi e promettenti risultati di uno studio interdisciplinare che si \u00e8 avvalso di metodi e tecniche di analisi propri della linguistica computazionale, della linguistica e della pedagogia sperimentale. 
Lo studio, finalizzato al monitoraggio dell'evoluzione del processo di apprendimento della lingua italiana, \u00e8 stato condotto a partire dalle produzione scritte di studenti della scuola secondaria di primo grado con strumenti di annotazione linguistica automatica e di estrazione di conoscenza e ha portato all'identificazione di un insieme di tratti qualificanti il processo di apprendimento linguistico.","keywords":["evoluzione delle competenze linguistiche","Didattica Sperimentale","Estrazione di conoscenza","Annotazione linguistica automatica"],"pages":"99-117","url":"https:\/\/journals.openedition.org\/ijcol\/326","volume":"","doi":"10.4000\/ijcol.326","editors_people":"","editors":[""],"published":"Italian Journal of Computational Linguistics","publisher":"aAccademia University Press, Torino (Italia)","issn":"2499-4553","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132062,"last_updated":"2015-05-02 18:08:13","id_people":330110,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Harmonizing and merging Italian treebanks: Towards a merged Italian dependency treebank and beyond","year":2015,"authors_people":"Simi M.; Montemagni S.; Bosco C.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Simi, M.","Montemagni, S.","Bosco, C."],"abstract":"In this paper we address the challenge of combining existing CoNLL-compliant dependency-annotated corpora with the final aim of constructing a bigger treebank for the Italian language. 
To this end, we defined amethodology formapping different annotation schemes, based on: (i)The analysis of similarities and differences of considered source and target dependency annotation schemes; (ii) The analysis of the performance of state of the art dependency parsers trained on the source and target treebanks; (iii) The mapping of the source annotation scheme(s) onto a set of target (possibly underspecified) data categories. This methodology was applied in two different case studies. The first one was aimed at constructing a \"Merged Italian Dependency Treebank\" (MIDT) starting from existing Italian dependency treebanks, namely TUT and ISST-TANL. The second case study, still ongoing, consists in the conversion of the MIDT resource into the Stanford Dependencies de facto standard with the final aim of developing an \"Italian Stanford Dependency Treebank\" (ISDT).","keywords":["Harmonization and merging of resources","Italian","Dependency Treebank"],"pages":"3-23","url":"http:\/\/www.scopus.com\/inward\/record.url?eid=2-s2.0-84927143016&partnerID=q2rCbXpz","volume":"589","doi":"10.1007\/978-3-319-14206-7_1","editors_people":"Basili, Roberto; Bosco, Cristina; Delmonte, Rodolfo; Moschitti, Alessandro; Simi, Maria","editors":["Basili, R.","Bosco, C.","Delmonte, R.","Moschitti, A.","Simi, M."],"published":"Harmonization and Development of Resources and Tools for Italian Natural Language Processing within the PARLI Project","publisher":"Springer International Publishing (CH-6330 Cham (ZG), CHE)","issn":"","isbn":"978-3-319-14205-0","conference_name":"","conference_place":"","conference_date":""},{"id":132126,"last_updated":"2023-11-06 19:33:05","id_people":357146,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"CItA: un Corpus di Produzioni Scritte di Apprendenti l'Italiano L1 Annotato con Errori","year":2015,"authors_people":"Alessia Barbagli, Pietro Lucisano, Felice Dell'Orletta, Simonetta Montemagni, 
Giulia Venturi","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Barbagli, A.","Lucisano, P.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"In questo articolo presentiamo CItA il primo corpus di produzioni scritte di apprendenti l'italiano L1 del primo e del secondo anno della scuola secondaria di primo grado annotato con errori grammaticali, ortografici e lessicali. Le specificit\u00e0 del corpus e la sua natura diacronica lo rendono particolarmente utile sia per applicazioni linguistico-computazionali sia per studi socio-pedagogici.","keywords":["Apprendiemento della lingua madre","evoluzione delle competenze linguistiche"],"pages":"31-35","url":"http:\/\/www.italianlp.it\/wp-content\/uploads\/2016\/03\/CItA_errori.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"Accademia University Press (Torino, ITA)","issn":"","isbn":"978-88-99200-62-6","conference_name":"2nd Italian Conference on Computational Linguistics (CLiC-it)","conference_place":"Trento","conference_date":"3-4 dicembre 2015"},{"id":132076,"last_updated":"2023-11-06 19:33:09","id_people":332693,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Design and Annotation of the First Italian Corpus for Text Simplification","year":2015,"authors_people":"Brunato D., Dell'Orletta F., Venturi G., Montemagni S.","authors_cnr":["Venturi, Giulia","Brunato, Dominique Pierina","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048","048"],"authors":["Brunato, D.","Dell'Orletta, F.","Venturi, G.","Montemagni, S."],"abstract":"In this paper, we present design and construction of the first Italian corpus for automatic and semi--automatic text simplification. 
In line with current approaches, we propose a new annotation scheme specifically conceived to identify the typology of changes an original sentence undergoes when it is manually simplified. Such a scheme has been applied to two aligned Italian corpora, containing original texts with corresponding simplified versions, selected as representative of two different manual simplification strategies and addressing different target reader populations. Each corpus was annotated with the operations foreseen in the annotation scheme, covering different levels of linguistic description. Annotation results were analysed with the final aim of capturing peculiarities and differences of the different simplification strategies pursued in the two corpora.","keywords":["Annotation Scheme","Automatic Text Simplification"],"pages":"31-34","url":"https:\/\/aclweb.org\/anthology\/W\/W15\/W15-1604.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-1-941643-47-1","conference_name":"Proceedings of LAW IX-The 9th Linguistic Annotation Workshop","conference_place":"Denver, Colorado","conference_date":"5 giugno 2015"},{"id":132089,"last_updated":"2023-11-06 19:33:12","id_people":340387,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"NLP-Based Readability Assessment of Health-Related Texts: a Case Study on Italian Informed Consent Forms","year":2015,"authors_people":"Giulia Venturi, Tommaso Bellandi, Felice Dell'Orletta, Simonetta Montemagni","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Venturi, G.","Bellandi, T.","Dell'Orletta, F.","Montemagni, S."],"abstract":"The paper illustrates the results of a case study aimed at investigating and enhancing the accessibility of Italian health-related documents by relying on advanced NLP techniques, with 
particular attention to informed consent forms. Results achieved show that the features automatically extracted from the linguistically annotated text and ranging across different levels of linguistic description have a high discriminative power in order to guarantee a reliable readability assessment.","keywords":["Readability assessment","health-related information"],"pages":"131-141","url":"http:\/\/www.aclweb.org\/anthology\/W15-2618","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-1-941643-32-7","conference_name":"Sixth International Workshop on Health Text Mining and Information Analysis (Louhi)","conference_place":"Lisbona","conference_date":"17 settembre 2015"},{"id":132179,"last_updated":"2017-03-03 18:19:34","id_people":367807,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"The contribution of dialectometry to the study of the dialects of Italy. A case study on Tuscan","year":2015,"authors_people":"Simonetta Montemagni, Martijn Wieling, John Nerbonne","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S.","Wieling, M.","Nerbonne, J."],"abstract":"We will illustrate the extent to which the recent advances of dialectometry can help to gain insight into the nature of linguistic variation - both synchronically and diachronically - in the study of the dialects of Tuscany, which have a special status in the complex puzzle of Italian dialects. 
This will be done by discussing the results achieved in a case study carried out over the last five years based on the corpus of dialectal data of the Atlante Lessicale Toscano ('Lexical Atlas of Tuscany', henceforth ALT, Giacomelli et al., 2000), a regional linguistic atlas focusing on dialec tal variation throughout Tuscany, a region where both Tuscan and non-Tuscan dialects are spoken.","keywords":["dialectometry","lexical atlas","italian dialects","Tuscany","Atlante Lessicale Toscano"],"pages":"","url":"http:\/\/media.leidenuniv.nl\/legacy\/montemagni-wieling-nerbonne.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Italian Dialect Meeting 2015 & CIDSM X","conference_place":"Leiden University-Centre for Linguistics","conference_date":"23 June 2015"},{"id":132090,"last_updated":"2015-12-17 17:39:07","id_people":340388,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Language technologies for automatic readability assessment of health-related Information: a preliminary investigation into the informed consent forms used in a regional health service","year":2015,"authors_people":"Giulia Venturi, Sabrina Rinnone, Simonetta Montemagni, Manuela Sassi, Giuseppina Terranova, Elisabetta Flore, Tommaso Bellandi","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Sassi, Manuela"],"authors_cnr_id":["5595","19592"],"authors_cnr_institute":["048","048","048"],"authors":["Venturi, G.","Rinnone, S.","Montemagni, S.","Sassi, M.","Terranova, G.","Flore, E.","Bellandi, T."],"abstract":"Rationale: Within an information society, where everyone should be able to access all available information, improving access to written language is becoming more and more a central issue. 
This is the case for health-related information which should be accessible to all members of the society, including people who have reading difficulties as a result of a low education level or of language-based learning disabilities or because the language of the text is not their native language. Moreover, the breakdown of doctor-patient communication is one of the most frequent cause of adverse events. Research questions: We conducted a preliminary investigation to assess the readability of a corpus of informed consent forms used before a clinical procedure in the hospitals of a Regional Healthcare Service. Secondary goals include the comparison of readability across specialties and healthcare trusts. Methods: Providing complex scientific information in a way that is comprehensible to a lay person is a challenge that nowadays can be addressed by resorting to advanced Natural Language Processing (NLP) techniques, which make it possible to monitor the linguistic complexity of texts at the syntactic and lexical levels and to support their simplification, whenever needed. The study has been carried out by combining NLP-enabled feature extraction and state-of-the-art machine learning algorithms. To this end we used READ-IT, the first NLP-based readability assessment tool for Italian. Results: We analysed 584 documents, covering 29 specialties, for a total of 607.790 word tokens, currently used at the 36 public hospitals in Tuscany. Although the readability level of all documents in the corpus is low, both at the lexical and syntactic level, significant differences can be observed between specialties and healthcare trust releasing the forms. 
With the readability level ranging between 0 (easy-to-read) and 100 (difficult-to-read), it resulted that the pediatric informed consent documents are the most easy-to-read forms (with an average score of 75) while the most difficult-to read documents are documents of the surgical area (whose average score is 80) (standard deviation 2). Discussion: The state of the art resulting from this preliminary study shows that NLP-based readability assessment tools can help to measure the linguistic complexity of informed consent forms and guide the editor to identify linguistically complex passages that need to be simplified, either syntactically or lexically. The use of an assessment tool designed for the general language is the main limitation of the study and should be addressed through the customization of the tool to assess the readability of the healthcare jargon. A further step of the research consider also the design of a guidance to prepare readable informed consent forms.","keywords":["Readability assessment","health-related information"],"pages":"","url":"http:\/\/static1.squarespace.com\/static\/561c0d01e4b0b5ad2e65cc48\/t\/561d44dfe4b089431662d174\/1444758751213\/LibrettoProgramma.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"ISCOME 2015 Conference: \"The Golden Bridge: Communication and Patient Safety\"","conference_place":"Montecatini Terme","conference_date":"15-16 giugno 2015"},{"id":131881,"last_updated":"2023-11-06 19:33:16","id_people":285640,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Assessing document and sentence readability in less resourced languages and across textual genres","year":2014,"authors_people":"Felice Dell'Orletta, Simonetta Montemagni, Giulia Venturi","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, 
Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"In this paper, we tackle three underresearched issues of the automatic readability assessment literature, namely the evaluation of text readability in less resourced languages, with respect to sentences (as opposed to documents) as well as across textual genres. Different solutions to these issues have been tested by using and refining READ-IT, the first advanced readability assessment tool for Italian, which combines traditional raw text features with lexical, morpho-syntactic and syntactic information. In READ-IT readability assessment is carried out with respect to both documents and sentences, with the latter constituting an important novelty of the proposed approach: READ-IT shows a high accuracy in the document classification task and promising results in the sentence classification scenario. By comparing the results of two versions of READ-IT, adopting a classification- versus ranking-based approach, we also show that readability assessment is strongly influenced by textual genre; for this reason a genre-oriented notion of readability is needed. With classification-based approaches, reliable results can only be achieved with genre-specific models: Since this is far from being a workable solution, especially for less resourced languages, a new ranking method for readability assessment is proposed, based on the notion of distance.","keywords":["readability assessment","less resourced languages","multi-level linguistic annotation","textual genres"],"pages":"163-193","url":"http:\/\/www.ingentaconnect.com\/content\/jbp\/itl\/2014\/00000165\/00000002\/art00005","volume":"165","doi":"10.1075\/itl.165.2.03del","editors_people":"","editors":[""],"published":"ITL. 
Internationaler technischer Literaturanzeiger (Online)","publisher":"Peeters Publishers (Leuven, Belgio)","issn":"1783-1490","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131877,"last_updated":"2015-02-17 23:21:15","id_people":285543,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Lexical differences between Tuscan dialects and standard Italian: Accounting for geographic and socio-demographic variation using generalized additive mixed modeling","year":2014,"authors_people":"Wieling, Martijn; Montemagni, Simonetta; Nerbonne, John; Baayen, R. Harald","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Wieling, M.","Montemagni, S.","Nerbonne, J.","Baayen, R. H."],"abstract":"This study uses a generalized additive mixed-effects regression model to predict lexical differences in Tuscan dialects with respect to standard Italian. We used lexical information for 170 concepts used by 2,060 speakers in 213 locations in Tuscany. In our model, geographical position was found to be an important predictor, with locations more distant from Florence having lexical forms more likely to differ from standard Italian. In addition, the geographical pattern varied significantly for low- versus high-frequency concepts and older versus younger speakers. Younger speakers generally used variants more likely to match the standard language. Several other factors emerged as significant. Male speakers as well as farmers were more likely to use lexical forms different from standard Italian. In contrast, higher-educated speakers used lexical forms more likely to match the standard. The model also indicates that lexical variants used in smaller communities are more likely to differ from standard Italian. The impact of community size, however, varied from concept to concept. 
For a majority of concepts, lexical variants used in smaller communities are more likely to differ from the standard Italian form. For a minority of concepts, however, lexical variants used in larger communities are more likely to differ from standard Italian. Similarly, the effect of the other community- and speaker-related predictors varied per concept. These results clearly show that the model succeeds in teasing apart different forces influencing the dialect landscape and helps us to shed light on the complex interaction between the standard Italian language and the Tuscan dialectal varieties. In addition, this study illustrates the potential of generalized additive mixed-effects regression modeling applied to dialect data.*","keywords":["Tuscan dialects","lexical variation","generalized additive modeling","mixed-effects regression modeling","geographical variation"],"pages":"669-692","url":"http:\/\/www.linguisticsociety.org\/files\/wieling.pdf","volume":"90","doi":"","editors_people":"","editors":[""],"published":"Language (Baltimore)","publisher":"Linguistic Society of America [etc. ] (Washington, DC [etc. 
], Stati Uniti d'America)","issn":"0097-8507","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132064,"last_updated":"2023-11-06 19:33:25","id_people":330112,"institutes":["ILC"],"type":"edited_volume","type_order":3,"type_people":"book","title":"Proceedings of the Fourth International Workshop EVALITA 2014","year":2014,"authors_people":"Cristina Bosco, Piero Cosi, Felice Dell'Orletta, Mauro Falcone, Simonetta Montemagni, Maria Simi","authors_cnr":["Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048"],"authors":["Bosco, C.","Cosi, P.","Dell'Orletta, F.","Falcone, M.","Montemagni, S.","Simi, M."],"abstract":"","keywords":["Trattamento Automatico del Linguaggio","Speech Processing","Lingua Italiana"],"pages":"167","url":"http:\/\/clic.humnet.unipi.it\/proceedings\/Proceedings-EVALITA-2014.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"Pisa University Press (Pisa, ITA)","issn":"","isbn":"978-88-67414-72-7","conference_name":"","conference_place":"","conference_date":""},{"id":123736,"last_updated":"2015-02-17 13:54:19","id_people":310637,"institutes":["ILC","ITTIG","IGSG"],"type":"edited_volume","type_order":3,"type_people":"book","title":"Proceedings of the Fourth Workshop on Semantic Processing of Legal Texts","year":2014,"authors_people":"Francesconi E., Montemagni S., Peters W., Venturi G., Wyner A.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Francesconi, Enrico"],"authors_cnr_id":["5595","10498"],"authors_cnr_institute":["048","048","104"],"authors":["Francesconi, E.","Montemagni, S.","Peters, W.","Venturi, G.","Wyner, A."],"abstract":"","keywords":[""],"pages":"33","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2014\/workshops\/LREC2014Workshop-SPLeT%20Proceedings.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"PARIGI: ELRA (Parigi, 
FRA)","issn":"","isbn":"978-2-9517408-8-4","conference_name":"","conference_place":"","conference_date":""},{"id":131990,"last_updated":"2023-11-06 19:33:27","id_people":294078,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Tecnologie del linguaggio e monitoraggio dell'evoluzione delle abilit\u00e0 di scrittura nella scuola secondaria di primo grado","year":2014,"authors_people":"Barbagli A., Lucisano P., Dell'Orletta F., Montemagni S., Venturi G.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Barbagli, A.","Lucisano, P.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"L'ultimo decennio ha visto l'affermarsi a livello internazionale dell'uso di tecnologie del linguaggio per lo studio dei processi di apprendimento. Questo contributo, che si colloca all'interno di una ricerca pi\u00f9 ampia di pedagogia sperimentale, riporta i primi e promettenti risultati di uno studio finalizzato al monitoraggio dell'evoluzione del processo di apprendimento della lingua italiana condotto a partire dalle produzione scritte degli studenti con strumenti di annotazione linguistica automatica e di estrazione di conoscenza.","keywords":[""],"pages":"23-27","url":"http:\/\/www.italianlp.it\/wp-content\/uploads\/2014\/12\/Tecnologie-del-linguaggio-per-la-scuola.pdf","volume":"","doi":"10.12871\/CLICIT201415","editors_people":"Roberto Basili, Alessandro Lenci, Bernardo Magnini","editors":["Basili, R.","Lenci, A.","Magnini, B."],"published":"Proceedings of the First Italian Conference on Computational Linguistics (CLiC-it 2014)","publisher":"Pisa University Press srl (Pisa, ITA)","issn":"","isbn":"978-8-86741-472-7","conference_name":"First Italian Conference on Computational Linguistics (CLiC-it 2014)","conference_place":"Pisa","conference_date":"9-11 dicembre 
2014"},{"id":131935,"last_updated":"2023-11-06 19:33:19","id_people":288050,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Computational Analysis of Historical Documents: An Application to Italian War Bulletins in World War I and II","year":2014,"authors_people":"Boschetti F., Cimino A., Dell'Orletta F., Lebani G.E., Passaro L., Picchi P., Venturi G., Montemagni S. Lenci A.","authors_cnr":["Dell'Orletta, Felice","Venturi, Giulia","Cimino, Andrea","Montemagni, Simonetta","Picchi, Paolo","Boschetti, Federico"],"authors_cnr_id":["5595","12761","14630"],"authors_cnr_institute":[""],"authors":["Boschetti, F.","Cimino, A.","Dell'Orletta, F.","Lebani, G. E.","Passaro, L.","Picchi, P.","Venturi, G.","Montemagni, S.","Lenci, A."],"abstract":"World War (WW) I and II represent crucial landmarks in the history on mankind: They have affected the destiny of whole generations and their consequences are still alive throughout Europe. In this paper we present an ongoing project to carry out a computational analysis of Italian war bulletins in WWI and WWII, by applying state-of-the-art tools for NLP and Information Extraction. 
The annotated texts and extracted information will be explored with a dedicated Web interface, allowing for multidimensional access and exploration of historical events through space and time.","keywords":["World War I"],"pages":"70-75","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2014\/workshops\/LREC2014Workshop-LRT4HDA%20Proceedings.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of workshop on Language resources and technologies for processing and linking historical documents and archives-Deploying Linked Open Data in Cultural Heritage-LREC 2014, 26 May, Reykjavik, Iceland","publisher":"European language resources association (ELRA) (Paris, FRA)","issn":"","isbn":"","conference_name":"LREC 2014","conference_place":"Reykjavik","conference_date":"26 May"},{"id":131989,"last_updated":"2023-11-06 19:33:21","id_people":294073,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Defining an annotation scheme with a view to automatic text simplification","year":2014,"authors_people":"Brunato D., Dell'Orletta F., Venturi G., Montemagni S.","authors_cnr":["Venturi, Giulia","Brunato, Dominique Pierina","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048","048"],"authors":["Brunato, D.","Dell'Orletta, F.","Venturi, G.","Montemagni, S."],"abstract":"This paper presents the preliminary steps of ongoing research in the field of automatic text simplification. In line with current approaches, we propose here a new annotation scheme specifically conceived to identify the typologies of changes an original sentence undergoes when it is manually simplified. 
Such a scheme has been tested on a parallel corpus available for Italian, which we have first aligned at sentence level and then annotated with simplification rules.","keywords":[""],"pages":"87-92","url":"http:\/\/www.italianlp.it\/wp-content\/uploads\/2014\/12\/Text-simplification.pdf","volume":"","doi":"10.12871\/CLICIT2014118","editors_people":"Roberto Basili, Alessandro Lenci, Bernardo Magnini","editors":["Basili, R.","Lenci, A.","Magnini, B."],"published":"Proceedings of the First Italian Conference on Computational Linguistics (CLiC-it 2014)","publisher":"Pisa University Press srl (Pisa, ITA)","issn":"","isbn":"978-8-86741-472-7","conference_name":"First Italian Conference on Computational Linguistics (CLiC-it 2014)","conference_place":"Pisa","conference_date":"9-11 dicembre 2014"},{"id":131883,"last_updated":"2023-11-06 19:33:26","id_people":285670,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"T2K: a System for Automatically Extracting and Organizing Knowledge from Texts","year":2014,"authors_people":"Felice Dell'Orletta, Giulia Venturi, Andrea Cimino, Simonetta Montemagni","authors_cnr":["Venturi, Giulia","Cimino, Andrea","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048","048"],"authors":["Dell'Orletta, F.","Venturi, G.","Cimino, A.","Montemagni, S."],"abstract":"In this paper, we present T2K, a suite of tools for automatically extracting domain-specific knowledge from collections of Italian and English texts. T2K (Text-To-Knowledge v2) relies on a battery of tools for Natural Language Processing (NLP), statistical text analysis and machine learning which are dynamically integrated to provide an accurate and incremental representation of the content of vast repositories of unstructured documents. 
Extracted knowledge ranges from domain-specific entities and named entities to the relations connecting them and can be used for indexing document collections with respect to different information types. T2K also includes \"linguistic profiling\" functionalities aimed at supporting the user in constructing the acquisition corpus, e.g. in selecting texts belonging to the same genre or characterized by the same degree of specialization or in monitoring the \"added value\" of newly inserted documents. T2K is a web application which can be accessed from any browser through a personal account which has been tested in a wide range of domains.","keywords":["Natural Language Processing","Information Extraction","Knowledge Management"],"pages":"2062-2070","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2014\/pdf\/590_Paper.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-2-9517408-8-4","conference_name":"International Conference on Language Resources and Evaluation (LREC)","conference_place":"Reykjavik","conference_date":"26-31 maggio 2014"},{"id":131991,"last_updated":"2023-11-06 19:33:17","id_people":294084,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Assessing the readability of sentences: which corpora and features?","year":2014,"authors_people":"Dell'Orletta F., Wieling M., Cimino A., Venturi G., Montemagni S.","authors_cnr":["Venturi, Giulia","Cimino, Andrea","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048","048"],"authors":["Dell'Orletta, F.","Wieling, M.","Cimino, A.","Venturi, G.","Montemagni, S."],"abstract":"The paper investigates the problem of sentence readability assessment, which is modelled as a classification task, with a specific view to text simplification. In particular, it addresses two open issues connected with it, i.e. 
the corpora to be used for training, and the identification of the most effective features to determine sentence readability. An existing readability assessment tool developed for Italian was specialized at the level of training corpus and learning algorithm. A maximum entropy-based feature selection and ranking algorithm (grafting) was used to identify to the most relevant features: it turned out that assessing the readability of sentences is a complex task, requiring a high number of features, mainly syntactic ones.","keywords":[""],"pages":"163-173","url":"http:\/\/acl2014.org\/acl2014\/W14-18\/pdf\/W14-1820.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of 9th Workshop on Innovative Use of NLP for Building Educational Applications (BEA 2014)","publisher":"Association for Computational Linguistics (Stroudsburg, USA)","issn":"","isbn":"978-1-941643-03-7","conference_name":"9th Workshop on Innovative Use of NLP for Building Educational Applications (BEA 2014)","conference_place":"Baltimore, Maryland, USA","conference_date":"26 giugno 2014"},{"id":132063,"last_updated":"2015-05-03 14:35:08","id_people":330111,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"DH@ILC: linee di attivit\u00e0 e ricerca","year":2014,"authors_people":"Simonetta Montemagni","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Montemagni, S."],"abstract":"Le principali linee di ricerca e sviluppo dell'ILC nel settore delle DH possono essere ricondotte ai seguenti filoni: acquisizione e conservazione di testi; progettazione e sviluppo di risorse e strumenti per il trattamento automatico di lingue classiche e variet\u00e0 storiche della lingua; progettazione e sviluppo di strumenti per l'analisi del testo; costruzione di un'infrastruttura italiana per la ricerca nell'ambito delle scienze umane e sociali.","keywords":["Digital 
Humanities","Trattamento Automatico del Linguaggio","Risorse Linguistiche"],"pages":"101-111","url":"https:\/\/publications.cnr.it\/doc\/330111","volume":"","doi":"","editors_people":"Maristella Agosti, Francesca Tomasi","editors":["Agosti, M.","Tomasi, F."],"published":"Collaborative Research Practices and Shared Infrastructures for Humanities Computing","publisher":"CLEUP (Padova, ITA)","issn":"","isbn":"9788867872602","conference_name":"2nd AIUCD Annual Conference","conference_place":"Padova, Italy","conference_date":"11-12 December 2013"},{"id":132056,"last_updated":"2015-04-23 22:57:04","id_people":329779,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Less is More? Towards a Reduced Inventory of Categories for Training a Parser for the Italian Stanford Dependencies","year":2014,"authors_people":"Simi Maria; Bosco Cristina; Montemagni Simonetta","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Simi, M.","Bosco, C.","Montemagni, S."],"abstract":"Stanford Dependencies (SD) represent nowadays a de facto standard as far as dependency annotation is concerned. The goal of this paper is to explore pros and cons of different strategies for generating SD annotated Italian texts to enrich the existing Italian Stanford Dependency Treebank (ISDT). This is done by comparing the performance of a statistical parser (DeSR) trained on a simpler resource (the augmented version of the Merged Italian Dependency Treebank or MIDT+) and whose output was automatically converted to SD, with the results of the parser directly trained on ISDT. Experiments carried out to test reliability and effectiveness of the two strategies show that the performance of a parser trained on the reduced dependencies repertoire, whose output can be easily converted to SD, is slightly higher than the performance of a parser directly trained on ISDT. 
A non-negligible advantage of the first strategy for generating SD annotated texts is that semi-automatic extensions of the training resource are more easily and consistently carried out with respect to a reduced dependency tagset. Preliminary experiments carried out for generating the collapsed and propagated SD representation are also reported.","keywords":["Italian Treebank","Harmonization and Merging of Resources","Stanford Dependencies"],"pages":"","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2014\/pdf\/818_Paper.pdf","volume":"","doi":"","editors_people":"Nicoletta Calzolari and Khalid Choukri and Thierry Declerck and Hrafn Loftsson and Bente Maegaard and Joseph Mariani and Asuncion Moreno and Jan Odijk and Stelios Piperidis","editors":["Calzolari, N.","Choukri, K.","Declerck, T.","Loftsson, H.","Maegaard, B.","Mariani, J.","Moreno, A.","Odijk, J.","Piperidis, S."],"published":"Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC'14)","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"978-2-9517408-8-4","conference_name":"Ninth International Conference on Language Resources and Evaluation (LREC'14)","conference_place":"Reykjavik, Iceland","conference_date":"26-31 May 2014"},{"id":123731,"last_updated":"2015-02-17 13:31:15","id_people":310539,"institutes":["ILC","ITTIG","IGSG"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Investigating the relationship between neuroscience and law: a case study on a corpus of Italian case law texts","year":2014,"authors_people":"M.T.Sagri, D. Tiscornia, S. Montemagni, G. Venturi,","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Sagri, Maria Teresa","Tiscornia, Daniela"],"authors_cnr_id":["5595","11040","20276"],"authors_cnr_institute":["048","048","104","104"],"authors":["Sagri, M. 
T.","Tiscornia, D.","Montemagni, S.","Venturi, G."],"abstract":"","keywords":["Neuroscience linguistic and lexico-semantic analysis"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/310539","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Language and Law in Social Practice 3rd International Conference","conference_place":"Florence","conference_date":"14-15-16-17 May 2014"},{"id":132004,"last_updated":"2023-11-06 19:33:33","id_people":310619,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Linguistically-driven selection of correct arcs for dependency parsing","year":2013,"authors_people":"Dell'Orletta F.; Venturi G.; Montemagni S.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Dell'Orletta, F.","Venturi, G.","Montemagni, S."],"abstract":"LISCA is an unsupervised algorithm aimed at assigning a quality score to each arc generated by a dependency parser in order to produce a decreasing ranking of arcs from correct to incorrect ones. LISCA exploits statistics about a set of linguistically-motivated and dependency-based features extracted from a large corpus of automatically parsed sentences and uses them to assign a quality score to each arc of a parsed sentence belonging to the same domain of the automatically parsed corpus. 
LISCA has been successfully tested on two datasets belonging to two different domains and in all experiments it turned out to outperform different baselines, thus showing to be able to reliably detect correct arcs also representing domain-specific peculiarities.","keywords":["Correct arcs","Dependency parsing"],"pages":"125-136","url":"http:\/\/cys.cic.ipn.mx\/ojs\/index.php\/CyS\/article\/view\/1517","volume":"17","doi":"","editors_people":"","editors":[""],"published":"Computaci\u00f3n y Sistemas","publisher":"","issn":"1405-5546","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132058,"last_updated":"2016-03-21 19:10:10","id_people":329781,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Tecnologie linguistico-computazionali e monitoraggio della lingua italiana","year":2013,"authors_people":"Montemagni Simonetta","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S."],"abstract":"In una riflessione su dove stia andando l'italiano del terzo millennio, \u00e8 legittimo chiedersi se e in che misura le tecnologie linguistico-computazionali possano essere di aiuto nel monitoraggio della lingua italiana nelle sue variet\u00e0 diamesiche, diafasiche e diastratiche, nonch\u00e9 sull'asse diacronico. L'obiettivo del presente contributo consiste nel fornire una risposta, sebbene preliminare, a questo interrogativo, primariamente sul versante metodologico. In particolare, si vuole mostrare che mediante il ricorso a tecnologie linguistico-computazionali \u00e8 oggi possibile monitorare un ampio spettro di tratti, che spaziano tra i diversi livelli di descrizione linguistica (primariamente, lessico, morfo-sintassi e sintassi), in relazione a corpora di sempre pi\u00f9 vaste dimensioni. 
Questo rappresenta un cambio fondamentale nello studio della variazione linguistica, in particolare della lingua italiana, fino a oggi basato su corpora di dimensioni relativamente ridotte e tipicamente condotto mediante un'analisi (semi-)manuale del testo. Come vedremo, l'uso di vasti corpora testuali combinato con il ricorso a tecnologie linguistico-computazionali per l'analisi e il monitoraggio linguistico rendono oggi possibili analisi sempre pi\u00f9 accurate e affidabili, che coprono aspetti della struttura linguistica rimasti fino a ora inesplorati in quanto difficilmente attingibili mediante un'analisi manuale del testo.","keywords":["Monitoraggio Linguistico","Trattamento Automatico del Linguaggio","Variet\u00e0 d'Uso della Lingua"],"pages":"145-172","url":"http:\/\/www.italianlp.it\/wp-content\/uploads\/2014\/04\/montemagni_silta_submission_rif.pdf","volume":"XLII","doi":"","editors_people":"","editors":[""],"published":"Studi italiani di linguistica teorica ed applicata","publisher":"Pacini Editore (Ospedaletto (PI), Italia)","issn":"0390-6809","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131941,"last_updated":"2014-11-23 21:39:42","id_people":288064,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Synchronic patterns of Tuscan phonetic variation and diachronic change: Evidence from a dialectometric study","year":2013,"authors_people":"Montemagni, Simonetta; Wieling, Martijn; de Jonge, Bob; Nerbonne, John","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Montemagni, S.","Wieling, M.","De Jonge, B.","Nerbonne, J."],"abstract":"A careful investigation of synchronic patterns of linguistic variation with underlying linguistic features can lead to important insights into the comprehension of diachronic phonetic processes. 
In this article, we showed that the method of spectral partitioning of bipartite graphs applied to synchronic dialectal data can effectively and reliably be used to investigate diachronic processes, thus contributing to a deeper understanding of the relationship between synchronic variation and diachronic change. This was illustrated through a case study carried out on Tuscan dialects, focusing on so-called Tuscan 'gorgia', a lenition process consisting of the spirantization of stop consonants. In particular, from a quantitative analysis of the sound correspondences involving voiceless and voiced stops, we tracked the evolution of the spirantization phenomenon in several respects. First, we tracked spirantization geographically, across Tuscany from the influential center of Florence to the peripheral areas. Second, we tracked it phonologically, from voiceless to voiced stops, and within each voicing class from velars to dentals and then to bilabials. Finally, we tracked it demographically, with young speakers using the most innovative sound correspondences more than old speakers. 
The fact that these results are in line with the literature on the topic of Tuscan 'gorgia' demonstrates the potential of the method of spectral partitioning of bipartite graphs with respect to the reconstruction of diachronic processes starting from diatopically distributed synchronic dialectal data.","keywords":["Tuscan dialectology","dialectometry","diachronic variation"],"pages":"157-172","url":"https:\/\/publications.cnr.it\/doc\/288064","volume":"28","doi":"10.1093\/llc\/fqs057","editors_people":"","editors":[""],"published":"Literary and linguistic computing","publisher":"Oxford University Press (Oxford, Regno Unito)","issn":"0268-1145","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":123661,"last_updated":"2023-11-06 19:33:30","id_people":266373,"institutes":["ILC","ITTIG","IGSG"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Domain Adaptation for Dependency Parsing at EVALITA 2011","year":2013,"authors_people":"F. Dell'Orletta and S. Marchi and S. Montemagni and G. Venturi and T. Agnoloni and E. Francesconi","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Marchi, Simone","Francesconi, Enrico","Agnoloni, Tommaso","Dell'Orletta, Felice"],"authors_cnr_id":["5595","10442","10498","11403","14329"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Marchi, S.","Montemagni, S.","Venturi, G.","Agnoloni, T.","Francesconi, E."],"abstract":"The domain adaptation task was aimed at investigating techniques for adapting state-of-the-art dependency parsing systems to new domains. Both the language dealt with, i.e. Italian, and the target domain, namely the legal domain, represent two main novelties of the task organised at Evalita 2011 with respect to previous domain adaptation initiatives. In this paper, we define the task and describe how the datasets were created from different resources. 
In addition, we characterize the different approaches of the participating systems, report the test results, and provide a first analysis of these results.","keywords":["Dependency Parsing","Domain Adaptation","Self-training","Active Learning","Legal-NLP"],"pages":"58-69","url":"https:\/\/publications.cnr.it\/doc\/266373","volume":"7689","doi":"","editors_people":"Bernardo Magnini, Francesco Cutugno, Mauro Falcone, Emanuele Pianta","editors":["Magnini, B.","Cutugno, F.","Falcone, M.","Pianta, E."],"published":"Evaluation of NLP and Speech Tools for Italian","publisher":"Springer (Berlin Heidelberg, DEU)","issn":"","isbn":"978-3-642-35827-2","conference_name":"","conference_place":"","conference_date":""},{"id":132055,"last_updated":"2015-04-23 22:38:51","id_people":329778,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Estrazione Terminologica Automatica e Indicizzazione: Scenari Applicativi, Problemi e Possibili Soluzioni","year":2013,"authors_people":"Montemagni Simonetta","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S."],"abstract":"Il ricorso a metodi e tecniche di estrazione automatica di terminologia settoriale da corpora di dominio, ovvero da insiemi di documenti relativi a uno specifico settore della conoscenza, rappresenta una sempre pi\u00f9 diffusa pratica di supporto al processo di indicizzazione di collezioni documentali, inteso come l'operazione volta all'individuazione delle voci indice che ne costituiscono il contenuto concettuale. 
L'obiettivo di questo contributo \u00e8 una rivisitazione critica di esperienze condotte all'interno di diversi scenari applicativi in cui i risultati del processo di estrazione automatica di terminologia sono utilizzati per la costruzione di vocabolari controllati o di thesauri sulla base dei quali \u00e8 condotto il processo di indicizzazione.","keywords":["Trattamento Automatico del Linguaggio","Estrazione Terminologica","Indicizzazione"],"pages":"241-284","url":"https:\/\/publications.cnr.it\/doc\/329778","volume":"","doi":"","editors_people":"Guarasci Roberto; Folino Antonietta","editors":["Guarasci, R.","Folino, A."],"published":"Documenti Digitali","publisher":"Iter (Milano) (Milano, ITA)","issn":"","isbn":"978-88-903419-3-9","conference_name":"","conference_place":"","conference_date":""},{"id":132057,"last_updated":"2015-04-23 23:20:46","id_people":329780,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Converting Italian Treebanks: Towards an Italian Stanford Dependency Treebank","year":2013,"authors_people":"Bosco, Cristina; Montemagni, Simonetta; Simi, Maria","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Bosco, C.","Montemagni, S.","Simi, M."],"abstract":"The paper addresses the challenge of converting MIDT, an existing dependency-based Italian treebank resulting from the harmonization and merging of smaller resources, into the Stanford Dependencies annotation formalism, with the final aim of constructing a standard-compliant resource for the Italian language. 
Achieved results include a methodology for converting treebank annotations belonging to the same dependency-based family, the Italian Stanford Dependency Treebank (ISDT), and an Italian localization of the Stanford Dependency scheme.","keywords":["Italian Treebank","Harmonization and Merging of Resources","Stanford Dependencies"],"pages":"61-69","url":"http:\/\/aclweb.org\/anthology\/W13-2308","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of the 7th Linguistic Annotation Workshop and Interoperability with Discourse","publisher":"","issn":"","isbn":"978-1-937284-58-9","conference_name":"7th Linguistic Annotation Workshop and Interoperability with Discourse","conference_place":"Sofia, Bulgaria","conference_date":"8-9 August 2013"},{"id":131888,"last_updated":"2023-11-06 19:33:31","id_people":285772,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Linguistic Profiling based on General-purpose Features and Native Language Identification","year":2013,"authors_people":"Andrea Cimino, Felice Dell'Orletta, Giulia Venturi and Simonetta Montemagni","authors_cnr":["Venturi, Giulia","Cimino, Andrea","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048","048"],"authors":["Cimino, A.","Dell'Orletta, F.","Venturi, G.","Montemagni, S."],"abstract":"In this paper, we describe our approach to native language identification and discuss the results we submitted as participants to the First NLI Shared Task. 
By resorting to a wide set of general-purpose features qualifying the lexical and grammatical structure of a text, rather than to ad hoc features specifically selected for the NLI task, we achieved encouraging results, which show that the proposed approach is general-purpose and portable across different tasks, domains and languages.","keywords":["Native Language Identification","Linguistic Profiling"],"pages":"207-215","url":"http:\/\/www.aclweb.org\/anthology\/W13-1727","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-1-937284-47-3","conference_name":"8th workshop on \"Innovative Use of NLP for Building Educational Applications\"","conference_place":"Atlanta (Georgia)","conference_date":"13 giugno 2013"},{"id":131886,"last_updated":"2023-11-06 19:33:32","id_people":278421,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Linguistic Profiling of Texts Across Textual Genre and Readability Level. 
An exploratory Study on Italian Fictional Prose","year":2013,"authors_people":"Dell'Orletta F and Montemagni S and VENTURI G.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"","keywords":[""],"pages":"189-197","url":"https:\/\/publications.cnr.it\/doc\/278421","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of Recent Advances in Natural Language Processing (RANLP 2013)","publisher":"","issn":"","isbn":"","conference_name":"Recent Advances in Natural Language Processing (RANLP 2013)","conference_place":"Hissar, Bulgaria","conference_date":"7-13 settembre"},{"id":131889,"last_updated":"2023-11-06 19:33:36","id_people":285773,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Unsupervised Linguistically-Driven Reliable Dependency Parses Detection and Self-Training for Adaptation to the Biomedical Domain","year":2013,"authors_people":"Felice Dell'Orletta, Giulia Venturi, Simonetta Montemagni","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Dell'Orletta, F.","Venturi, G.","Montemagni, S."],"abstract":"In this paper, a new self-training method for domain adaptation is illustrated, where the selection of reliable parses is carried out by an unsupervised linguistically-driven algorithm, ULISSE. 
The method has been tested on biomedical texts with results showing a significant improvement with respect to considered baselines, which demonstrates its ability to capture both reliability of parses and domain-specificity of linguistic constructions.","keywords":["Self-training","Domain Adaptation","Biomedical Texts"],"pages":"45-53","url":"http:\/\/www.aclweb.org\/anthology\/W13-1906","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-1-937284-55-8","conference_name":"12th workshop on \"Biomedical Natural Language Processing\" (BioNLP)","conference_place":"Sofia (Bulgaria)","conference_date":"8-9 agosto 2013"},{"id":124028,"last_updated":"2015-05-03 14:56:22","id_people":330113,"institutes":["ILC","ITTIG","IGSG"],"type":"edited_volume","type_order":3,"type_people":"book","title":"Proceedings of the Fourth Workshop on Semantic Processing of Legal Texts (SPLeT 2012)","year":2012,"authors_people":"Enrico Francesconi, Simonetta Montemagni, Wim Peters, Adam Wyner","authors_cnr":["Montemagni, Simonetta","Francesconi, Enrico"],"authors_cnr_id":["5595","10498"],"authors_cnr_institute":["048","104"],"authors":["Francesconi, E.","Montemagni, S.","Peters, W.","Wyner, A."],"abstract":"","keywords":["Trattamento Automatico del Linguaggio","Linguaggio Giuridico","Estrazione di Conoscenza"],"pages":"71","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2012\/workshops\/27.LREC%202012%20Workshop%20Proceedings%20SPLeT.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"978-2-9517408-7-7","conference_name":"","conference_place":"","conference_date":""},{"id":132003,"last_updated":"2023-11-06 19:33:39","id_people":310580,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Lessico settoriale e lessico comune dell'estrazione di terminologia specialistica da 
corpora di dominio","year":2012,"authors_people":"Bonin F., Dell'Orletta F., Montemagni S., Venturi G.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Bonin, F.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"","keywords":[""],"pages":"207-220","url":"https:\/\/publications.cnr.it\/doc\/310580","volume":"","doi":"","editors_people":"","editors":[""],"published":"Lessico e Lessicologia. Atti del XLIV congresso internazionale di studi della societ\u00e0 di linguistica italiana","publisher":"Bulzoni Editore (Roma, ITA)","issn":"","isbn":"978-88-7870-655-2","conference_name":"XLIV congresso internazionale di studi della societ\u00e0 di linguistica italiana","conference_place":"Viterbo","conference_date":"27-29 settembre 2010"},{"id":132061,"last_updated":"2015-05-02 17:54:39","id_people":330109,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Harmonization and Merging of two Italian Dependency Treebanks","year":2012,"authors_people":"Cristina Bosco; Simonetta Montemagni; Maria Simi","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Bosco, C.","Montemagni, S.","Simi, M."],"abstract":"The paper describes the methodology which is currently being defined for the construction of a \"Merged Italian Dependency Treebank\" (MIDT) starting from already existing resources. In particular, it reports the results of a case study carried out on two available dependency treebanks, i.e. TUT and ISST-TANL. The issues raised during the comparison of the annotation schemes underlying the two treebanks are discussed and investigated with a particular emphasis on the definition of a set of linguistic categories to be used as a \"bridge\" between the specific schemes. 
As an encoding format, the CoNLL de facto standard is used.","keywords":["Syntactic Annotation","Merging of Resources","Dependency Parsing"],"pages":"23-30","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2012\/workshops\/06.LREC%202012%20Merging%20Proceedings.pdf","volume":"","doi":"","editors_people":"Nuria Bel et al.","editors":["Bel, N."],"published":"Proceedings of the LREC 2012 Workshop on Language Resource Merging","publisher":"European Language Resources Association ELRA (Paris, FRA)","issn":"","isbn":"978-2-9517408-7-7","conference_name":"LREC 2012 Workshop on Language Resource Merging","conference_place":"Istanbul","conference_date":"22 May 2012"},{"id":131746,"last_updated":"2023-11-06 19:33:41","id_people":219489,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"The SPLeT-2012 Shared Task on Dependency Parsing of Legal Texts","year":2012,"authors_people":"Dell'Orletta, Felice [1]; Marchi, Simone [1]; Montemagni, Simonetta [1]; Plank, Barbara [2]; Venturi, Giulia [3]","authors_cnr":["Montemagni, Simonetta","Marchi, Simone","Dell'Orletta, Felice"],"authors_cnr_id":["5595","10442","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Dell'Orletta, F.","Marchi, S.","Montemagni, S.","Plank, B.","Venturi, G."],"abstract":"The 4th Workshop on \"Semantic Processing of Legal Texts\" (SPLeT-2012) presents the first multilingual shared task on Dependency Parsing of Legal Texts. In this paper, we define the general task and its internal organization into sub-tasks, describe the datasets and the domain-specific linguistic peculiarities characterizing them. 
We finally report the results achieved by the participating systems, describe the underlying approaches and provide a first analysis of the final test results.","keywords":["Dependency Parsing","Domain Adaptation","Legal Text Processing"],"pages":"","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2012\/workshops\/27.LREC%202012%20Workshop%20Proceedings%20SPLeT.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Fourth Workshop on Semantic Processing of Legal Texts (SPLeT 2012)-First Shared Task on Dependency Parsing of Legal Texts (SPLeT 2012)","conference_place":"Istanbul","conference_date":"27 Maggio 2012"},{"id":131745,"last_updated":"2023-11-06 19:33:37","id_people":219483,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Domain Adaptation for Dependency Parsing at Evalita 2011","year":2012,"authors_people":"Dell'Orletta, Felice [1]; Marchi, Simone [1]; Montemagni, Simonetta [1]; Venturi, Giulia [2]; Agnoloni, Tommaso [3]; Francesconi, Enrico [3]","authors_cnr":["Agnoloni, Tommaso","Montemagni, Simonetta","Marchi, Simone","Francesconi, Enrico","Dell'Orletta, Felice"],"authors_cnr_id":["5595","10442","10498","14329"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Marchi, S.","Montemagni, S.","Venturi, G.","Agnoloni, T.","Francesconi, E."],"abstract":"The domain adaptation task was aimed at investigating techniques for adapting state-of-the-art dependency parsing systems to new domains. Both the language dealt with, i.e. Italian, and the target domain, namely the legal domain, represent two main novelties of the task organised at Evalita 2011. In this paper, we define the task and describe how the datasets were created from different resources. 
In addition, we characterize the different approaches of the participating systems, report the test results, and provide a first analysis of these results.","keywords":["Dependency Parsing","Domain Adaptation","Legal Text Processing"],"pages":"1-7","url":"http:\/\/www.evalita.it\/sites\/evalita.fbk.eu\/files\/working_notes2011\/Domain_Adaptation\/","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Evaluation of NLP and Speech Tools for Italian (EVALITA 2011): Domain Adaptation track","conference_place":"Roma","conference_date":"24-25 Gennaio 2012"},{"id":131885,"last_updated":"2023-11-06 19:33:38","id_people":278420,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Genre-oriented Readability Assessment: a Case Study","year":2012,"authors_people":"Dell'Orletta F and Montemagni S and VENTURI G.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"","keywords":[""],"pages":"91-98","url":"https:\/\/publications.cnr.it\/doc\/278420","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of Workshop on \"Speech and Language Processing Tools in Education\" (SLP-TED)","publisher":"","issn":"","isbn":"978-1-62748-389-6","conference_name":"Workshop on \"Speech and Language Processing Tools in Education\" (SLP-TED)","conference_place":"Mumbai, India","conference_date":"15 December, 2012"},{"id":131878,"last_updated":"2014-10-24 00:38:01","id_people":285544,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Enriching the ISST-TANL Corpus with Semantic Frames","year":2012,"authors_people":"Lenci, Alessandro; Montemagni, Simonetta; Venturi, Giulia; Cutrulla, Maria Rosaria","authors_cnr":["Venturi, 
Giulia","Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048","048"],"authors":["Lenci, A.","Montemagni, S.","Venturi, G.","Cutrulla, M. R."],"abstract":"The paper describes the design and the results of a manual annotation methodology devoted to enrich the ISST-TANL Corpus with Semantic Frames information. The main issues encountered in applying the English FrameNet annotation criteria to a corpus of Italian language are discussed together with the choice of anchoring the semantic annotation layer to the underlying dependency syntactic structure. We also describe an experiment to measure inter-annotator agreement and a first case study to extend and specialise FrameNet annotation to a corpus of legislative texts.","keywords":["Semantic annotation","FrameNet","Multi-layer annotated corpus"],"pages":"3719-3726","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2012\/pdf\/986_Paper.pdf","volume":"","doi":"","editors_people":"Nicoletta Calzolari (Conference Chair) and Khalid Choukri and Thierry Declerck and Mehmet U\u011fur Do\u011fan and Bente Maegaard and Joseph Mariani and Asuncion Moreno and Jan Odijk and Stelios Piperidis","editors":["Calzolari, N.","Choukri, K.","Declerck, T.","Do\u011fan, M. 
U.","Maegaard, B.","Mariani, J.","Moreno, A.","Odijk, J.","Piperidis, S."],"published":"Proceedings of the Eight International Conference on Language Resources and Evaluation (LREC'12)","publisher":"European language resources association (ELRA) (Paris, FRA)","issn":"","isbn":"978-2-9517408-7-7","conference_name":"Eight International Conference on Language Resources and Evaluation (LREC'12)","conference_place":"Istanbul, Turkey","conference_date":"23-25 May 2012"},{"id":132065,"last_updated":"2015-05-03 15:21:07","id_people":330114,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Patterns of Language Variation and Underlying Linguistic Features: A New Dialectometric Approach","year":2012,"authors_people":"Simonetta Montemagni, Martijn Wieling, Bob de Jonge, John Nerbonne","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Montemagni, S.","Wieling, M.","De Jonge, B.","Nerbonne, J."],"abstract":"","keywords":[""],"pages":"879-889","url":"https:\/\/publications.cnr.it\/doc\/330114","volume":"II","doi":"","editors_people":"Patricia Bianchi, Nicola De Blasi, Chiara De Caprio, Francesco Montuori","editors":["Bianchi, P.","De Blasi, N.","De Caprio, C.","Montuori, F."],"published":"La variazione nell'italiano e nella sua storia. Variet\u00e0 e varianti linguistiche e testuali. 
Atti dell'XI Congresso SILFI (Societ\u00e0 Internazionale di Linguistica e Filologia Italiana)","publisher":"Franco Cesati Editore (Firenze, ITA)","issn":"","isbn":"978-88-7667-433-4","conference_name":"XI Congresso SILFI (Societ\u00e0 Internazionale di Linguistica e Filologia Italiana)","conference_place":"Napoli","conference_date":"5-7 Ottobre 2010"},{"id":131669,"last_updated":"2016-03-18 14:44:40","id_people":205232,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"The BioLexicon: a large-scale terminological resource for biomedical text mining","year":2011,"authors_people":"Paul Thompson, John McNaught, Simonetta Montemagni, Nicoletta Calzolari, Riccardo del Gratta, Vivian Lee, Simone Marchi, Monica Monachini, Piotr Pezik, Valeria Quochi, CJ Rupp, Yutaka Sasaki, Giulia Venturi, Dietrich Rebholz-Schuhmann, Sophia Ananiadou","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Monachini, Monica","Marchi, Simone","Quochi, Valeria","Del Gratta, Riccardo","Zamorani, Nicoletta"],"authors_cnr_id":["5595","8945","10442","11893","11933","26123"],"authors_cnr_institute":["048","048","048","048","048","048","048"],"authors":["Thompson, P.","McNaught, J.","Montemagni, S.","Calzolari, N.","Del Gratta, R.","Lee, V.","Marchi, S.","Monachini, M.","Pezik, P.","Quochi, V.","Rupp, C.","Sasaki, Y.","Venturi, G.","Rebholz Schuhmann, D.","Ananiadou, S."],"abstract":"Background Due to the rapidly expanding body of biomedical literature, biologists require increasingly sophisticated and efficient systems to help them to search for relevant information. Such systems should account for the multiple written variants used to represent biomedical concepts, and allow the user to search for specific pieces of knowledge (or events) involving these concepts, e.g., protein-protein interactions. Such functionality requires access to detailed information about words used in the biomedical literature. 
Existing databases and ontologies often have a specific focus and are oriented towards human use. Consequently, biological knowledge is dispersed amongst many resources, which often do not attempt to account for the large and frequently changing set of variants that appear in the literature. Additionally, such resources typically do not provide information about how terms relate to each other in texts to describe events. Results This article provides an overview of the design, construction and evaluation of a large-scale lexical and conceptual resource for the biomedical domain, the BioLexicon. The resource can be exploited by text mining tools at several levels, e.g., part-of-speech tagging, recognition of biomedical entities, and the extraction of events in which they are involved. As such, the BioLexicon must account for real usage of words in biomedical texts. In particular, the BioLexicon gathers together different types of terms from several existing data resources into a single, unified repository, and augments them with new term variants automatically extracted from biomedical literature. Extraction of events is facilitated through the inclusion of biologically pertinent verbs (around which events are typically organized) together with information about typical patterns of grammatical and semantic behaviour, which are acquired from domain-specific texts. In order to foster interoperability, the BioLexicon is modelled using the Lexical Markup Framework, an ISO standard. Conclusions The BioLexicon contains over 2.2 M lexical entries and over 1.8 M terminological variants, as well as over 3.3 M semantic relations, including over 2 M synonymy relations. Its exploitation can benefit both application developers and users. 
We demonstrate some such benefits by describing integration of the resource into a number of different tools, and evaluating improvements in performance that this can bring.","keywords":["Text Mining","Information Extraction","Computational Lexicon"],"pages":"1-29","url":"http:\/\/www.biomedcentral.com\/1471-2105\/12\/397","volume":"12","doi":"10.1186\/1471-2105-12-397","editors_people":"","editors":[""],"published":"BMC bioinformatics","publisher":"BioMed Central ([London], Regno Unito)","issn":"1471-2105","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132015,"last_updated":"2023-11-06 19:33:43","id_people":138775,"institutes":["ILC","IRISS"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Tecnologie linguistico-computazionali per il monitoraggio della competenza linguistica italiana degli alunni stranieri nella scuola primaria e secondaria","year":2011,"authors_people":"Dell'Orletta Felice; Montemagni Simonetta; Vecchi Eva Maria; Venturi Giulia","authors_cnr":["Vecchi, Eva Maria","Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["071","071","048","048"],"authors":["Dell'Orletta, F.","Montemagni, S.","Vecchi, E. M.","Venturi, G."],"abstract":"La possibilit\u00e0 di disporre di tecnologie avanzate e innovative che permettano di monitorare la competenza linguistica degli alunni stranieri e, al contempo, valutare l'adeguatezza dei materiali didattici a loro offerti pu\u00f2 essere di supporto all'insegnante nell'orientare la propria azione formativa, rendendo cos\u00ec il processo di integrazione linguistico-culturale meno faticoso e traumatico. 
In tale ottica, questo studio, realizzato col supporto di una piattaforma ormai consolidata di metodi e strumenti per il trattamento automatico dell'italiano, costituisce il primo tentativo condotto in relazione alla lingua italiana, per mettere a punto una metodologia di monitoraggio linguistico rivolta specificamente agli studenti apprendenti la lingua italiana come L2 ed alle loro produzioni scritte.","keywords":["Trattamento Automatico del Linguaggio","Stranieri","Lingua italiana"],"pages":"319-336","url":"https:\/\/publications.cnr.it\/doc\/138775","volume":"","doi":"","editors_people":"Bruno Giovanni Carlo; Caruso Immacolata; Sanna Manuela; Vellecco Immacolata","editors":["Bruno, G. C.","Caruso, I.","Sanna, M.","Vellecco, I."],"published":"Percorsi Migranti","publisher":"Mc Graw-Hill (Milano, ITA)","issn":"","isbn":"978-88-386-7296-5","conference_name":"","conference_place":"","conference_date":""},{"id":131676,"last_updated":"2023-11-06 19:33:42","id_people":205510,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"READ-IT: assessing readability of Italian texts with a view to text simplification","year":2011,"authors_people":"Felice Dell'Orletta, Simonetta Montemagni, Giulia Venturi","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"In this paper, we propose a new approach to readability assessment with a specific view to the task of text simplification: the intended audience includes people with low literacy skills and\/or with mild cognitive impairment. READ-IT represents the first advanced readability assessment tool for what concerns Italian, which combines traditional raw text features with lexical, morpho-syntactic and syntactic information. 
In READ-IT readability assessment is carried out with respect to both documents and sentences where the latter represents an important novelty of the proposed approach creating the prerequisites for aligning the readability assessment step with the text simplification process. READ-IT shows a high accuracy in the document classification task and promising results in the sentence classification scenario.","keywords":["Readability Assessment","Text Simplification"],"pages":"73-83","url":"http:\/\/dl.acm.org\/citation.cfm?id=2140511","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-1-937284-14-5","conference_name":"SLPAT '11 Proceedings of the Second Workshop on Speech and Language Processing for Assistive Technologies","conference_place":"Edimburgo, UK","conference_date":"30 Luglio 2011"},{"id":131675,"last_updated":"2023-11-06 19:33:46","id_people":205505,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"ULISSE: an unsupervised algorithm for detecting reliable dependency parses","year":2011,"authors_people":"Felice Dell'Orletta, Giulia Venturi and Simonetta Montemagni","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Dell'Orletta, F.","Venturi, G.","Montemagni, S."],"abstract":"In this paper we present ULISSE, an unsupervised linguistically--driven algorithm to select reliable parses from the output of a dependency parser. Different experiments were devised to show that the algorithm is robust enough to deal with the output of different parsers and with different languages, as well as to be used across different domains. 
In all cases, ULISSE appears to outperform the baseline algorithms.","keywords":["Dependency Parsing","Selection of Reliable Parses","Unsupervised Algorithm"],"pages":"115-124","url":"http:\/\/dl.acm.org\/citation.cfm?id=2018950","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-1-932432-92-3","conference_name":"CoNLL '11 Proceedings of the Fifteenth Conference on Computational Natural Language Learning","conference_place":"Portland, Oregon, USA","conference_date":"23-24 Giugno 2011"},{"id":131689,"last_updated":"2023-11-06 19:33:45","id_people":205737,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Towards an NLP-based approach for measuring syntactic complexity: preliminary experiments with Italian texts from different registers","year":2011,"authors_people":"Felice Dell'Orletta, Simonetta Montemagni","authors_cnr":["Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048"],"authors":["Dell'Orletta, F.","Montemagni, S."],"abstract":"In this paper, we explore how NLP can be used to automatically identify relevant syntactic complexity features in texts with the aim of assessing their correlation with specific linguistic registers. Our final goal is twofold. On the one hand, we demonstrate that automatic morpho-syntactic and syntactic annotation of texts provides sufficiently accurate output for use in the automatic extraction and measurement of syntactic complexity features. 
On the other hand, we identify the set of syntactic features strongly correlating with considered linguistic registers.","keywords":["Language Variation","Natural Language Processing","Syntactic Complexity"],"pages":"","url":"http:\/\/www.benszm.net\/BSBWWS\/Dellorletta_Montemagni.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Workshop on \"Cross-linguistic and language-internal variation in text and speech: focus on the joint analysis of multiple characteristics\"","conference_place":"Freiburg Institute for Advanced Studies (FRIAS), University of Freiburg","conference_date":"29\/10\/2010"},{"id":131691,"last_updated":"2013-02-28 11:00:52","id_people":205779,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Ontology Learning. An introduction","year":2011,"authors_people":"Simonetta Montemagni","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Montemagni, S."],"abstract":"The tutorial is organised into two parts: PART 1 is devoted to provide the basic notions underlying Ontology Learning, in particular why it is needed, how it can be carried out and how its results can be evaluated. PART 2 discusses the topic of Ontology Learning in the Legal domain, with particular attention to the specific challenges posed by it. 
It also provides an overview of different feasibility studies carried out in the legal domain.","keywords":["Ontology Learning","Legal Information extraction","Natural Language Processing"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/205779","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Summer School LEX 2011, Ravenna, Italy \"Managing Legal Resources in the Semantic Web\"","conference_place":"Ravenna, Italia","conference_date":"8 settembre 2011"},{"id":131694,"last_updated":"2013-03-01 15:53:33","id_people":205911,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Synchronic patterns of Tuscan phonetic variation and diachronic change: evidence from a dialectometric study","year":2011,"authors_people":"Simonetta Montemagni, Martijn Wieling, Bob De Jonge, John Nerbonne","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Montemagni, S.","Wieling, M.","De Jonge, B.","Nerbonne, J."],"abstract":"A careful investigation of synchronic patterns of linguistic variation with underlying linguistic features can lead to important insights into the comprehension of diachronic phonetic processes. Starting from the analysis of synchronic patterns of phonetic variation in Tuscany we tackled one of the main and most debated features of Tuscan dialects, the phenomenon of spirantization with a specific view to the so-called Tuscan \"gorgia\" (i.e. voiceless spirantization). In particular, we showed that the newly proposed method of spectral partitioning of bipartite graphs applied to synchronic dialectal data can effectively be used to investigate diachronic phonetic processes. From a careful analysis of the sound correspondences involving voiceless and voiced stops, we tracked the evolution of the spirantization phenomenon in several respects. 
First, we tracked spirantization geographically, across Tuscany from the influential center of Florence to the peripheral areas. Second, we tracked it phonologically, from voiceless to voiced stops, and within each voicing class from velars to dentals and then to bilabials. Finally, we tracked it demographically, with young speakers using the most innovative sound correspondences more than old speakers. The fact that these results are in line with the literature on the topic of Tuscan \"gorgia\" demonstrates the potential of the method of spectral partitioning of bipartite graphs with respect to the reconstruction of diachronic processes starting from diatopically distributed synchronic dialectal data.","keywords":["Dialectometry","Phonetic Variation","Tuscan Dialects"],"pages":"120-121","url":"http:\/\/westernlinguistics.ca\/methods14\/files\/all_abstracts_one_document.pdf","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Fourteenth Methods in Dialectology Conference","conference_place":"University of Western Ontario","conference_date":"2-6 August 2011"},{"id":131720,"last_updated":"2013-03-13 10:17:55","id_people":206506,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Definizione di un modello computazionale della variazione dialettale basato sull'integrazione di fattori socio-demografici e geografici","year":2011,"authors_people":"Simonetta Montemagni, Martijn Wieling,","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Montemagni, S.","Wieling, M."],"abstract":"In this study, we used a mixed-effects logistic regression model in combination with generalized additive logistic modeling to predict lexical differences in Tuscan dialects with respect to standard Italian. We used lexical information for 170 concepts in 213 locations in Tuscany. 
Although geographical position is an important predictor with locations distant from Florence having lexical forms more likely to differ from standard Italian, several other factors emerged as significant. The model predicts that lexical variants used by older speakers and in smaller as well as poorer communities are more likely to differ from standard Italian. The impact of the demographic variables, however, varied from concept to concept. For a majority of concepts, smaller and poorer communities have lexical forms different from standard Italian. For a smaller minority of concepts, however, larger and richer communities have lexical forms different from standard Italian. Similarly, the effect of speaker age and the average community age also varied per concept. While not significant as a fixed effect, the concept frequency showed significant geographical variation. These results clearly identify important factors involved in dialect variation at the lexical level. In addition, this study illustrates the usefulness of mixed-effects regression techniques together with generalized additive modeling for analyzing lexical dialect data.","keywords":["Dialettologia toscana","Dialettometria","variazione lessicale"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/206506","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131884,"last_updated":"2023-11-06 19:33:53","id_people":278419,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Singling out Legal Knowledge from World Knowledge","year":2010,"authors_people":"Bonin F and Dell'Orletta F and VENTURI G. 
and Montemagni S","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":[""],"authors":["Bonin, F.","Dell'Orletta, F.","Venturi, G.","Montemagni, S."],"abstract":"","keywords":[""],"pages":"217-229","url":"https:\/\/publications.cnr.it\/doc\/278419","volume":"","doi":"","editors_people":"","editors":[""],"published":"Informatica e diritto","publisher":"Edizioni Scientifiche Italiane (Firenze, Italia)","issn":"0390-0975","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":121242,"last_updated":"2013-10-20 11:16:28","id_people":30888,"institutes":["ILC","ITTIG","IGSG"],"type":"journal_article","type_order":0,"type_people":"article","title":"Integrating a Bottom-Up and Top-Down Methodology for Building Semantic Resources for the Multilingual Legal Domain","year":2010,"authors_people":"Francesconi E.; Montemagni S.; Peters W.; Tiscornia D.","authors_cnr":["Montemagni, Simonetta","Francesconi, Enrico"],"authors_cnr_id":["5595","10498"],"authors_cnr_institute":["104"],"authors":["Francesconi, E.","Montemagni, S.","Peters, W.","Tiscornia, D."],"abstract":"This article presents a methodology for multilingual legal knowledge acquisition and modelling. It encompasses two complementary strategies. On the one hand, there is the top-down definition of the conceptual structure of the legal domain under consideration on the basis of expert judgment. This structure is language-independent, modeled as an ontology, and can be aligned with other ontologies that capture similar or complementary knowledge, in order to provide a wider conceptual embedding. Another top-down approach is the exploitation of the explicit structure of legal texts, which enables the targeted identification of text spans that play an ontological role and their subsequent inclusion in the knowledge model. 
On the other hand, the linguistically motivated, text-based bottom-up population and incremental refinement of this conceptual structure using (semi-)automatic NLP techniques, maximizes the completeness and domain-specificity of the resulting knowledge. The proposed methodology is concerned with the relation between these two differently derived types of knowledge, and defines a framework for interfacing lexical and ontological knowledge, the result of which offers various perspectives on multilingual legal knowledge. Two case-studies combining bottom-up and top-down methodologies for knowledge modelling and learning are presented as illustrations of the methodology.","keywords":["Knowledge Modelling","Knowledge Acquisition","Natural Language Processing","Ontology Learning"],"pages":"95-121","url":"https:\/\/publications.cnr.it\/doc\/30888","volume":"6036\/","doi":"","editors_people":"","editors":[""],"published":"Lecture notes in computer science","publisher":"Springer (Berlin, Germania)","issn":"0302-9743","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":123398,"last_updated":"2012-03-23 11:07:38","id_people":170395,"institutes":["ILC","ITTIG","IGSG"],"type":"book","type_order":1,"type_people":"book","title":"Semantic Processing of Legal Texts: Where the Language of Law Meets the Law of Language","year":2010,"authors_people":"Francesconi E., Montemagni S., Peters W., Tiscornia D. (a cura di)","authors_cnr":["Montemagni, Simonetta","Francesconi, Enrico","Tiscornia, Daniela"],"authors_cnr_id":["5595","10498","20276"],"authors_cnr_institute":[""],"authors":["Francesconi, E.","Montemagni, S.","Peters, W.","Tiscornia, D."],"abstract":"The last few years have seen a growing body of research and practice addressing aspects such as automated legal reasoning and argumentation, semantic and cross-language legal information retrieval, document classification, legal drafting, legal knowledge discovery and extraction. 
This State-of-the-Art Survey contains invited contributions of leading researchers and groups eminently active in the field, which were complemented with selected papers from the Workshop on Semantic Processing of Legal Texts, held in Marrakech, Morocco, in 2008, within the framework of the Sixth International Conference on Language Resources and Evaluation (LREC 2008). These publications mirror the state-of-the-art in linguistic technologies, tools and resources focusing on the automatic extraction of relevant information from legal texts, and the structured organization of this extracted knowledge for legal knowledge representation and scholarly activity, with particular emphasis on the crucial role played by language resources and human language technologies. The contents are organized in three topical sections on information extraction; construction of knowledge resources; and semantic indexing, summarization and translation.","keywords":["Legal Text Processing, Ontology Learning, Information Extraction"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/170395","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":123465,"last_updated":"2012-06-07 20:57:09","id_people":186091,"institutes":["ILC","ITTIG","IGSG"],"type":"edited_volume","type_order":3,"type_people":"book","title":"Semantic Processing of Legal Texts: Where the Language of Law Meets the Law of Language","year":2010,"authors_people":"Francesconi, E.; Montemagni, S.; Peters, W.; Tiscornia, D.","authors_cnr":["Montemagni, Simonetta","Francesconi, Enrico","Tiscornia, Daniela"],"authors_cnr_id":["5595","10498","20276"],"authors_cnr_institute":["048","104","104"],"authors":["Francesconi, E.","Montemagni, S.","Peters, W.","Tiscornia, D."],"abstract":"The last few years have seen a growing body of research and practice addressing aspects such as automated legal reasoning and 
argumentation, semantic and cross-language legal information retrieval, document classification, legal drafting, legal knowledge discovery and extraction. This State-of-the-Art Survey contains invited contributions of leading researchers and groups eminently active in the field, which were complemented with selected papers from the Workshop on Semantic Processing of Legal Texts, held in Marrakech, Morocco, in 2008, within the framework of the Sixth International Conference on Language Resources and Evaluation (LREC 2008). These publications mirror the state-of-the-art in linguistic technologies, tools and resources focusing on the automatic extraction of relevant information from legal texts, and the structured organization of this extracted knowledge for legal knowledge representation and scholarly activity, with particular emphasis on the crucial role played by language resources and human language technologies. The contents are organized in three topical sections on information extraction; construction of knowledge resources; and semantic indexing, summarization and translation.","keywords":[""],"pages":"249","url":"https:\/\/publications.cnr.it\/doc\/186091","volume":"6036","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-3-642-12836-3","conference_name":"","conference_place":"","conference_date":""},{"id":131387,"last_updated":"2011-05-26 00:00:00","id_people":136477,"institutes":["ILC"],"type":"edited_volume","type_order":3,"type_people":"book","title":"Proceedings of the LREC 2010 Workshop on SEMANTIC PROCESSING OF LEGAL TEXTS (SPLeT-2010)","year":2010,"authors_people":"Francesconi E.; Montemagni S.; Peters W.; Wyner A.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Francesconi, E.","Montemagni, S.","Peters, W.","Wyner, A."],"abstract":"","keywords":["Legal Knowledge Extraction, Natural Language 
Processing"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/136477","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":122388,"last_updated":"2013-10-20 10:57:59","id_people":136476,"institutes":["ILC","ITTIG","IGSG"],"type":"edited_volume","type_order":3,"type_people":"book","title":"Proceedings of the 4th Workshop on Legal Ontologies and Artificial Intelligence Techniques (LOAIT 2010)","year":2010,"authors_people":"Francesconi E.; Montemagni S.; Rossi P.; Tiscornia D.","authors_cnr":["Montemagni, Simonetta","Francesconi, Enrico","Tiscornia, Daniela"],"authors_cnr_id":["5595","10498","20276"],"authors_cnr_institute":["104","104"],"authors":["Francesconi, E.","Montemagni, S.","Rossi, P.","Tiscornia, D."],"abstract":"","keywords":["Legal Ontologies","Ontology Learning","Legal Knowledge Extraction","Legal Knowledge Modelling"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/136476","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131221,"last_updated":"1970-01-01 01:00:00","id_people":84775,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"A Resource and Tool for Super-sense Tagging of Italian Texts","year":2010,"authors_people":"Attardi G.; Dei Rossi S.; Di Pietro G.; Lenci A.; Montemagni S.; Simi M.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Attardi, G.","Dei Rossi, S.","Di Pietro, G.","Lenci, A.","Montemagni, S.","Simi, M."],"abstract":"","keywords":["Corpus (creation, annotation, etc.)","Tools","Systems","Applications","Statistical and machine learning 
methods"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84775","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Seventh International Conference on Language Resources and Evaluation","conference_place":"Valletta, Malta","conference_date":"2010"},{"id":131238,"last_updated":"2023-11-06 19:33:47","id_people":84796,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"A Contrastive Approach to Multi-word Extraction from Domain-specific Corpora","year":2010,"authors_people":"Bonin F.; Dell'Orletta F.; Montemagni S.; Venturi G.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Bonin, F.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"In this paper we present a novel approach to multi-word terminology extraction combining a well-known automatic term recognition approach, the C-NC value method, with a contrastive ranking technique, aimed at refining obtained results either by filtering noise due to common words or by discerning between semantically different types of terms within heterogeneous terminologies. 
The proposed methodology has been tested in two case studies carried out in the History of Art and Legal domains with promising results.","keywords":["Terminology Extraction","Domain-specific Corpora","Multi-word Expression"],"pages":"3222-3229","url":"https:\/\/publications.cnr.it\/doc\/84796","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"2-9517408-6-7","conference_name":"Seventh International Conference on Language Resources and Evaluation","conference_place":"Valletta, Malta","conference_date":"19-21 maggio 2010"},{"id":131244,"last_updated":"2023-11-06 19:33:50","id_people":84802,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Contrastive filtering of domain specific multi-word terms from different types of corpora","year":2010,"authors_people":"Bonin F.; Dell'Orletta F.; Venturi G.; Montemagni S.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Dell'Orletta, Felice"],"authors_cnr_id":["5595","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Bonin, F.","Dell'Orletta, F.","Venturi, G.","Montemagni, S."],"abstract":"In this paper we tackle the challenging task of Multi-word term (MWT) extraction from different types of specialized corpora. Contrastive filtering of previously extracted MWTs results in a considerable increment of acquired domain-specific terms.","keywords":["multi-word terms extraction","corpora"],"pages":"76-79","url":"https:\/\/publications.cnr.it\/doc\/84802","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-7-900268-00-6","conference_name":"The 23rd International Conference on Computational Linguistics (COLING 2010). 
Multiword Expressions: from Theory to Applications (MWE 2010)","conference_place":"Beijing, China","conference_date":"28 agosto 2010"},{"id":131241,"last_updated":"1970-01-01 01:00:00","id_people":84799,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Evalita'09 Parsing Task: comparing dependency parsers and treebanks","year":2010,"authors_people":"Bosco C.; Montemagni S.; Mazzei A.; Dell'Orletta F.; Lenci A.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Bosco, C.","Montemagni, S.","Mazzei, A.","Dell'Orletta, F.","Lenci, A."],"abstract":"","keywords":["dependency parsing","dependency treebank"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84799","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Evaluation of NLP and Speech Tools for Italian. EVALITA 2009","conference_place":"Reggio Emilia, Italy","conference_date":"2010"},{"id":131232,"last_updated":"1970-01-01 01:00:00","id_people":84789,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Comparing the Influence of Different Treebank Annotations on Dependency Parsing","year":2010,"authors_people":"Bosco C.; Montemagni S.; Mazzei A.; Lombardo V.; Dell'Orletta F.; Lenci A.; Lesmo L.; Attardi G.; Simi M.; Lavelli A.; Hall J.; Nilsson J.; Nivre J.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Bosco, C.","Montemagni, S.","Mazzei, A.","Lombardo, V.","Dell'Orletta, F.","Lenci, A.","Lesmo, L.","Attardi, G.","Simi, M.","Lavelli, A.","Hall, J.","Nilsson, J.","Nivre, J."],"abstract":"","keywords":["Parsing","Corpus (creation, annotation, etc.)","Evaluation 
methodologies"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84789","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Seventh International Conference on Language Resources and Evaluation","conference_place":"Valletta, Malta","conference_date":"2010"},{"id":131218,"last_updated":"2012-06-05 17:44:53","id_people":84772,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Esplorazioni computazionali nello spazio della variazione lessicale in Toscana","year":2010,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Montemagni, S."],"abstract":"Il passaggio dalla descrizione della distribuzione geografica di singole parole a un livello di descrizione pi\u00f9 astratto volto a formulare generalizzazioni relative alla variazione diatopica \u00e8 oggi reso possibile dal ricorso a tecnologie linguistico-computazionali affiancate da tecniche di analisi statistica multivariata. L'uso combinato di queste tecniche si \u00e8 dimostrato particolarmente promettente nello studio della variazione linguistica (principalmente fonetica e lessicale) di diverse lingue e dialetti, tipologicamente anche molto distanti. Tali tecniche sono state anche proficuamente utilizzate per l'analisi del contatto tra variet\u00e0 linguistiche e una norma di riferimento. L'articolo si colloca all'interno di questo filone di ricerca, riportando i risultati di esplorazioni computazionali nello spazio della variazione lessicale in Toscana. Tali esplorazioni intendono ripercorrere i passi di Gabriella Giacomelli, ideatrice e direttrice dell'impresa dell'Atlante Lessicale Toscano (ALT) e profonda conoscitrice della realt\u00e0 dialettale toscana, nel suo studio sulle aree lessicali toscane (Giacomelli 1975). 
Questa rivisitazione dello studio sulle aree lessicali toscane di Giacomelli si \u00e8 avvalsa, pi\u00f9 di tre decenni dopo, di due importanti elementi di novit\u00e0, ovvero: i) sul versante dei dati, si \u00e8 basata sull'intero corpus dei materiali dialettali dell'ALT disponibili nel sito di ALT-Web (http:\/\/serverdbt.ilc.cnr.it\/altweb); ii) sul versante degli strumenti di analisi, \u00e8 stata condotta attraverso l'uso combinato di tecnologie linguistiche e tecniche di analisi statistica multivariata che rendono possibile un'analisi aggregata di corpora di materiali dialettali anche di vaste dimensioni. Lo studio si focalizza su due dei tre aspetti indicati come fondamentali da Giacomelli per l'analisi delle aree lessicali toscane, ovvero quello dei \"rapporti interni, tra aree subregionali\" e quello dei \"rapporti con la lingua\".","keywords":["Computational Dialectology","Lexical Variation"],"pages":"609-634","url":"https:\/\/publications.cnr.it\/doc\/84772","volume":"","doi":"","editors_people":"Prantera N.; Mendicino A.; Citraro C.","editors":["Prantera, N.","Mendicino, A.","Citraro, C."],"published":"Parole. Il lessico come strumento per organizzare e trasmettere gli etnosaperi","publisher":"Centro Editoriale e Librario (Arcavacata di Rende, ITA)","issn":"","isbn":"9788874581030","conference_name":"Convegno 'Parole. 
Il lessico come strumento per organizzare e trasmettere gli etnosaperi'","conference_place":"Rende, Universit\u00e0 della Calabr","conference_date":"2-4 luglio 2009"},{"id":131317,"last_updated":"2023-11-06 19:33:52","id_people":112966,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Lessico settoriale e lessico comune nell'estrazione di terminologia specialistica da corpora di dominio","year":2010,"authors_people":"Bonin F.; Dell'Orletta F.; Montemagni S.; Venturi G.","authors_cnr":["Dell'Orletta, Felice","Venturi, Giulia","Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Bonin, F.","Dell'Orletta, F.","Montemagni, S.","Venturi, G."],"abstract":"","keywords":["Automatic Term Extraction"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/112966","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"XLIV Congresso Internazionale di Studi della Societ\u00e0 di Linguistica Italiana","conference_place":"Viterbo, Universit\u00e0 degli Stud","conference_date":""},{"id":131639,"last_updated":"2012-03-29 15:58:24","id_people":173723,"institutes":["ILC","IRISS"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Tecnologie linguistico-computazionali per il monitoraggio delle competenze linguistiche di apprendenti l'italiano come L2","year":2010,"authors_people":"Dell'Orletta F.; Montemagni S.; Vecchi E. M.; Venturi G.","authors_cnr":["Venturi, Giulia","Vecchi, Eva Maria","Venturi, Giulia","Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Montemagni, S.","Vecchi, E. 
M.","Venturi, G."],"abstract":"","keywords":["Natural Language Processing, Educational Linguistics, Language Learning"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/173723","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Congresso \"IT. L2: italiano lingua seconda nell'universit\u00e0, nella scuola e sul territorio. Esperienze didattiche e ricerche\" Universit\u00e0 del Piemonte Orientale \"Amedeo Avogadro\", Facolt\u00e0 di Lettere e Filosofia","conference_place":"Vercelli","conference_date":"2010"},{"id":131308,"last_updated":"2013-02-28 10:52:37","id_people":112955,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Ontology Learning. An introduction","year":2010,"authors_people":"Simonetta Montemagni","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Montemagni, S."],"abstract":"","keywords":["Legal Text Processing","Ontology Learning","NLP"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/112955","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Summer School LEX2010-Managing Legal Resources in the Semantic Web, Session \"Ontology in the Legal Domain\"","conference_place":"Ravenna","conference_date":"2010"},{"id":131310,"last_updated":"1970-01-01 01:00:00","id_people":112957,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Tecnologie linguistico-computazionali per il monitoraggio della lingua italiana","year":2010,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S."],"abstract":"","keywords":["Language Variation, Natural Language 
Processing"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/112957","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Giornata di Studio \"Lo stato della lingua. Il CNR e l'italiano nel terzo millennio\" organizzata dal Consiglio Nazionale delle Ricerche-Dipartimento Identit\u00e0 Culturale","conference_place":"Roma","conference_date":"2010"},{"id":131311,"last_updated":"1970-01-01 01:00:00","id_people":112958,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"The BioLexicon: a Large-Scale Domain-Specific Lexical Resource for Biomedical Text Mining","year":2010,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S."],"abstract":"","keywords":["Text Mining, Knowledge Extraction, Lexical Resources"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/112958","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"LREC 2010 2nd Workshop on Building and evaluating resources for biomedical text mining","conference_place":"Malta","conference_date":"2010"},{"id":131314,"last_updated":"1970-01-01 01:00:00","id_people":112962,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Design, Construction and Use of an Italian Dependency Treebank: Methodological Issues and Empirical Results","year":2010,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S."],"abstract":"","keywords":["Syntactic Annotation, Treebanks"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/112962","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"The Copenhagen Dependency 
Treebank Workshop on \"Designing Treebanks\"","conference_place":"Copenhagen (DK)","conference_date":"2010"},{"id":131318,"last_updated":"1970-01-01 01:00:00","id_people":112967,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Modelli di variazione dialettale e analisi dei tratti linguistici sottostanti: un nuovo approccio dialettometrico","year":2010,"authors_people":"Montemagni S.; Wieling M.; De Jonge B.; Nerbonne J.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S.","Wieling, M.","De Jonge, B.","Nerbonne, J."],"abstract":"","keywords":["Computational dialectology"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/112967","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"XI Congresso Silfi-Congresso della Societ\u00e0 Internazionale di Linguistica e Filologia Italiana","conference_place":"Napoli","conference_date":"2010"},{"id":131615,"last_updated":"1970-01-01 01:00:00","id_people":157485,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Computational Models of Dialectal Variation and Underlying Linguistic Features","year":2010,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S."],"abstract":"","keywords":["Computational Dialectology, Language Variation"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157485","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132202,"last_updated":"2023-11-06 19:33:48","id_people":367784,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ConnectToLife (modulo semantico)-Rapporto tecnico 
finale","year":2010,"authors_people":"Vito Pirrelli, Alessandro Lenci, Simonetta Montemagni, Felice Dell'Orletta, Emiliano Giovannetti, Simone Marchi","authors_cnr":["Lenci, Alessandro","Pirrelli, Vito","Montemagni, Simonetta","Marchi, Simone","Giovannetti, Emiliano","Dell'Orletta, Felice"],"authors_cnr_id":["326","5595","10442","11969","14329"],"authors_cnr_institute":[""],"authors":["Pirrelli, V.","Lenci, A.","Montemagni, S.","Dell'Orletta, F.","Giovannetti, E.","Marchi, S."],"abstract":"Il presente documento costituisce il rapporto tecnico finale del progetto Connect-To-Life (modulo semantico) relativo alle attivit\u00e0 svolte dall'unit\u00e0 ILC-CNR.","keywords":["annotazione linguistica","estrazione di termini","clustering semantico","trattamento automatico della lingua","costruzione di ontologie"],"pages":"16","url":"https:\/\/publications.cnr.it\/doc\/367784","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":123415,"last_updated":"2012-03-28 13:17:59","id_people":173012,"institutes":["ILC","ITTIG","IGSG"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"A two-level Knowledge approach to support multilingual legislative drafting","year":2009,"authors_people":"Agnoloni T.; Bacci L.; Francesconi E.; Peters W.; Montemagni S.; Venturi G.","authors_cnr":["Bacci, Lorenzo","Agnoloni, Tommaso","Venturi, Giulia","Montemagni, Simonetta","Francesconi, Enrico"],"authors_cnr_id":["5595","10498"],"authors_cnr_institute":[""],"authors":["Agnoloni, T.","Bacci, L.","Francesconi, E.","Peters, W.","Montemagni, S.","Venturi, G."],"abstract":"","keywords":["DALOS 
project","Ontological-linguistic"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/173012","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131879,"last_updated":"2023-11-06 19:33:59","id_people":184585,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Text-2-Knowledge: una piattaforma linguistico-computazionale per l'estrazione di conoscenza da testi","year":2009,"authors_people":"Dell'Orletta F., Lenci A., Marchi S., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Marchi, Simone","Dell'Orletta, Felice"],"authors_cnr_id":["326","5595","10442","14329"],"authors_cnr_institute":["048","048","048","048"],"authors":["Dell'Orletta, F.","Lenci, A.","Marchi, S.","Montemagni, S.","Pirrelli, V."],"abstract":"The paper describes the automatic extraction of domain knowledge from Italian document collections and presents a fully-implemented ontology learning system (T2K, Text-2-Knowledge) that includes a battery of tools for Natural Language Processing, statistical text analysis and machine learning. 
Evaluated results show the considerable potential of systems like T2K, exploiting an incremental interleaving of NLP and machine learning techniques for accurate large-scale semi-automatic extraction and structuring of domain-specific knowledge.","keywords":["Term extraction","Ontology Learning"],"pages":"285-300","url":"https:\/\/publications.cnr.it\/doc\/184585","volume":"","doi":"","editors_people":"Giacomo Ferrari, Ruben Benatti, Monica Mosca","editors":["Ferrari, G.","Benatti, R.","Mosca, M."],"published":"","publisher":"Bulzoni (Roma, ITA)","issn":"","isbn":"978-88-7870-469-5","conference_name":"","conference_place":"","conference_date":""},{"id":131653,"last_updated":"2012-06-05 17:41:15","id_people":186141,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Annotazione sintattica di corpora: aspetti metodologici","year":2009,"authors_people":"Alessandro Lenci; Simonetta Montemagni; Vito Pirrelli","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":["048","048"],"authors":["Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"Un assunto sempre pi\u00f9 condiviso nell'ambito degli studi sull'acquisizione sia di L1 che di L2 \u00e8 che l'evidenza empirica privilegiata debba essere rappresentata da corpora di produzioni scritte o orali degli apprendenti, estensivamente annotate a molteplici livelli di rappresentazione linguistica. Pi\u00f9 in generale, corpora lemmatizzati e annotati a livello morfosintattico fanno ormai parte dello strumentario comune del linguista. Accanto ad essi, si fa per\u00f2 strada l'esigenza di disporre di risorse testuali pi\u00f9 sofisticate dal punto di vista delle modalit\u00e0 di esplorazione linguistica, come ad esempio corpora annotati a livello sintattico (le cosiddette treebank). 
Questi consentono infatti di osservare i processi di convergenza degli apprendenti verso la lingua \"obiettivo\" anche a livello di specifici tratti grammaticali astratti o di macro-strutture linguistiche. L'articolo propone uno schema di annotazione sintattica caratterizzato da un doppio livello di codifica. Si tratta di un approccio originale che differisce dalla maggior parte degli schemi di annotazione sintattica esistenti per due aspetti: 1. la separazione della dimensione relazionale da quella a costituenti, che sono trattati a livelli di annotazione indipendenti, ma al tempo stesso correlati, in modo tale che lo stesso testo \u00e8 simultaneamente interrogabile ai due livelli; 2. la rappresentazione a costituenti fornisce una rappresentazione del testo come sequenza di proto-costituenti sintagmatici non ricorsivi. Questa strategia di annotazione permette una fattorizzazione di diversi aspetti e dimensioni della struttura sintattica che risulta promettente da un lato per l'annotazione di corpora di lingua \"non-standard\" come quelli contenenti produzioni di apprendenti di L1 o L2, sia come punto di partenza per successivi processi di estrazione di informazione linguistica dal testo. Dopo aver illustrato le motivazioni sottostanti allo schema proposto, ciascun livello di rappresentazione (chunking e dipendenze funzionali) viene illustrato in dettaglio, mostrandone anche la possibilit\u00e0 di combinazione sullo stesso testo. 
L'articolo si chiude con la discussione di prospettive di uso di corpora annotati secondo lo schema di annotazione proposto.","keywords":["Corpora annotati","annotazione sintattica"],"pages":"25-46","url":"https:\/\/publications.cnr.it\/doc\/186141","volume":"","doi":"","editors_people":"Cecilia Andorno; Stefano Rastelli","editors":["Andorno, C.","Rastelli, S."],"published":"CORPORA DI ITALIANO L2: TECNOLOGIE, METODI, SPUNTI TEORICI","publisher":"Guerra Edizioni (Perugia, ITA)","issn":"","isbn":"978-88-557-0168-6","conference_name":"","conference_place":"","conference_date":""},{"id":131377,"last_updated":"2015-02-16 10:56:35","id_people":136465,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Ontology learning from Italian legal texts","year":2009,"authors_people":"Lenci A.; Montemagni S.; Pirrelli V.; Venturi G.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":["048","048"],"authors":["Lenci, A.","Montemagni, S.","Pirrelli, V.","Venturi, G."],"abstract":"The paper reports on the methodology and preliminary results of a case study in automatically extracting ontological knowledge from Italian legislative texts. We use a fully-implemented ontology learning system (T2K) that includes a battery of tools for Natural Language Processing (NLP), statistical text analysis and machine language learning. Tools are dynamically integrated to provide an incremental representation of the content of vast repositories of unstructured documents. 
Evaluated results, however preliminary, show the great potential of NLP-powered incremental systems like T2K for accurate large-scale semi-automatic extraction of legal ontologies.","keywords":["Ontology Learning","document management","legal knowledge extraction"],"pages":"75-94","url":"https:\/\/publications.cnr.it\/doc\/136465","volume":"188","doi":"10.3233\/978-1-58603-942-4-75","editors_people":"Joost Breuker; Pompeu Casanovas; Michel C.A. Klein; Enrico Francesconi","editors":["Breuker, J.","Casanovas, P.","Klein, M. C. A.","Francesconi, E."],"published":"Law, Ontologies and the Semantic Web-Channelling the Legal Information Flood","publisher":"","issn":"","isbn":"978-1-58603-942-4","conference_name":"","conference_place":"","conference_date":""},{"id":122578,"last_updated":"2017-03-02 16:29:51","id_people":143540,"institutes":["ILC","ITTIG","IGSG"],"type":"edited_volume","type_order":3,"type_people":"book","title":"Proceedings of the 3rd Workshop on Legal Ontologies and Artificial Intelligence Techniques (LOAIT '09) joint with the 2nd Workshop on Semantic Processing of Legal Texts","year":2009,"authors_people":"Casellas N., Francesconi E., Hoekstra R., Montemagni S. (eds.)","authors_cnr":["Montemagni, Simonetta","Francesconi, Enrico"],"authors_cnr_id":["5595","10498"],"authors_cnr_institute":["048","104"],"authors":["Casellas, N.","Francesconi, E.","Hoekstra, R.","Montemagni, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/143540","volume":"2","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":123422,"last_updated":"2012-03-29 15:40:44","id_people":173712,"institutes":["ILC","ITTIG","IGSG"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Towards a FrameNet Resource for the Legal Domain","year":2009,"authors_people":"Venturi G.; Lenci A.; Montemagni S.; Vecchi E. 
M.; Sagri M. T.; Tiscornia D.; Agnoloni T.","authors_cnr":["Sagri, Maria Teresa","Agnoloni, Tommaso","Venturi, Giulia","Montemagni, Simonetta","Tiscornia, Daniela"],"authors_cnr_id":["5595","20276"],"authors_cnr_institute":[""],"authors":["Venturi, G.","Lenci, A.","Montemagni, S.","Vecchi, E. M.","Sagri, M. T.","Tiscornia, D.","Agnoloni, T."],"abstract":"","keywords":["Frame Semantics","Legal Ontologies","Knowledge Representation","Corpus Annotation"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/173712","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"3rd Workshop on Legal Ontologies and Artificial Intelligence Techniques joint with 2nd Workshop on Semantic Processing of Legal text","conference_place":"Barcelona, Spain","conference_date":"2009"},{"id":131187,"last_updated":"2023-07-09 16:06:59","id_people":84736,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Bootstrapping a Verb Lexicon for Biomedical Information Extraction","year":2009,"authors_people":"Venturi G.; Montemagni S.; Marchi S.; Sasaki Y.; Thompson P.; McNaught J.; Ananiadou S.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta","Marchi, Simone"],"authors_cnr_id":["5595","10442"],"authors_cnr_institute":[""],"authors":["Venturi, G.","Montemagni, S.","Marchi, S.","Sasaki, Y.","Thompson, P.","McNaught, J.","Ananiadou, S."],"abstract":"The extraction of information from texts requires resources that contain both syntactic and semantic properties of lexical units. As the use of language in specialized domains, such as biology, can be very different to the general domain, there is a need for domain-specific resources to ensure that the information extracted is as accurate as possible. 
We are building a large-scale lexical resource for the biology domain, providing information about predicate-argument structure that has been bootstrapped from a biomedical corpus on the subject of E. Coli. The lexicon is currently focussed on verbs, and includes both automatically-extracted syntactic subcategorization frames, as well as semantic event frames that are based on annotation by domain experts. In addition, the lexicon contains manually-added explicit links between semantic and syntactic slots in corresponding frames. To our knowledge, this lexicon currently represents a unique resource within the biomedical domain.","keywords":["domain-specific lexical resources","Biological Language Processing","syntax-semantic linking"],"pages":"137-148","url":"https:\/\/publications.cnr.it\/doc\/84736","volume":"","doi":"10.1007\/978-3-642-00382-0_11","editors_people":"","editors":[""],"published":"","publisher":"Springer-Verlag (Berlin Heidelberg, DEU)","issn":"","isbn":"9783642003813","conference_name":"10th International Conference on Intelligent Text Processing and Computational Linguistics","conference_place":"Mexico City, Mexico","conference_date":"1-7\/03\/2009"},{"id":122044,"last_updated":"2017-03-02 16:29:45","id_people":130118,"institutes":["ILC","ITTIG","IGSG"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"NLP\u2013based Metadata Extraction for Legal Text Consolidation","year":2009,"authors_people":"Spinosa P., Giardiello G., Cherubini M., Marchi S., Venturi G., Montemagni S.","authors_cnr":["Giardiello, Gerardo","Venturi, Giulia","Montemagni, Simonetta","Marchi, Simone","Cherubini, Manola","Spinosa, Pierluigi"],"authors_cnr_id":["5595","10442","11042","19619"],"authors_cnr_institute":[""],"authors":["Spinosa, P.","Giardiello, G.","Cherubini, M.","Marchi, S.","Venturi, G.","Montemagni, S."],"abstract":"","keywords":["Natural Language Processing","textual amendments","XML representation","metadata 
extraction","consolidation of legal text"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/130118","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Twelfth International Conference on Artificial Intelligence and Law (ICAIL 2009)","conference_place":"Barcelona","conference_date":"June 8-12, 2009"},{"id":131309,"last_updated":"2023-11-06 19:33:54","id_people":112956,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Bootstrapping a Verb Lexicon for Biomedical Information Extraction","year":2009,"authors_people":"Venturi, Giulia; Montemagni, Simonetta; Marchi, Simone; Sasaki, Yutaka; Thompson, Paul; McNaught, John; Ananiadou, Sophia","authors_cnr":["Montemagni, Simonetta","Marchi, Simone","Dell'Orletta, Felice"],"authors_cnr_id":["5595","10442","14329"],"authors_cnr_institute":["048","048","048"],"authors":["Venturi, G.","Montemagni, S.","Marchi, S.","Sasaki, Y.","Thompson, P.","McNaught, J.","Ananiadou, S."],"abstract":"The extraction of information from texts requires resources that contain both syntactic and semantic properties of lexical units. As the use of language in specialized domains, such as biology, can be very different to the general domain, there is a need for domain-specific resources to ensure that the information extracted is as accurate as possible. We are building a large-scale lexical resource for the biology domain, providing information about predicate-argument structure that has been bootstrapped from a biomedical corpus on the subject of E. Coli. The lexicon is currently focussed on verbs, and includes both automatically-extracted syntactic subcategorization frames, as well as semantic event frames that are based on annotation by domain experts. In addition, the lexicon contains manually-added explicit links between semantic and syntactic slots in corresponding frames. 
To our knowledge, this lexicon currently represents a unique resource within the biomedical domain.","keywords":["domain-specific lexical resources","lexical acquisition","syntax-semantics linking","Information Extraction","Biological Language Processing"],"pages":"137-148","url":"https:\/\/publications.cnr.it\/doc\/112956","volume":"5449","doi":"","editors_people":"Alexander Gelbukh","editors":["Gelbukh, A."],"published":"Proceedings of the 10th International Conference on Intelligent Text Processing and Computational Linguistics (CICLing 2009)","publisher":"Springer (Berlin, Germania)","issn":"0302-9743","isbn":"978-3-642-00381-3","conference_name":"International Conference on Intelligent Text Processing and Computational Linguistics (CICLing 2009)","conference_place":"Mexico City, Mexico","conference_date":"March 1-7, 2009"},{"id":131591,"last_updated":"2010-11-20 00:00:00","id_people":157461,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"3rd Workshop on Legal Ontologies and Artificial Intelligence Techniques joint with 2nd Workshop on Semantic Processing of Legal text","year":2009,"authors_people":"Casellas N.; Francesconi E.; Hoekstra R.; Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Casellas, N.","Francesconi, E.","Hoekstra, R.","Montemagni, S."],"abstract":"","keywords":["Legal Ontologies","Computational Semantics"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157461","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":130998,"last_updated":"2023-11-06 19:34:03","id_people":64541,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Dal testo alla conoscenza e ritorno: estrazione terminologica e annotazione semantica di basi documentali di 
dominio","year":2008,"authors_people":"Dell'Orletta F.; Lenci A.; Marchi S.; Montemagni S.; Pirrelli V.; Venturi G.","authors_cnr":["Dell'Orletta, Felice","Pirrelli, Vito","Montemagni, Simonetta","Marchi, Simone"],"authors_cnr_id":["326","5595","10442"],"authors_cnr_institute":["048","048","048","048"],"authors":["Dell'Orletta, F.","Lenci, A.","Marchi, S.","Montemagni, S.","Pirrelli, V.","Venturi, G."],"abstract":"The paper focuses on the automatic extraction of domain knowledge from Italian legal texts and presents a fully-implemented ontology learning system (T2K, Text-2-Knowledge) that includes a battery of tools for Natural Language Processing, statistical text analysis and machine learning. Evaluated results show the considerable potential of systems like T2K, exploiting an incremental interleaving of NLP and machine learning techniques for accurate large-scale semi-automatic extraction and structuring of domain-specific knowledge.","keywords":["Natural Language Processing","Machine Learning","Knowledge extraction from texts","Ontology learning","Legal ontologies"],"pages":"197-218","url":"https:\/\/publications.cnr.it\/doc\/64541","volume":"26","doi":"","editors_people":"","editors":[""],"published":"Aida Informazioni (Online)","publisher":"Aida (Roma, Italia)","issn":"1594-2201","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131000,"last_updated":"2012-06-04 11:27:15","id_people":64543,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"The space of Tuscan dialectal variation. A correlation study","year":2008,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048"],"authors":["Montemagni, S."],"abstract":"The paper illustrates the results of a correlation study focusing on linguistic variation in an Italian region, Tuscany. 
By exploiting a multi-level representation scheme of dialectal data, the study analyses attested patterns of phonetic and morpho-lexical variation with the aim of testing the degree of correlation between a) phonetic and morpho-lexical variation, and b) linguistic variation and geographic distance. The correlation analysis was performed by combining two complementary approaches proposed in dialectometric literature, namely by computing both global and place-specific correlation measures and by inspecting their spatial distribution. Achieved results demonstrate that phonetic and morpho-lexical variations in Tuscany seem to follow a different pattern than encountered in previous studies.","keywords":["Computational dialectology","Dialectometry"],"pages":"135-152","url":"http:\/\/www.euppublishing.com\/doi\/abs\/10.3366\/E1753854809000354","volume":"2","doi":"10.3366\/E1753854809000354","editors_people":"","editors":[""],"published":"International journal of humanities and arts computing (Print)","publisher":"Edinburgh University Press for the Association for History and Computing (Edinburgh, Regno Unito)","issn":"1753-8548","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131373,"last_updated":"2009-08-18 00:00:00","id_people":136460,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Analisi linguistico-computazionali del corpus dialettale dell'Atlante Lessicale Toscano. 
Primi risultati sul rapporto toscano-italiano","year":2008,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S."],"abstract":"","keywords":["Corpus dialettale"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/136460","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"Pacini (Pisa, ITA)","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131160,"last_updated":"2023-11-06 19:34:04","id_people":84707,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Dal testo alla conoscenza e ritorno: estrazione terminologica e annotazione semantica di basi documentali di dominio","year":2008,"authors_people":"Dell'Orletta Felice; Lenci Alessandro; Marchi Simone; Montemagni Simonetta; Pirrelli Vito; Venturi Giulia","authors_cnr":["Dell'Orletta, Felice","Venturi, Giulia","Pirrelli, Vito","Montemagni, Simonetta","Marchi, Simone"],"authors_cnr_id":["326","5595","10442"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Lenci, A.","Marchi, S.","Montemagni, S.","Pirrelli, V.","Venturi, G."],"abstract":"The paper focuses on the automatic extraction of domain knowledge from Italian legal texts and presents a fully-implemented ontology learning system (T2K, Text-2-Knowledge) that includes a battery of tools for Natural Language Processing, statistical text analysis and machine learning. 
Evaluated results show the considerable potential of systems like T2K, exploiting an incremental interleaving of NLP and machine learning techniques for accurate large-scale semi-automatic extraction and structuring of domain-specific knowledge.","keywords":["Natural Language Processing","Machine Learning","Knowledge extraction from texts","Ontology learning","Legal ontologies"],"pages":"197-218","url":"http:\/\/www.assiterm91.it\/wp-content\/uploads\/2010\/11\/Convegno-2008.pdf","volume":"Anno 26, numero 1-2","doi":"","editors_people":"","editors":[""],"published":"Terminologia analisi testuale e documentazione nella citt\u00e0 digitale","publisher":"Aida (Roma, Italia)","issn":"1594-2201","isbn":"","conference_name":"Atti del Convegno Nazionale Ass. I. Term","conference_place":"Arcavacata di Rende (CS)","conference_date":"5-7\/06\/2008"},{"id":131151,"last_updated":"2023-11-06 19:34:01","id_people":84698,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Acquiring Legal Ontologies from Domain-specific Texts","year":2008,"authors_people":"Dell'Orletta F.; Lenci A.; Montemagni S.; Marchi S.; Pirrelli V.; Venturi G.","authors_cnr":["Dell'Orletta, Felice","Venturi, Giulia","Pirrelli, Vito","Montemagni, Simonetta","Marchi, Simone"],"authors_cnr_id":["326","5595","10442"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Lenci, A.","Montemagni, S.","Marchi, S.","Pirrelli, V.","Venturi, G."],"abstract":"The paper reports on methodology and preliminary results of a case study in automatically extracting ontological knowledge from Italian legislative texts in the environmental domain. We use a fully-implemented ontology learning system (T2K) that includes a battery of tools for Natural Language Processing (NLP), statistical text analysis and machine language learning. Tools are dynamically integrated to provide an incremental representation of the content of vast repositories of unstructured documents. 
Evaluated results, however preliminary, are very encouraging, showing the great potential of NLP-powered incremental systems like T2K for accurate large-scale semi-automatic extraction of legal ontologies.","keywords":["Ontology learning","Document management","knowledge extraction from texts","Natural Language Processing"],"pages":"98-101","url":"https:\/\/publications.cnr.it\/doc\/84698","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"LangTech 2008","conference_place":"Roma","conference_date":"28-29\/02\/2008"},{"id":131159,"last_updated":"2015-02-25 15:49:07","id_people":84706,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Combining statistical techniques and lexico-syntactic patterns for semantic relations extraction from text","year":2008,"authors_people":"Giovannetti E.; Marchi S.; Montemagni S.","authors_cnr":["Giovannetti, Emiliano","Montemagni, Simonetta","Marchi, Simone"],"authors_cnr_id":["5595","10442"],"authors_cnr_institute":[""],"authors":["Giovannetti, E.","Marchi, S.","Montemagni, S."],"abstract":"We describe here a methodology to combine two different techniques for Semantic Relation Extraction from texts. On the one hand, generic lexicosyntactic patterns are applied to the linguistically analyzed corpus to detect a first set of pairs of co-occurring words, possibly involved in \"syntagmatic\" relations. On the other hand, a statistical unsupervised association system is used to obtain a second set of pairs of \"distributionally similar\" terms, that appear to occur in similar contexts, thus possibly involved in \"paradigmatic\" relations. The approach aims at learning ontological information by filtering the candidate relations obtained through generic lexico-syntactic patterns and by labelling the anonymous relations obtained through the statistical system. 
The resulting set of relations can be used to enrich existing ontologies and for semantic annotation of documents or web pages.","keywords":["Ontology Learning from Text","Semantic Relation Extraction","Lexico-syntactic Patterns","Distributional Similarity"],"pages":"","url":"http:\/\/sunsite.informatik.rwth-aachen.de\/Publications\/CEUR-WS\/Vol-426\/swap2008_submission_54.pdf","volume":"","doi":"","editors_people":"Aldo Gangemi, Johannes Keizer, Valentina Presutti, Heiko Stoermer","editors":["Gangemi, A.","Keizer, J.","Presutti, V.","Stoermer, H."],"published":"","publisher":"","issn":"","isbn":"","conference_name":"SWAP 2008-Semantic Web Applications and Perspectives","conference_place":"Roma","conference_date":"15-17 December 2008"},{"id":131177,"last_updated":"2012-06-07 20:38:43","id_people":84726,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Ontology Learning and Semantic Annotation: a Necessary Symbiosis","year":2008,"authors_people":"Giovannetti E.; Marchi S.; Montemagni S.; Bartolini R.","authors_cnr":["Giovannetti, Emiliano","Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["5595","10441","10442"],"authors_cnr_institute":["048","048","048","048"],"authors":["Giovannetti, E.","Marchi, S.","Montemagni, S.","Bartolini, R."],"abstract":"Semantic annotation of text requires the dynamic merging of linguistically structured information and a \"world model\", usually represented as a domain-specific ontology. On the other hand, the process of engineering a domain-ontology through semi-automatic ontology learning system requires the availability of a considerable amount of semantically annotated documents. 
Facing this bootstrapping paradox requires an incremental process of annotation-acquisition-annotation, whereby domain-specific knowledge is acquired from linguistically-annotated texts and then projected back onto texts for extra linguistic information to be annotated and further knowledge layers to be extracted. The presented methodology is a first step in the direction of a full \"virtuous\" circle where the semantic annotation platform and the evolving ontology interact in symbiosis. As a case study we have chosen the semantic annotation of product catalogues. We propose a hybrid approach, combining pattern matching techniques to exploit the regular structure of product descriptions in catalogues, and Natural Language Processing techniques which are resorted to analyze natural language descriptions. The semantic annotation involves the access to the ontology, semi-automatically bootstrapped with an ontology learning tool from annotated collections of catalogues.","keywords":["Information Extraction","Information Retrieval","Ontologies","Tools","Systems"],"pages":"2079-2085","url":"http:\/\/www.lrec-conf.org\/proceedings\/lrec2008\/","volume":"","doi":"","editors_people":"Nicoletta Calzolari (Conference Chair); Khalid Choukri; Bente Maegaard; Joseph Mariani; Jan Odjik; Stelios Piperidis; Daniel Tapias","editors":["Calzolari, N.","Choukri, K.","Maegaard, B.","Mariani, J.","Odjik, J.","Piperidis, S.","Tapias, D."],"published":"LREC 2008, Sixth International Conference on Language Resources and Evaluation","publisher":"European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)","issn":"","isbn":"2-9517408-4-0","conference_name":"LREC 2008, Sixth International Conference on Language Resources and Evaluation","conference_place":"Marrakech, Marocco","conference_date":"2008"},{"id":131181,"last_updated":"2009-08-18 
00:00:00","id_people":84730,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Unsupervised Acquisition of Verb Subcategorization Frames from Shallow-Parsed Corpora","year":2008,"authors_people":"Lenci A.; McGillivray B.; Pirrelli V.; Montemagni S.","authors_cnr":["Mcgillivray, Barbara","Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Lenci, A.","McGillivray, B.","Pirrelli, V.","Montemagni, S."],"abstract":"","keywords":["Acquisition","Machine Learning","Corpus (creation, annotation, etc.)","Lexicon","Lexical database"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84730","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"LREC 2008, Sixth International Conference on Language Resources and Evaluation","conference_place":"Marrakech, Marocco","conference_date":"2008"},{"id":131156,"last_updated":"2009-08-18 00:00:00","id_people":84703,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"BioLexicon: A Lexical Resource for the Biology Domain","year":2008,"authors_people":"Sasaki Y.; Montemagni S.; Pezik P.; Rebholz-Schuhmann D.; McNaught J.; Ananiadou S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Sasaki, Y.","Montemagni, S.","Pezik, P.","Rebholz Schuhmann, D.","McNaught, J.","Ananiadou, S."],"abstract":"","keywords":["BioLexicon","Terminological verbs"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84703","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Third International Symposium on Semantic Mining in Biomedicine","conference_place":"Turku, Finland","conference_date":"2008"},{"id":131157,"last_updated":"2014-10-28 
11:05:02","id_people":84704,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Building a Bio-Event Annotated Corpus for the Acquisition of Semantic Frames from Biomedical Corpora","year":2008,"authors_people":"Thompson P.; Cotter P.; Ananiadou S.; McNaught J.; Montemagni S.; Trabucco A.; Venturi G.","authors_cnr":["Venturi, Giulia","Trabucco, Andrea","Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048","","048"],"authors":["Thompson, P.","Cotter, P.","Ananiadou, S.","McNaught, J.","Montemagni, S.","Trabucco, A.","Venturi, G."],"abstract":"","keywords":["Corpus (creation","annotation","etc.)","Text mining","Semantics","Event Extraction"],"pages":"2159-2166","url":"https:\/\/publications.cnr.it\/doc\/84704","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"2-9517408-4-0","conference_name":"LREC 2008, Sixth International Conference on Language Resources and Evaluation","conference_place":"Marrakech, Morocco","conference_date":"28-30 maggio 2008"},{"id":131158,"last_updated":"2014-10-28 16:39:30","id_people":84705,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Categorising Modality in Biomedical Texts","year":2008,"authors_people":"Thompson P.; Venturi G.; McNaught J.; Montemagni S.; Ananiadou S.","authors_cnr":["Venturi, Giulia","Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":["048","048"],"authors":["Thompson, P.","Venturi, G.","McNaught, J.","Montemagni, S.","Ananiadou, S."],"abstract":"The accurate recognition of modal information is vital for the correct interpretation of statements. In this paper, we report on the collection of a list of words and phrases that express modal information in biomedical texts, and propose a categorisation scheme according to the type of information conveyed. 
We have performed a small pilot study through the annotation of 202 MEDLINE abstracts according to our proposed scheme. Our initial results suggest that modality in biomedical statements can be predicted fairly reliably though the presence of particular lexical items, together with a small amount of contextual information.","keywords":["Biomedical texts","Modality"],"pages":"27-34","url":"https:\/\/publications.cnr.it\/doc\/84705","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"2-9517408-4-0","conference_name":"LREC 2008, Sixth International Conference on Language Resources and Evaluation: Workshop 'Building and Evaluating Resources for Biomedical Text Mining'","conference_place":"Marrakech, Marocco","conference_date":"26 maggio 2008"},{"id":131294,"last_updated":"2009-08-18 00:00:00","id_people":112936,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Exploring the correlation between phonetic and lexical variation in Tuscany","year":2008,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S."],"abstract":"","keywords":["Dialectal variation","ALT-Web"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/112936","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Thirteenth International Conference on Methods in Dialectology","conference_place":"Leeds","conference_date":"2008"},{"id":131293,"last_updated":"2013-06-06 16:58:30","id_people":112935,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"BioLexicon: Towards a reference terminological resource in the biomedical domain","year":2008,"authors_people":"Rebholz-Schuhmann D.; Pezik P.; Lee V.; Del Gratta R.; Kim J.; Sasaki Y.; McNaught J.; Montemagni S.; Monachini M.; Calzolari N.; 
Ananiadou S.","authors_cnr":["Del Gratta, Riccardo","Montemagni, Simonetta","Monachini, Monica","Zamorani, Nicoletta"],"authors_cnr_id":["5595","8945","26123"],"authors_cnr_institute":["048"],"authors":["Rebholz Schuhmann, D.","Pezik, P.","Lee, V.","Del Gratta, R.","Kim, J.","Sasaki, Y.","McNaught, J.","Montemagni, S.","Monachini, M.","Calzolari, N.","Ananiadou, S."],"abstract":"The BioLexicon is a publicly available large-scale terminological resource which brings together potential terms from several resources representing selected semantic types (genes, proteins, chemicals, species, enzymes, selected ontological terms). The schema of the BioLexicon enables improved resolution of term ambiguity and follows lexical standards for terminological resources.","keywords":["BioLexicon"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/112935","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"978-1-61567-371-1","conference_name":"16th Annual International Conference on Intelligent Systems for Molecular Biology","conference_place":"Toronto, Canada","conference_date":"19-23 Luglio 2008"},{"id":131578,"last_updated":"2009-08-18 00:00:00","id_people":157448,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Augmented version of the bio-lexicon extended with bio event information and term-to-term weighted links","year":2008,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S."],"abstract":"","keywords":["Bio-lexicon"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157448","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131443,"last_updated":"2009-09-25 
00:00:00","id_people":151569,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"AnITA","year":2008,"authors_people":"Pirrelli V., Montemagni S.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Pirrelli, V.","Montemagni, S."],"abstract":"","keywords":["NLP Tools"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151569","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":130994,"last_updated":"2023-11-06 19:34:11","id_people":64537,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Maximum Entropy for Italian PoS Tagging","year":2007,"authors_people":"Dell'Orletta F., Federico M., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Dell'Orletta, Felice","Federico, Maria","Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Federico, M.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"L'articolo illustra le prestazioni del ILC-UniPi MaxEnt PoS Tagger in Evalita 2007. 
The report contains a description of the ILC-UniPi MaxEnt PoS Tagger performance in Evalita 2007.","keywords":[""],"pages":"10-11","url":"https:\/\/publications.cnr.it\/doc\/64537","volume":"IV(2)","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131372,"last_updated":"2023-11-06 19:34:08","id_people":136459,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Corpus-based Modelling of Grammar Variation","year":2007,"authors_people":"Dell'Orletta F., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Dell'Orletta, Felice","Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":["Grammar variation","stochastic parsing","linguistic typology"],"pages":"38-55","url":"https:\/\/publications.cnr.it\/doc\/136459","volume":"","doi":"","editors_people":"Andrea Sans\u00f2","editors":["Sans\u00f2, A."],"published":"Language resources and linguistic theory","publisher":"Angeli (Milano, ITA)","issn":"","isbn":"9788846489449","conference_name":"","conference_place":"","conference_date":""},{"id":123403,"last_updated":"2012-04-19 15:48:46","id_people":171352,"institutes":["ILC","ITTIG","IGSG"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Building an ontological support for multilingual legislative drafting","year":2007,"authors_people":"Agnoloni T., Bacci L., Francesconi E., Spinosa P., Tiscornia D., Montemagni S., Venturi G.","authors_cnr":["Bacci, Lorenzo","Agnoloni, Tommaso","Venturi, Giulia","Montemagni, Simonetta","Francesconi, Enrico","Spinosa, Pierluigi","Tiscornia, Daniela"],"authors_cnr_id":["5595","10498","19619","20276"],"authors_cnr_institute":["104"],"authors":["Agnoloni, T.","Bacci, L.","Francesconi, E.","Spinosa, 
P.","Tiscornia, D.","Montemagni, S.","Venturi, G."],"abstract":"","keywords":[""],"pages":"9-18","url":"https:\/\/publications.cnr.it\/doc\/171352","volume":"","doi":"","editors_people":"Lodder Ar; Mommers L.","editors":["Ar, L.","Mommers, L."],"published":"Legal Knowledge and information Systems","publisher":"","issn":"","isbn":"","conference_name":"International Conference on Legal Knowledge and Information Systems (JURIX 2007)","conference_place":"Leiden","conference_date":"2007"},{"id":131150,"last_updated":"2023-11-06 19:34:12","id_people":84696,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Maximum Entropy for Italian PoS Tagging","year":2007,"authors_people":"Dell'Orletta F., Federico M., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Dell'Orletta, Felice","Federico, Maria","Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Federico, M.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84696","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Evaluation of NLP Tools for Italian-EVALITA 2007","conference_place":"Roma","conference_date":""},{"id":131142,"last_updated":"2023-11-06 19:34:21","id_people":84687,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Text-2-Knowledge: una piattaforma linguistico-computazionale per l'estrazione di conoscenza da testi","year":2007,"authors_people":"Dell'Orletta F., Lenci A., Marchi S., Montemagni S., Pirrelli V.","authors_cnr":["Dell'Orletta, Felice","Pirrelli, Vito","Montemagni, Simonetta","Marchi, Simone"],"authors_cnr_id":["326","5595","10442"],"authors_cnr_institute":["048","048","048","048"],"authors":["Dell'Orletta, F.","Lenci, A.","Marchi, S.","Montemagni, 
S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84687","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"XL Congresso Internazionale di Studi della Societ\u00e0 di Linguistica Italiana (SLI 2006)","conference_place":"Roma","conference_date":""},{"id":131145,"last_updated":"2014-07-28 11:46:33","id_people":84690,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Ontology-based Semantic Annotation of Product Catalogues","year":2007,"authors_people":"Giovannetti E, Marchi S, Montemagni S., Bartolini R.","authors_cnr":["Giovannetti, Emiliano","Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["5595","10441","10442"],"authors_cnr_institute":["048","048","048","048"],"authors":["Giovannetti, E.","Marchi, S.","Montemagni, S.","Bartolini, R."],"abstract":"This paper describes a methodology for the semantic annotation of product catalogues. We propose a hybrid approach, combining pattern matching techniques to exploit the regular structure of product descriptions in catalogues, and Natural Language Processing techniques which are resorted to analyze natural language descriptions. 
It also includes the access to an application ontology, semi-automatically bootstrapped from collections of catalogues with an ontology learning tool, which is used to drive the semantic annotation process.","keywords":["Semantic Annotation of texts","Ontology Learning","Information Extraction for e-commerce"],"pages":"235-239","url":"https:\/\/publications.cnr.it\/doc\/84690","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of the International Conference \"Recent Advances in Natural Language Processing\"","publisher":"","issn":"","isbn":"","conference_name":"Recent Advances in Natural Language Processing (RANLP-2007)","conference_place":"Borovets","conference_date":"27-29 settembre 2007"},{"id":131147,"last_updated":"2014-10-28 17:09:37","id_people":84693,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"NLP-based ontology learning from legal texts. A case study","year":2007,"authors_people":"Lenci A., Montemagni S., Pirrelli V., Venturi G.","authors_cnr":["Venturi, Giulia","Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":["048","048","048"],"authors":["Lenci, A.","Montemagni, S.","Pirrelli, V.","Venturi, G."],"abstract":"The paper reports on the methodology and preliminary results of a case study in automatically extracting ontological knowledge from Italian legislative texts in the environmental domain. We use a fully-implemented ontology learning system (T2K) that includes a battery of tools for Natural Language Processing (NLP), statistical text analysis and machine language learning. Tools are dynamically integrated to provide an incremental representation of the content of vast repositories of unstructured documents. 
Evaluated results, however preliminary, are very encouraging, showing the great potential of NLP-powered incremental systems like T2K for accurate large-scale semi-automatic extraction of legal ontologies.","keywords":[""],"pages":"113-129","url":"https:\/\/publications.cnr.it\/doc\/84693","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"II Workshop on Legal Ontologies and Artificial Intelligence Techniques (LOAIT'07)","conference_place":"Stanford","conference_date":"4 giugno 2007"},{"id":131146,"last_updated":"2009-06-16 00:00:00","id_people":84692,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Patterns of phonetic variation in Tuscany: using dialectometric techniques on multi-level representations of dialectal data","year":2007,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84692","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"International Workshop on Computational Phonology","conference_place":"Borovets","conference_date":"2007"},{"id":131148,"last_updated":"2009-06-16 00:00:00","id_people":84694,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Aree fonetiche e lessicali toscane a confronto: prime elaborazioni computazionali dei dati dell'Atlante Lessicale Toscano","year":2007,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, 
S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84694","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"XL Congresso Internazionale di Studi della Societ\u00e0 di Linguistica Italiana","conference_place":"Vercelli","conference_date":"2007"},{"id":131149,"last_updated":"2009-06-16 00:00:00","id_people":84695,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Acquisizione automatica di termini da testi: primi esperimenti di estrazione e strutturazione di terminologia metalinguistica","year":2007,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84695","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"DLM su Lessicologia e metalinguaggio","conference_place":"Macerata","conference_date":"2007"},{"id":131137,"last_updated":"2009-06-16 00:00:00","id_people":84682,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Automatic Extraction of Semantics in Law Documents","year":2007,"authors_people":"Soria C., Bartolini R., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Soria, Claudia","Bartolini, Roberto"],"authors_cnr_id":["326","5595","9887","10441"],"authors_cnr_institute":[""],"authors":["Soria, C.","Bartolini, R.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84682","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"V Legislative XML 
Workshop","conference_place":"Firenze","conference_date":"2007"},{"id":131548,"last_updated":"2009-06-16 00:00:00","id_people":157418,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Semantic Annotation Services for Virtual Information and Knowledge Environments","year":2007,"authors_people":"Ait-Mokhtar S., Barker E., Brunelli R., Demetriou G., Gaizauskas R., Giovannetti E., Montemagni S., S\u00e1ndor A., Sun H.","authors_cnr":["Giovannetti, Emiliano","Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Ait Mokhtar, S.","Barker, E.","Brunelli, R.","Demetriou, G.","Gaizauskas, R.","Giovannetti, E.","Montemagni, S.","S\u00e1ndor, A.","Sun, H."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157418","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131549,"last_updated":"2009-06-16 00:00:00","id_people":157419,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Semantic Representation and Management Report","year":2007,"authors_people":"Bouquet P., Stoermer H., Montemagni S., Giovannetti E., Semeraro G., Niederee C., Stecher R., Brunelli R., Chanod J. P., Jacquin T.","authors_cnr":["Giovannetti, Emiliano","Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Bouquet, P.","Stoermer, H.","Montemagni, S.","Giovannetti, E.","Semeraro, G.","Niederee, C.","Stecher, R.","Brunelli, R.","Chanod, J. 
P.","Jacquin, T."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157419","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131570,"last_updated":"2016-07-20 15:08:53","id_people":157440,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Report on Ontology learning tool and testing","year":2007,"authors_people":"Montemagni S., Marchi S., Venturi G., Bartolini R., Bertagna F., Ruffolo P., Peters W., Tiscornia D.","authors_cnr":["Bertagna, Francesca","Ruffolo, Paolo","Venturi, Giulia","Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["5595","10441","10442"],"authors_cnr_institute":[""],"authors":["Montemagni, S.","Marchi, S.","Venturi, G.","Bartolini, R.","Bertagna, F.","Ruffolo, P.","Peters, W.","Tiscornia, D."],"abstract":"This deliverable documents the work done within the DALOS EU project for what concerns the definition and implementation of methodologies and techniques to bootstrap terminological and ontological knowledge from domain corpora. 
Starting from a corpus of legacy legislative texts in different languages, linguistic technologies combined with statistical techniques have been used to extract significant terms as well as to structure them in conceptual structures for the different languages dealt with within the project, namely Italian, English, Spanish and Dutch.","keywords":["Ontology Learning","Term Extraction","Natural Language Processing","Conceptual Indexing"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157440","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131550,"last_updated":"2009-06-16 00:00:00","id_people":157420,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"The Italian dependency annotated corpus developed for the CoNLL-2007 Shared Task","year":2007,"authors_people":"Montemagni S., Simi M.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S.","Simi, M."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157420","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131551,"last_updated":"2009-06-16 00:00:00","id_people":157421,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Bio-Event Linguistic Annotation Tool. 
User Manual","year":2007,"authors_people":"Montemagni S., Trabucco A., Venturi G.","authors_cnr":["Venturi, Giulia","Trabucco, Andrea","Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S.","Trabucco, A.","Venturi, G."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157421","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131552,"last_updated":"2009-06-16 00:00:00","id_people":157422,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Event annotation of domain corpora","year":2007,"authors_people":"Montemagni S., Trabucco A., Venturi G., Thompson P., Cotter P., Ananiadou S., McNaught J., Kim J., Rebholz D., Pezik P.","authors_cnr":["Venturi, Giulia","Trabucco, Andrea","Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S.","Trabucco, A.","Venturi, G.","Thompson, P.","Cotter, P.","Ananiadou, S.","McNaught, J.","Kim, J.","Rebholz, D.","Pezik, P."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157422","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131553,"last_updated":"2009-06-16 00:00:00","id_people":157423,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Augmented Version of Bio-Lexicon","year":2007,"authors_people":"Sasaki Y., McNaught J., Ananiadou S., Pezik P., McGillivray B., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Sasaki, Y.","McNaught, J.","Ananiadou, S.","Pezik, P.","McGillivray, B.","Montemagni, S.","Pirrelli, 
V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157423","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131566,"last_updated":"2017-06-21 16:04:27","id_people":157436,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"ALT-Web. Sito dell'Atlante Lessicale Toscano (ALT) in rete","year":2007,"authors_people":"Picchi E., Montemagni S., Cucurullo S., Sassolini E., Paoli M.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Montemagni, Simonetta","Cucurullo, Sebastiana","Picchi, Eugenio"],"authors_cnr_id":["5595","11479","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Montemagni, S.","Cucurullo, S.","Sassolini, E.","Paoli, M."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157436","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131124,"last_updated":"2023-07-10 09:15:54","id_people":84664,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Multimedia Information Extraction in Ontology-based Semantic Annotation of Product Catalogues","year":2006,"authors_people":"Bartolini R., Giovannetti E., Marchi S., Montemagni S., Andreatta C., Brunelli R., Stecher R. 
and Bouquet P.","authors_cnr":["Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone","Giovannetti, Emiliano"],"authors_cnr_id":["5595","10441","10442","11969"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Giovannetti, E.","Marchi, S.","Montemagni, S.","Andreatta, C.","Brunelli, R.","Stecher, R.","Bouquet, P."],"abstract":"The demand for efficient methods for extracting knowledge from multimedia content has led to a growing research community investigating the convergence of multimedia and knowledge technologies. In this paper we describe a methodology for extracting multimedia information from product catalogues empowered by the synergetic use and extension of a domain ontology. The methodology was implemented in the Trade Fair Advanced Semantic Annotation Pipeline of the VIKE-framework.","keywords":["Semantic Web Technologies","ontology creation","ontology extraction","ontology evolution","semantic annotation of multimedia content"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84664","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"SWAP 2006","conference_place":"Pisa","conference_date":"18-20 December 2006"},{"id":131091,"last_updated":"2012-05-31 18:50:31","id_people":84629,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Dialectal resources on-line: the ALT-Web experience","year":2006,"authors_people":"Cucurullo S., Montemagni S., Paoli M., Picchi E., Sassolini E.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":["048","048","048","048"],"authors":["Cucurullo, S.","Montemagni, S.","Paoli, M.","Picchi, E.","Sassolini, E."],"abstract":"The paper presents an on-line dialectal resource, ALT-Web, which gives access to the linguistic data of the Atlante Lessicale Toscano, a specially designed 
linguistic atlas in which lexical data have both a diatopic and diastratic characterisation. The paper focuses on: the dialectal data representation model; the access modalities to the ALT dialectal corpus; ontology-based search.","keywords":["Computational dialectology","Dialectal databases","Construction of lexical resources"],"pages":"1846-1851","url":"http:\/\/www.lrec-conf.org\/lrec2006\/","volume":"Proceedings","doi":"","editors_people":"","editors":[""],"published":"Dialectal resources on-line: the ALT-Web experience","publisher":"","issn":"","isbn":"2-9517408-2-4","conference_name":"LREC 2006: 5th International Conference on Language Resources and Evaluation","conference_place":"Genoa","conference_date":"24-25-26 Maggio 2006"},{"id":131121,"last_updated":"2012-05-07 15:39:56","id_people":84661,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Atlante Dialettale in rete: ALT-Web","year":2006,"authors_people":"Cucurullo S., Montemagni S., Paoli M., Picchi E., Sassolini E.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":["048","048","048","048"],"authors":["Cucurullo, S.","Montemagni, S.","Paoli, M.","Picchi, E.","Sassolini, E."],"abstract":"The paper presents an on-line dialectal resource, ALT-Web, which gives access to the linguistic data of the Lexical Atlas of Tuscany or Atlante Lessicale Toscano, a specially designed linguistic atlas in which lexical data have both a diatopic and diastratic characterisation. The paper illustrates ALT-Web with particular emphasis on: 1) the dialectal data representation model; 2) the access modalities to the ALT dialectal corpus designed to produce an output tailored to the specific needs of the different classes of users (both professionals and common citizens); 3) ontology-based search. 
These represent three main features which differentiate ALT-Web both from the previous digitalised ALT version and, most interestingly, from other on-line dialectal resources. At the time of writing, this is the first resource of this type in Italy, and one of the few at the international level.","keywords":["dialectal resources","information retrieval"],"pages":"661-672","url":"http:\/\/www.euralex.org\/publications\/","volume":"2","doi":"","editors_people":"E. Corino, C. Marello, C. Onesti","editors":["Corino, E.","Marello, C.","Onesti, C."],"published":"Proceedings in 12\u00b0 EURALEX International Congress, Congresso internazionale di lessicografia","publisher":"Edizioni dell'ORSO (Alessandria, ITA)","issn":"","isbn":"8876949186","conference_name":"12\u00b0 EURALEX International Congress","conference_place":"Torino","conference_date":"6-9 Settembre 2006"},{"id":131092,"last_updated":"2023-11-06 19:34:24","id_people":84630,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Searching treebanks for functional constraints: cross-lingual experiments in grammatical relation assignment","year":2006,"authors_people":"Dell'Orletta F., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Dell'Orletta, Felice","Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84630","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"LREC 2006: 5th International Conference on Language Resources and Evaluation","conference_place":"Genoa","conference_date":""},{"id":131120,"last_updated":"2023-11-06 19:34:23","id_people":84660,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Probing the space of 
grammatical variation: induction of cross-lingual grammatical constraints from treebanks","year":2006,"authors_people":"Dell'Orletta F.; Lenci A.; Montemagni S.; Pirrelli V.","authors_cnr":["Dell'Orletta, Felice","Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":["048","048","048"],"authors":["Dell'Orletta, F.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"The paper reports on a detailed quantitative analysis of distributional language data of both Italian and Czech, highlighting the relative contribution of a number of distributed grammatical factors to sentence-based identification of subjects and direct objects. The work uses a Maximum Entropy model of stochastic resolution of conflicting grammatical constraints and is demonstrably capable of putting explanatory theoretical accounts to the test of usage-based empirical verification.","keywords":[""],"pages":"21-28","url":"https:\/\/publications.cnr.it\/doc\/84660","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of the Workshop on Frontiers in Linguistically Annotated Corpora 2006 (LAC 06)","publisher":"Association for Computational Linguistics (Stroudsburg, USA)","issn":"","isbn":"1-932432-78-7","conference_name":"Coling\/ACL 2006","conference_place":"Sydney (Australia)","conference_date":"22 July 2006"},{"id":131119,"last_updated":"2012-06-05 17:20:11","id_people":84659,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"ALT-WEB: l'Atlante Lessicale Toscano in rete","year":2006,"authors_people":"Montemagni S.; Paoli M.; Picchi E.","authors_cnr":["Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":["048","048"],"authors":["Montemagni, S.","Paoli, M.","Picchi, E."],"abstract":"Scopo dell'articolo \u00e8 la presentazione di ALT-Web, ovvero l'Atlante Lessicale Toscano in rete. 
ALT-Web \u00e8 stato ideato per rendere il patrimonio linguistico-culturale testimoniato dall'Atlante Lessicale Toscano una risorsa educativa realmente disponibile in modo che possa fornire un contributo alla conservazione della memoria dell'identit\u00e0 culturale toscana e al contempo costituisca un prezioso punto di riferimento per lo studio di dinamiche linguistiche sia a livello areale sia a livello socio-culturale. La sua collocazione in rete porta inevitabilmente ALT-Web a rivolgersi a una vasta gamma di utenti non pi\u00f9 circoscritta agli addetti ai lavori (ovvero dialettologi, linguisti, etno-linguisti), ma che include anche insegnanti, operatori culturali (ad esempio, personale di musei e di istituzioni culturali pubbliche e private) fino al cittadino navigatore di Internet che voglia capire di pi\u00f9 della propria identit\u00e0 linguistica e culturale. Il vasto e variegato bacino di utenza a cui intende rivolgersi ALT-Web ha portato alla trasformazione della versione informatizzata dell'Atlante Lessicale Toscano (conosciuta come DBT-ALT) in una rete ipertestuale con modalit\u00e0 e funzionalit\u00e0 di accesso differenziate in relazione alle diverse classi di utenza; a questo aspetto, \u00e8 legata l'altra interpretazione dell'acronimo ALT-Web, ovvero quella di \"ALT come rete\". L'articolo illustra aspetti del processo di progettazione e realizzazione dell'opera che rivestono un qualche interesse per il linguista e il dialettologo. 
In particolare, dopo un breve excursus che riepiloga le caratteristiche principali della risorsa di partenza, l'articolo illustra la progettazione e realizzazione di ALT-Web, partendo dall'analisi dei requisiti e la definizione delle caratteristiche generali per arrivare ad aspetti pi\u00f9 specifici che riguardano le modalit\u00e0 di accesso ai materiali e la normalizzazione dei materiali dialettali in trascrizione fonetica.","keywords":["Dialettologia Computazionale-Risorse dialettali in rete-Atlante lessicale"],"pages":"209-241","url":"https:\/\/publications.cnr.it\/doc\/84659","volume":"","doi":"","editors_people":"F. Bruni; C. Marcato","editors":["Bruni, F.","Marcato, C."],"published":"Lessicografia dialettale: ricordando Paolo Zolli-Atti del convegno di studi, Venezia, 9-11 dicembre 2004","publisher":"Antenore (Roma, ITA)","issn":"","isbn":"88-8455-606-6","conference_name":"Lessicografia Dialettale. Ricordando Paolo Zolli. Atti del Convegno di Studi","conference_place":"Venezia","conference_date":"9-11 dicembre 2004"},{"id":131123,"last_updated":"2014-07-28 11:57:41","id_people":84663,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Ontology Learning in Multimedia Information Extraction from Product Catalogues","year":2006,"authors_people":"Bartolini R., Giovannetti E., Marchi S., Montemagni S., Andreatta C., Brunelli R., Stecher R., Nieder\u00e9e C., Bouquet P. and Bortoli S.","authors_cnr":["Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone","Giovannetti, Emiliano"],"authors_cnr_id":["5595","10441","10442","11969"],"authors_cnr_institute":["048"],"authors":["Bartolini, R.","Giovannetti, E.","Marchi, S.","Montemagni, S.","Andreatta, C.","Brunelli, R.","Stecher, R.","Nieder\u00e9e, C.","Bouquet, P.","Bortoli, S."],"abstract":"We propose a methodology for extracting multimedia information from product catalogues empowered by the synergetic use and extension of a domain ontology. 
The use of domain ontologies in this context additionally opens up innovative ways of catalogue use. The method is characterized by incrementally feeding and exploiting the ontology during an information extraction process, implemented by the semantic annotation of the analysed document, and by providing support for detecting existing similar ontologies to enable reuse of (parts of) them.","keywords":["knowledge-drive multimedia analysis","ontology learning","semi-automatic content annotation tools"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84663","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"BOEMIE 2006","conference_place":"Podebrady, Czech Republic","conference_date":"6 ottobre 2006"},{"id":131275,"last_updated":"2009-06-16 00:00:00","id_people":112916,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Probing the space of grammatical variation: induction of cross-lingual grammatical constraints from treebanks","year":2006,"authors_people":"Pirrelli V., Lenci A., Montemagni S.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Pirrelli, V.","Lenci, A.","Montemagni, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/112916","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Language resources and language research: typology, second language acquisition, English Linguistics","conference_place":"Pavia","conference_date":"2006"},{"id":131437,"last_updated":"2023-11-06 19:34:25","id_people":151563,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Text-to-Knowledge (T2K) Versione 2","year":2006,"authors_people":"Bartolini R., Dell'Orletta F., Lenci A., Marchi S., Montemagni S., Pirrelli 
V.","authors_cnr":["Dell'Orletta, Felice","Pirrelli, Vito","Montemagni, Simonetta","Marchi, Simone"],"authors_cnr_id":["326","5595","10442"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Dell'Orletta, F.","Lenci, A.","Marchi, S.","Montemagni, S.","Pirrelli, V."],"abstract":"Versione 2. Text-to-Knowledge (T2K) \u00e8 una piattaforma software di supporto avanzato alla gestione documentale per la creazione dinamica di repertori terminologici e ontologie di dominio a partire da testi e per l'indicizzazione concettuale di documenti. Il sistema T2K si propone di offrire una batteria integrata di strumenti avanzati di analisi linguistica del testo, analisi statistica e apprendimento automatico del linguaggio, destinati a offrire una rappresentazione accurata del contenuto di una base documentale non strutturata, per scopi di indicizzazione avanzata e navigazione intelligente. I risultati di questo processo di acquisizione sono annotati in forma di metadati XML, offrendo in tal modo la prospettiva di una sempre crescente e diretta interoperabilit\u00e0 con sistemi automatici per la produzione di contenuti digitali selezionati e strutturati dinamicamente su misura, per diversi profili di utenza. Versioni prototipali di T2K sono gi\u00e0 operative su alcuni portali della pubblica amministrazione e sono state applicate per l'indicizzazione di contenuti didattici multimediali. 
E' in corso l'integrazione della tecnologia T2K nel sistema di gestione informatica di documentazione scientifica del CNR.","keywords":["text to knowledge","nlp","estrazione terminologica","ontology learning","indicizzazione terminologica"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151563","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131431,"last_updated":"2009-06-18 00:00:00","id_people":151556,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"La Treebank Sintattico Semantica dell'Italiano del progetto SI-TAL","year":2006,"authors_people":"Montemagni S.","authors_cnr":["Montemagni, Simonetta"],"authors_cnr_id":["5595"],"authors_cnr_institute":[""],"authors":["Montemagni, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151556","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131432,"last_updated":"2017-06-21 16:27:13","id_people":151557,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"ALTWEB","year":2006,"authors_people":"Picchi E., Montemagni S., Sassolini E., Cucurullo S., Paoli M.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Montemagni, Simonetta","Cucurullo, Sebastiana","Picchi, Eugenio"],"authors_cnr_id":["5595","11479","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Montemagni, S.","Sassolini, E.","Cucurullo, S.","Paoli, M."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151557","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":130960,"last_updated":"2009-06-16 
00:00:00","id_people":64502,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Acquiring and Representing Meaning: Theoretical and Computational Perspectives","year":2005,"authors_people":"Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"19-66","url":"https:\/\/publications.cnr.it\/doc\/64502","volume":"22-23","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131349,"last_updated":"2012-05-05 08:42:01","id_people":136436,"institutes":["ILC"],"type":"book","type_order":1,"type_people":"book","title":"Acquiring and Representing Word Meaning: Computational perspectives","year":2005,"authors_people":"Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/136436","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"Istituti Editoriali e Poligrafici Internazionali (Pisa-Roma, ITA)","issn":"","isbn":"88-8147-413-1","conference_name":"","conference_place":"","conference_date":""},{"id":131350,"last_updated":"2012-06-04 16:26:22","id_people":136437,"institutes":["ILC"],"type":"book","type_order":1,"type_people":"book","title":"Testo e computer-Elementi di linguistica computazionale","year":2005,"authors_people":"Lenci A.; Montemagni S.; Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":["048","048"],"authors":["Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"In che modo 
il computer pu\u00f2 aiutarci a comprendere come funziona la nostra lingua? Cosa significa analizzare un testo con l'aiuto di un calcolatore? In che misura possiamo estendere le potenzialit\u00e0 del computer rendendolo capace di interagire con gli utenti umani nella loro lingua? Queste e altre domande sono l'oggetto di indagine della linguistica computazionale, una disciplina che ha al suo centro proprio il rapporto tra lingua e computer. Il libro fornisce gli elementi di base della linguistica computazionale partendo da un interesse primario per il testo, la sua struttura e il suo contenuto. Il volume propone una sintesi equilibrata e accessibile tra sapere e fare, nozioni di base e loro applicazione, ed \u00e8 destinato in primo luogo agli studenti delle facolt\u00e0 umanistiche e scientifiche interessati all'interazione tra scienze umane e informatica, ma anche agli studiosi che vogliano imparare a usare il computer come strumento di ricerca sul linguaggio.","keywords":["Linguistica Computazionale"],"pages":"255","url":"https:\/\/publications.cnr.it\/doc\/136437","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"Carocci (Roma, ITA)","issn":"","isbn":"8843034251","conference_name":"","conference_place":"","conference_date":""},{"id":131391,"last_updated":"2012-06-07 09:47:48","id_people":146069,"institutes":["ILC"],"type":"edited_volume","type_order":3,"type_people":"book","title":"Acquisition and Representation of Word Meaning: Theoretical and computational perspectives","year":2005,"authors_people":"-","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Pirrelli, V.","Montemagni, S."],"abstract":"","keywords":["Lexical semantics","Distributional semantics","Lexicon acquisition"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/146069","volume":"XXII-XXIII","doi":"","editors_people":"","editors":[""],"published":"","publisher":"Istituti 
Editoriali e Poligrafici Internazionali (Pisa-Roma, ITA)","issn":"","isbn":"88-8147-413-1","conference_name":"","conference_place":"","conference_date":""},{"id":131039,"last_updated":"2015-02-23 14:55:26","id_people":84576,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Automatic Incremental Term Acquisition from Domain Corpora","year":2005,"authors_people":"Bartolini R., Giorgetti D., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Bartolini, Roberto"],"authors_cnr_id":["326","5595","10441"],"authors_cnr_institute":["048"],"authors":["Bartolini, R.","Giorgetti, D.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"We describe a technique for the acquisition of terms from Italian domain text corpora, which relies both on sophisticated linguistic analysis and on statistical measures applied to linguistically processed text rather than to raw text as it is usually the case. The main advantage of this technique is that minimal a priori knowledge of term structure is required, thus allowing to explore and discover terms in a given domain without imposing a strict pattern matching structure on them, and also to easily extend it to different domains. The approach we present in this paper is incremental as it may be iterated to discover terms of increasing complexity built on top of terms discovered in the previous iteration. 
The reason why it is convenient to adopt such an incremental approach is that it allows to \"clean\" data from noise in the first step, elicitating the constituent terms, and then to refine term acquisition on \"skimmed\" term data.","keywords":[""],"pages":"293-300","url":"https:\/\/publications.cnr.it\/doc\/84576","volume":"","doi":"","editors_people":"","editors":[""],"published":"Proceedings of TKE 2005-7th International Conference on Terminology and Knowledge Engineering","publisher":"","issn":"","isbn":"","conference_name":"7th International conference on Terminology and Knowledge Engineering (TKE2005)","conference_place":"Copenhagen","conference_date":"2005"},{"id":123414,"last_updated":"2012-03-27 15:07:38","id_people":172458,"institutes":["ILC","ITTIG","IGSG"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Automatic semantics extraction in law documents","year":2005,"authors_people":"Biagioli C., Francesconi E., Passerini A., Montemagni S., Soria C. 
Biagioli C., Francesconi E., Montemagni S., Passerini A., Soria C.","authors_cnr":["Biagioli, Carlo","Montemagni, Simonetta","Soria, Claudia","Francesconi, Enrico"],"authors_cnr_id":["2712","5595","9887","10498"],"authors_cnr_institute":[""],"authors":["Biagioli, C.","Francesconi, E.","Passerini, A.","Montemagni, S.","Soria, C."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/172458","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Tenth International Conference on Artificial Intelligence and Law (ICAIL 2005)","conference_place":"Bologna","conference_date":"2005"},{"id":131042,"last_updated":"2023-11-06 19:34:26","id_people":84579,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Climbing the path to grammar: a maximum entropy model of subject\/object learning","year":2005,"authors_people":"Dell'Orletta F., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Dell'Orletta, Felice","Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Dell'Orletta, F.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84579","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"Psychocomputational Models of Human Language Acquisition (PsychoCompLA-2005)","conference_place":"Ann Arbor (USA)","conference_date":""},{"id":131497,"last_updated":"2020-11-27 14:35:04","id_people":157366,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ILC-CNR Contribution to Deliverable 4. 
1","year":2005,"authors_people":"Bartolini R., Giorgetti D., Marchi S., Montemagni S.","authors_cnr":["Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["5595","10441","10442"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Giorgetti, D.","Marchi, S.","Montemagni, S."],"abstract":"The goal of the semantic annotation is the annotation of entities and relations starting from input documents conformant with the harmonisation output schema as defined within WP3. This harmonisation schema will focus on the structural and logical organisation of the documents, while WP4 will concentrate on the annotation of textual entities and image elements. The results of semantic annotation are intended to populate the domain ontology.","keywords":["NLP"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157366","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131498,"last_updated":"2020-11-27 14:35:36","id_people":157367,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Personalizzazione degli Italian NLP tools","year":2005,"authors_people":"Bartolini R., Lenci A., Marchi S., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["326","5595","10441","10442"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Lenci, A.","Marchi, S.","Montemagni, S.","Pirrelli, V."],"abstract":"Il presente documento intende offrire criteri e risultati della fase di personalizzazione dei moduli per l'analisi automatica del testo (Italian NLP tools o \"AnITA\") all'interno dell'architettura prevista nell'ambito del progetto 
FuLL.","keywords":["NLP"],"pages":"13","url":"https:\/\/publications.cnr.it\/doc\/157367","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131500,"last_updated":"2009-06-16 00:00:00","id_people":157369,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Modellazione del motore sintattico e delle strutture dati di supporto","year":2005,"authors_people":"Bartolini R., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157369","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131501,"last_updated":"2023-07-11 15:16:12","id_people":157370,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Text-2-Knowledge: Acquisizione semi-automatica di ontologie per l'indicizzazione semantica di documenti","year":2005,"authors_people":"Bartolini R., Lenci L., Marchi S., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["326","5595","10441","10442"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Lenci, L.","Marchi, S.","Montemagni, S.","Pirrelli, V."],"abstract":"Text-2-Knowledge, Acquisizione semi-automatica di ontologie per l'indicizzazione semantica di documenti","keywords":["nlp","terminology 
extraction"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157370","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131504,"last_updated":"2009-06-16 00:00:00","id_people":157373,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Atlante Lessicale Toscano in rete (ALT-Web). Relazione finale","year":2005,"authors_people":"Cucurullo S., Montemagni S., Paoli M., Picchi E., Sassolini E.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":[""],"authors":["Cucurullo, S.","Montemagni, S.","Paoli, M.","Picchi, E.","Sassolini, E."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157373","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131511,"last_updated":"2020-09-11 12:26:34","id_people":157380,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ILC-CNR Contribution to Deliverable 5. 
1","year":2005,"authors_people":"Giorgetti D., Marchi S., Montemagni S.","authors_cnr":["Montemagni, Simonetta","Marchi, Simone"],"authors_cnr_id":["5595","10442"],"authors_cnr_institute":[""],"authors":["Giorgetti, D.","Marchi, S.","Montemagni, S."],"abstract":"This document describes the high level infrastructure designed as part of the project VIKEF for creating a Virtual Information and Knowledge Environment (VIKE), namely an environment made up of explicit representation of the information and knowledge implicitly contained in one or more collections of Information-Content-Knowledge (ICK) resources, and of a collection of services operating on this explicit representation of information and knowledge; it is a virtual environment, as the representation and the services for accessing information and knowledge is almost completely independent from the physical properties of the original data.","keywords":["NLP"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157380","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131515,"last_updated":"2020-09-11 12:41:59","id_people":157384,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"ILC-CNR Contribution to Deliverable 3. 1","year":2005,"authors_people":"Marchi S., Montemagni S.","authors_cnr":["Montemagni, Simonetta","Marchi, Simone"],"authors_cnr_id":["5595","10442"],"authors_cnr_institute":[""],"authors":["Marchi, S.","Montemagni, S."],"abstract":"This document presents the first set of knowledge and content acquisition components. 
Starting from the Annotation Schema definition, it will then describe the Harmonization support and the Annotation components, as well as the various resources needed all along the current chain.","keywords":["NLP"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157384","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131425,"last_updated":"2023-11-06 19:34:27","id_people":151548,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"Text-to-Knowledge (T2K)","year":2005,"authors_people":"Bartolini R., Dell'Orletta F., Giorgetti D., Marchi S., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Dell'Orletta, Felice","Pirrelli, Vito","Montemagni, Simonetta","Bartolini, Roberto","Marchi, Simone"],"authors_cnr_id":["326","5595","10441","10442"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Dell'Orletta, F.","Giorgetti, D.","Marchi, S.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"Piattaforma di estrazione e indicizzazione terminologica.","keywords":["NLP","estrazione terminologica"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151548","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131426,"last_updated":"2009-06-18 00:00:00","id_people":151550,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"NLPtools","year":2005,"authors_people":"Bartolini R., Marchi S., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Marchi, S.","Lenci, A.","Montemagni, S.","Pirrelli, 
V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151550","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131409,"last_updated":"2009-06-18 00:00:00","id_people":151532,"institutes":["ILC"],"type":"misc","type_order":12,"type_people":"other","title":"ALTWEB","year":2005,"authors_people":"Picchi E., Montemagni S., Sassolini E., Cucurullo S., Paoli M.","authors_cnr":["Cucurullo, Sebastiana","Sassolini, Eva","Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Montemagni, S.","Sassolini, E.","Cucurullo, S.","Paoli, M."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/151532","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131351,"last_updated":"2009-06-16 00:00:00","id_people":136438,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Lessicografia dialettale e computer: questioni di rappresentazione e recupero dei dati","year":2004,"authors_people":"Agostiniani L., Montemagni S., Paoli M., Picchi E.","authors_cnr":["Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":[""],"authors":["Agostiniani, L.","Montemagni, S.","Paoli, M.","Picchi, E."],"abstract":"","keywords":["Lessicografia computazionale","Lessicografia Dialettale"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/136438","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"Centro Interuniversitario di Studi Veneti (Venezia, ITA)","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":130892,"last_updated":"2023-06-27 
11:50:18","id_people":30867,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Automatic Classification and Analysis of Provisions in Italian Legal Texts: A Case Study","year":2004,"authors_people":"Bartolini R.; Lenci A.; Montemagni S.; Pirrelli V.; Soria C.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Soria, Claudia","Bartolini, Roberto"],"authors_cnr_id":["326","5595","9887","10441"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Lenci, A.","Montemagni, S.","Pirrelli, V.","Soria, C."],"abstract":"In this paper we address the problem of automatically enriching legal texts with semantic annotation, an essential pre-requisite to effective indexing and retrieval of legal documents. This is done through illustration of SALEM (Semantic Annotation for LEgal Management), a computational system developed for automated semantic annotation of (Italian) law texts. SALEM is an incremental system using Natural Language Processing techniques to perform two tasks: i) classify law paragraphs according to their regulatory content, and ii) extract relevant text fragments corresponding to specific semantic roles that are relevant for the different types of regulatory content. The paper sketches the overall architecture of SALEM and reports results of a preliminary case study on a sample of Italian law texts.","keywords":["Annotazione semantica","Classificazione automatica"],"pages":"593-604","url":"https:\/\/rdcu.be\/dftjm","volume":"3292","doi":"10.1007\/978-3-540-30470-8_72","editors_people":"Meersman, R., Tari, Z., Corsaro, A.","editors":["Meersman, R.","Tari, Z.","Corsaro, A."],"published":"On the Move to Meaningful Internet Systems 2004: OTM 2004 Workshops. 
OTM 2004","publisher":"Springer (Berlin, DEU)","issn":"","isbn":"978-3-540-23664-1","conference_name":"","conference_place":"","conference_date":""},{"id":131357,"last_updated":"2009-06-16 00:00:00","id_people":136444,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"ALT Web: l'Atlante Lessicale Toscano in rete","year":2004,"authors_people":"Paoli M., Montemagni S., Picchi E.","authors_cnr":["Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":[""],"authors":["Paoli, M.","Montemagni, S.","Picchi, E."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/136444","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"Centro Interuniversitario di Studi Veneti (Venezia, ITA)","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131034,"last_updated":"2009-06-16 00:00:00","id_people":84570,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Hybrid Constraints for Robust Parsing: First Experiments and Evaluation","year":2004,"authors_people":"Bartolini R., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Bartolini, R.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84570","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"LREC 2004: Fourth International Conference on Language Resources and Evaluation","conference_place":"Lisbon, Portugal","conference_date":"2004"},{"id":131035,"last_updated":"2012-05-04 11:58:28","id_people":84571,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"Semantic Mark-up of Italian 
Legal Texts Through NLP-based Techniques","year":2004,"authors_people":"Bartolini R.; Lenci A.; Montemagni S.; Pirrelli V.; Soria C.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Soria, Claudia","Bartolini, Roberto"],"authors_cnr_id":["326","5595","9887","10441"],"authors_cnr_institute":["048","048","048","048"],"authors":["Bartolini, R.","Lenci, A.","Montemagni, S.","Pirrelli, V.","Soria, C."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/84571","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"2-9517408-1-6","conference_name":"LREC 2004: Fourth International Conference on Language Resources and Evaluation","conference_place":"Lisbon, Portugal","conference_date":"2004"},{"id":131071,"last_updated":"2020-09-12 13:17:59","id_people":84609,"institutes":["ILC"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"NLP-enhanced Content filtering within the POESIA Project","year":2004,"authors_people":"Hepple M.; N. Ireson; Allegrini P.; Marchi S.; Montemagni S.; G\u00f3mez Hidalgo J.M.","authors_cnr":["Montemagni, Simonetta","Marchi, Simone"],"authors_cnr_id":["5595","10442"],"authors_cnr_institute":[""],"authors":["Hepple, M.","Ireson, N.","Allegrini, P.","Marchi, S.","Montemagni, S.","G\u00f3mez Hidalgo, J. M."],"abstract":"This paper introduces the POESIA internet filtering system, which is open-source, and which combines standard filtering methods, such as positive\/negative URL lists, with more advanced techniques, such as image processing and NLP-enhanced text filtering. The description here focusses on components providing textual content filtering for three European languages (English, Italian and Spanish), employing NLP methods to enhance performance. 
We address also the acquisition of language data needed to develop these filters, and the evaluation of the system and its components.","keywords":["Image processing","Natural language processing systems","Open systems"],"pages":"1967-1970","url":"https:\/\/www.aclweb.org\/anthology\/L04-1507\/","volume":"","doi":"","editors_people":"Maria Teresa Lino, Maria Francisca Xavier, F\u00e1tima Ferreira, Rute Costa, Raquel Silva,","editors":["Lino, M. T.","Xavier, M. F.","Ferreira, F.","Costa, R.","Silva, R."],"published":"Proceedings of the Fourth International Conference on Language Resources and Evaluation (LREC 2004)","publisher":"","issn":"","isbn":"2-9517408-1-6","conference_name":"LREC 2004: Fourth International Conference on Language Resources and Evaluation","conference_place":"Lisbona","conference_date":"26-28 May 2004"},{"id":131279,"last_updated":"2009-06-16 00:00:00","id_people":112920,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"Classifying text through time: a complexity science approach to dynamic web page filtering","year":2004,"authors_people":"Pirrelli V., Allegrini P., Montemagni S.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Pirrelli, V.","Allegrini, P.","Montemagni, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/112920","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"International Conference on Text Mining (CIFT)","conference_place":"La Rochelle Francia","conference_date":"2004"},{"id":131282,"last_updated":"2009-06-16 00:00:00","id_people":112923,"institutes":["ILC"],"type":"conference_misc","type_order":6,"type_people":"conferenceObject","title":"The lexicon in context: distributional evidence and representational issues","year":2004,"authors_people":"Pirrelli V., Lenci A., Montemagni 
S.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Pirrelli, V.","Lenci, A.","Montemagni, S."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/112923","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"International Colloquium: Word Structure and Lexical Systems: models and applications","conference_place":"Pavia","conference_date":"2004"},{"id":131506,"last_updated":"2009-06-16 00:00:00","id_people":157375,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"Text-2-Knowledge: Acquisizione automatica di ontologie per l'indicizzazione semantica di documenti","year":2004,"authors_people":"Bartolini E., Giorgetti D., Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Bartolini, E.","Giorgetti, D.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/157375","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":130926,"last_updated":"2009-06-16 00:00:00","id_people":64466,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Example-based automatic induction of semantic classes through entropic scores","year":2003,"authors_people":"Allegrini P., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Allegrini, P.","Montemagni, S.","Pirrelli, V."],"abstract":"Abstract - The paper deals in some detail with the application of example-based machine learning techniques to the task of 
automatically acquiring semantic information from functionally annotated texts. Special emphasis is placed on the use of \u201canalogical proportions\u201d as a means of structuring the knowledge embodied in attested examples, and weighing up their contribution to a variety of lexico-semantic classification tasks. Careful quantitative analysis of automatically acquired information proves to shed considerable light on the semantic inter-connectivity of input data, their structure and organising principles.","keywords":[""],"pages":"1-45","url":"https:\/\/publications.cnr.it\/doc\/64466","volume":"16-17","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":130936,"last_updated":"2009-06-16 00:00:00","id_people":64476,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"Chunk-it. An Italian shallow parser for robust syntactic annotation","year":2003,"authors_people":"Lenci A., Montemagni S., Pirrelli V.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":[""],"pages":"353-386","url":"https:\/\/publications.cnr.it\/doc\/64476","volume":"16-17","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":130937,"last_updated":"2009-06-16 00:00:00","id_people":64477,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"The syntactic-semantic Treebank of Italian. 
An Overview","year":2003,"authors_people":"Montemagni S., Barsotti F., Battista M., Calzolari N., Corazzari O., Lenci A., Pirrelli V., Zampolli A., Fanciulli F., Massetani M., Raffaelli R., Basili R., Pazienza M.T., Saracino D., Zanzotto F., Mana N., Pianesi F., Delmonte R.","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta","Zamorani, Nicoletta"],"authors_cnr_id":["326","5595","26123"],"authors_cnr_institute":[""],"authors":["Montemagni, S.","Barsotti, F.","Battista, M.","Calzolari, N.","Corazzari, O.","Lenci, A.","Pirrelli, V.","Zampolli, A.","Fanciulli, F.","Massetani, M.","Raffaelli, R.","Basili, R.","Pazienza, M. T.","Saracino, D.","Zanzotto, F.","Mana, N.","Pianesi, F.","Delmonte, R."],"abstract":"","keywords":[""],"pages":"461-492","url":"https:\/\/publications.cnr.it\/doc\/64477","volume":"16-17","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":130938,"last_updated":"2009-06-16 00:00:00","id_people":64478,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"DBT-ALT: a system for storing and querying the data of the 'Atlante Linguistico Toscano'","year":2003,"authors_people":"Montemagni S., Picchi E., Biagini L.","authors_cnr":["Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":[""],"authors":["Montemagni, S.","Picchi, E.","Biagini, L."],"abstract":"Abstract - Computers can help dialectologists to make full use of the information they have so laboriously and painstakingly acquired: the basic dimensions of dialectal research can be enlarged and its possible outcomes can become more sophisticated. In this paper, we describe a lexical database for dialectal data, DBT-ALT, which has been designed and constructed to contain linguistic data collected for the Atlante Lessicale Toscano (ALT), a lexical atlas of Tuscany. 
DBT-ALT is illustrated in detail, with particular emphasis on its search functions which allow for complex queries taking into account a wide range of parameters interactively defined by the user on the basis of his\/her research interests.","keywords":[""],"pages":"493-517","url":"https:\/\/publications.cnr.it\/doc\/64478","volume":"18-19","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131341,"last_updated":"2009-06-16 00:00:00","id_people":136427,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Le forme del significato. Acquisizione e rappresentazione dell'informazione semantica","year":2003,"authors_people":"Allegrini P. 1, Lenci A. 2, Montemagni S. 3, Pirrelli V. 4","authors_cnr":["Pirrelli, Vito","Montemagni, Simonetta"],"authors_cnr_id":["326","5595"],"authors_cnr_institute":[""],"authors":["Allegrini, P.","Lenci, A.","Montemagni, S.","Pirrelli, V."],"abstract":"","keywords":["Acquisizione","Semantica Lessicale","Ontologia","Machine Learning"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/136427","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131336,"last_updated":"2009-06-16 00:00:00","id_people":136422,"institutes":["ILC"],"type":"book_chapter","type_order":2,"type_people":"bookPart","title":"Building the Italian Syntactic-Semantic Treebank","year":2003,"authors_people":"Montemagni S. 1, Barsotti F. 2, Battista M. 3, Calzolari N. 4 , Corazzari O. 5, Lenci A. 6, Zampolli A. 7, Raffaelli R. 8, Pazienza M.T. 9, Mana N. 10, Delmonte R. 
11 [et alii]","authors_cnr":["Montemagni, Simonetta","Zamorani, Nicoletta"],"authors_cnr_id":["5595","26123"],"authors_cnr_institute":[""],"authors":["Montemagni, S.","Barsotti, F.","Battista, M.","Calzolari, N.","Corazzari, O.","Lenci, A.","Zampolli, A.","Raffaelli, R.","Pazienza, M. T.","Mana, N.","Delmonte, R."],"abstract":"","keywords":["Corpora testuali","Annot. sintattica","Annot. semantica","Treebank"],"pages":"","url":"https:\/\/publications.cnr.it\/doc\/136422","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":131480,"last_updated":"2020-09-10 17:59:47","id_people":157348,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"POESIA Lexical Resources and Tools for Each Language","year":2003,"authors_people":"Allegrini P., Calzolari N., Marchi S., Montemagni S., Hepple M., Ireson N. Gomez Hidalgo J.M., Carrero Garcia F., de Buenaga Rodriguez M., Puera Sanz E.","authors_cnr":["Montemagni, Simonetta","Marchi, Simone","Zamorani, Nicoletta"],"authors_cnr_id":["5595","10442","26123"],"authors_cnr_institute":[""],"authors":["Allegrini, P.","Calzolari, N.","Marchi, S.","Montemagni, S.","Hepple, M.","Ireson, N.","Gomez Hidalgo, J. M.","Carrero Garcia, F.","De Buenaga Rodriguez, M.","Puera Sanz, E."],"abstract":"The aim of this report is to review the various resources that the different language processing sites expect to use in the development of their language-specific text filtering components. Some of the required resources are ones that were developed before Poesia, possibly by one the Poesia partners, or possibly elsewhere but being now in the public domain. Such resources may require adaptation to the Poesia task. Other resources required for Poesia will be developed as part of the project. 
In some cases, this development has already been done or is in progress, whilst in others, it is yet to be undertaken. In what follows, the status of each of the resources described will be made clear in terms of these alternatives.","keywords":["Lexical Resources","nlp"],"pages":"30","url":"https:\/\/publications.cnr.it\/doc\/157348","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":359307,"last_updated":"2023-07-11 11:09:39","id_people":430635,"institutes":["ILC"],"type":"technical_report","type_order":8,"type_people":"report","title":"POESIA Software Architecture Definition Document","year":2002,"authors_people":"B Starynkevitch, M Daoudi, C Tombelle, H Zheng, M Hepple, N Ireson, JM Gomez-Hildago, Paolo Allegrini, Nicoletta Calzolari, Simone Marchi, Simonetta Montemagni, S Guerra","authors_cnr":["Montemagni, Simonetta","Marchi, Simone","Zamorani, Nicoletta"],"authors_cnr_id":["5595","10442","26123"],"authors_cnr_institute":[""],"authors":["Starynkevitch, B.","Daoudi, M.","Tombelle, C.","Zheng, H.","Hepple, M.","Ireson, N.","Gomez Hildago, J.","Allegrini, P.","Calzolari, N.","Marchi, S.","Montemagni, S.","Guerra, S."],"abstract":"Software Architecture Definition Document","keywords":["NLP","Software Engineering"],"pages":"68-80","url":"https:\/\/publications.cnr.it\/doc\/430635","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":130947,"last_updated":"2009-06-16 00:00:00","id_people":64487,"institutes":["ILC"],"type":"journal_article","type_order":0,"type_people":"article","title":"DBT-ALT: a System for Storying and Querying the Data of the Atlante Lessicale Toscano (ALT)","year":2001,"authors_people":"Picchi E. 1, Montemagni S. 2, Biagini L. 
3","authors_cnr":["Montemagni, Simonetta","Picchi, Eugenio"],"authors_cnr_id":["5595","16688"],"authors_cnr_institute":[""],"authors":["Picchi, E.","Montemagni, S.","Biagini, L."],"abstract":"","keywords":["Atlanti linguistici","Dialettologia comput","Lessicografia dialet","Geolinguistica","Sociolinguistica"],"pages":"85-103","url":"https:\/\/publications.cnr.it\/doc\/64487","volume":"9","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132340,"last_updated":"2020-09-22 15:24:37","id_people":409402,"institutes":["ILC","ISTI"],"type":"conference_article","type_order":5,"type_people":"conferenceObject","title":"From machine readable dictionaries to lexicons for NLP: the cobuild dictionaries-a different approach","year":1994,"authors_people":"Peters C.; Federici S.; Montemagni S.; Zamorani Calzolari N.","authors_cnr":["Montemagni, Simonetta","Peters, Carol Ann","Zamorani, Nicoletta"],"authors_cnr_id":["5595","16906","26123"],"authors_cnr_institute":["074","074","048"],"authors":["Peters, C.","Federici, S.","Montemagni, S.","Zamorani, C. N."],"abstract":"We describe the results of a syntactic-semantic parser for Cobuild dictionary definitions. Unlike previous work on the automatic analysis of machine readable dictionaries, the particular structure of the Cobuild definition allows us to derive information that classifies the lexical item mainly in terms of the selectional restrictions or preferences encoded on its arguments. The resulting formalized lexical entries contain data that has generally been lacking in other lexical representations but which is expected to be very useful in a wide range of NLP purposes. We show how this information can be used in dictionary sense disambiguation by creating links throughout the lexicon both on the paradigmatic and the syntagmatic axes.","keywords":["Lexical databases","Information storage and retrieval. 
Dictionaries"],"pages":"147-157","url":"https:\/\/publications.cnr.it\/doc\/409402","volume":"","doi":"","editors_people":"Martin W. et al.","editors":["Martin, W."],"published":"Euralex 1994 Proceedings","publisher":"","issn":"","isbn":"","conference_name":"6th International Congress on Lexicography","conference_place":"Amsterdam, The Netherlands","conference_date":"1994"},{"id":132432,"last_updated":"2021-02-25 10:49:34","id_people":446186,"institutes":["ILC","ISTI"],"type":"technical_report","type_order":8,"type_people":"report","title":"ET10\/51-Deliverable 8: Evaluation Report","year":1994,"authors_people":"Barnbrook G.; Calzolari N.; Federici S.; Hoelter M.; Montemagni S.; Peters C.; Schnelle H.; Sinclair J.","authors_cnr":["Montemagni, Simonetta","Peters, Carol Ann"],"authors_cnr_id":["5595","16906"],"authors_cnr_institute":["048","074"],"authors":["Barnbrook, G.","Calzolari, N.","Federici, S.","Hoelter, M.","Montemagni, S.","Peters, C.","Schnelle, H.","Sinclair, J."],"abstract":"The objective of the work in Pisa has been to translate and produce instantiations of the syntactically parsed definitions of the Cobuild dictionary: provided by Birmingham in a Typed Feature Structure formalism. However, as described in Methodology above, our results have been produced at two different levels: intermediate results; final results in the form of TFS entries. In the following, we will discuss briefly the possible applications of these different results for the three user types recognized in the introduction to this section: i. Human user ii. Human user-assisted by the machine iii. 
The machine Obviously, the discussion here below refers entirely to the results that would be obtained once the parser has been applied to the whole dictionary.","keywords":["Language","Computational linguistics","Formal Definitions and Theory"],"pages":"38","url":"https:\/\/publications.cnr.it\/doc\/446186","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""},{"id":132433,"last_updated":"2021-02-25 10:52:15","id_people":446200,"institutes":["ILC","ISTI"],"type":"technical_report","type_order":8,"type_people":"report","title":"ET-10\/51-Final Report: Par. 3-Extracting, representing and using syntactic-semantic information from cobuild definitions","year":1994,"authors_people":"Calzolari N.; Federici S.;Montemagni S.; Peters C.","authors_cnr":["Montemagni, Simonetta","Peters, Carol Ann"],"authors_cnr_id":["5595","16906"],"authors_cnr_institute":["048","074"],"authors":["Calzolari, N.","Federici, S.","Montemagni, S.","Peters, C."],"abstract":"In May 1992 a new research project brought together the authors of this report. With the help and support of several other people and institutions, they worked steadily for two years, trying to improve the design and building of machine-usable lexicons, for automatic translation and many other applications. The starting point was clear. Around 1989 Helmut Schnelle of the Ruhr-Universitat Bochum became interested in the way in which words were defined in a new kind of dictionary called Cobuild. 
He thought that since they were couched in sentences of apparently ordinary English, and had distinctive and repetitive shapes according to their meanings, it should be possible to represent them in logical form by means of regular rules.","keywords":["Language","Computational linguistics","Formal Definitions and Theory","Semantics"],"pages":"162","url":"https:\/\/publications.cnr.it\/doc\/446200","volume":"","doi":"","editors_people":"","editors":[""],"published":"","publisher":"","issn":"","isbn":"","conference_name":"","conference_place":"","conference_date":""}]